<?xml version="1.0" encoding="UTF-8"?><!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "journalpublishing.dtd"><article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" dtd-version="2.0" xml:lang="en" article-type="research-article"><front><journal-meta><journal-id journal-id-type="nlm-ta">JMIR Form Res</journal-id><journal-id journal-id-type="publisher-id">formative</journal-id><journal-id journal-id-type="index">27</journal-id><journal-title>JMIR Formative Research</journal-title><abbrev-journal-title>JMIR Form Res</abbrev-journal-title><issn pub-type="epub">2561-326X</issn><publisher><publisher-name>JMIR Publications</publisher-name><publisher-loc>Toronto, Canada</publisher-loc></publisher></journal-meta><article-meta><article-id pub-id-type="publisher-id">v9i1e56973</article-id><article-id pub-id-type="doi">10.2196/56973</article-id><article-categories><subj-group subj-group-type="heading"><subject>Original Paper</subject></subj-group></article-categories><title-group><article-title>The Impact of ChatGPT Exposure on User Interactions With a Motivational Interviewing Chatbot: Quasi-Experimental Study</article-title></title-group><contrib-group><contrib contrib-type="author"><name name-style="western"><surname>Zhu</surname><given-names>Jiading</given-names></name><degrees>BASc</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author" equal-contrib="yes"><name name-style="western"><surname>Dong</surname><given-names>Alec</given-names></name><xref ref-type="aff" rid="aff2">2</xref><xref ref-type="fn" rid="equal-contrib1">*</xref></contrib><contrib contrib-type="author" equal-contrib="yes"><name name-style="western"><surname>Wang</surname><given-names>Cindy</given-names></name><xref ref-type="aff" rid="aff1">1</xref><xref ref-type="fn" rid="equal-contrib1">*</xref></contrib><contrib contrib-type="author"><name 
name-style="western"><surname>Veldhuizen</surname><given-names>Scott</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff3">3</xref><xref ref-type="aff" rid="aff4">4</xref><xref ref-type="aff" rid="aff5">5</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Abdelwahab</surname><given-names>Mohamed</given-names></name><degrees>MSc</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Brown</surname><given-names>Andrew</given-names></name><degrees>MASc</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Selby</surname><given-names>Peter</given-names></name><degrees>MBBS, MHSc</degrees><xref ref-type="aff" rid="aff3">3</xref><xref ref-type="aff" rid="aff5">5</xref><xref ref-type="aff" rid="aff6">6</xref></contrib><contrib contrib-type="author" corresp="yes"><name name-style="western"><surname>Rose</surname><given-names>Jonathan</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff1">1</xref><xref ref-type="aff" rid="aff3">3</xref></contrib></contrib-group><aff id="aff1"><institution>The Edward S. Rogers Sr. 
Department of Electrical &#x0026; Computer Engineering, University of Toronto</institution><addr-line>Toronto</addr-line><addr-line>ON</addr-line><country>Canada</country></aff><aff id="aff2"><institution>Department of Mechanical &#x0026; Industrial Engineering, University of Toronto</institution><addr-line>Toronto</addr-line><addr-line>ON</addr-line><country>Canada</country></aff><aff id="aff3"><institution>INTREPID Lab, Centre for Addiction and Mental Health</institution><addr-line>Toronto</addr-line><addr-line>ON</addr-line><country>Canada</country></aff><aff id="aff4"><institution>Institute for Mental Health Policy Research, Centre for Addiction and Mental Health</institution><addr-line>Toronto</addr-line><addr-line>ON</addr-line><country>Canada</country></aff><aff id="aff5"><institution>Department of Family and Community Medicine, University of Toronto</institution><addr-line>Toronto</addr-line><addr-line>ON</addr-line><country>Canada</country></aff><aff id="aff6"><institution>Dalla Lana School of Public Health, University of Toronto</institution><addr-line>Toronto</addr-line><addr-line>ON</addr-line><country>Canada</country></aff><contrib-group><contrib contrib-type="editor"><name name-style="western"><surname>Mavragani</surname><given-names>Amaryllis</given-names></name></contrib></contrib-group><contrib-group><contrib contrib-type="reviewer"><name name-style="western"><surname>Carcone</surname><given-names>April</given-names></name></contrib><contrib contrib-type="reviewer"><name name-style="western"><surname>Balan</surname><given-names>Ivan</given-names></name></contrib><contrib contrib-type="reviewer"><name name-style="western"><surname>Wilson</surname><given-names>Josephine</given-names></name></contrib></contrib-group><author-notes><corresp>Correspondence to Jonathan Rose, PhD, The Edward S. Rogers Sr. 
Department of Electrical &#x0026; Computer Engineering, University of Toronto, 10 King's College Road, Toronto, ON, M5S 3G8, Canada, 1 4169786992; <email>jonathan.rose@ece.utoronto.ca</email></corresp><fn fn-type="equal" id="equal-contrib1"><label>*</label><p>these authors contributed equally</p></fn></author-notes><pub-date pub-type="collection"><year>2025</year></pub-date><pub-date pub-type="epub"><day>21</day><month>3</month><year>2025</year></pub-date><volume>9</volume><elocation-id>e56973</elocation-id><history><date date-type="received"><day>02</day><month>02</month><year>2024</year></date><date date-type="rev-recd"><day>20</day><month>02</month><year>2025</year></date><date date-type="accepted"><day>21</day><month>02</month><year>2025</year></date></history><copyright-statement>&#x00A9; Jiading Zhu, Alec Dong, Cindy Wang, Scott Veldhuizen, Mohamed Abdelwahab, Andrew Brown, Peter Selby, Jonathan Rose. Originally published in JMIR Formative Research (<ext-link ext-link-type="uri" xlink:href="https://formative.jmir.org">https://formative.jmir.org</ext-link>), 21.3.2025. </copyright-statement><copyright-year>2025</copyright-year><license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (<ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">https://creativecommons.org/licenses/by/4.0/</ext-link>), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Formative Research, is properly cited. 
The complete bibliographic information, a link to the original publication on <ext-link ext-link-type="uri" xlink:href="https://formative.jmir.org">https://formative.jmir.org</ext-link>, as well as this copyright and license information must be included.</p></license><self-uri xlink:type="simple" xlink:href="https://formative.jmir.org/2025/1/e56973"/><abstract><sec><title>Background</title><p>The worldwide introduction of ChatGPT in November 2022 may have changed how its users perceive and interact with other chatbots. This possibility may confound the comparison of responses to pre-ChatGPT and post-ChatGPT iterations of pre-existing chatbots, in turn affecting the direction of their evolution. Before the release of ChatGPT, we created a therapeutic chatbot, MIBot, whose goal is to use motivational interviewing to guide smokers toward making the decision to quit smoking. We were concerned that measurements going forward would not be comparable to those in the past, impacting the evaluation of future changes to the chatbot.</p></sec><sec><title>Objective</title><p>The aim of the study is to explore changes in how users interact with MIBot after the release of ChatGPT and examine the relationship between these changes and users&#x2019; familiarity with ChatGPT.</p></sec><sec sec-type="methods"><title>Methods</title><p>We compared user interactions with MIBot prior to ChatGPT&#x2019;s release and 6 months after the release. Participants (N=143) were recruited through a web-based platform in November of 2022, prior to the release of ChatGPT, to converse with MIBot, in an experiment we refer to as MIBot (version 5.2). In May 2023, a different set of participants (n=129) was recruited to interact with the same version of MIBot and asked additional questions about their familiarity with ChatGPT, in the experiment called MIBot (version 5.2A). 
We used the Mann-Whitney <italic>U</italic> test to compare metrics between cohorts and Spearman rank correlation to assess relationships between familiarity with ChatGPT and other metrics within the MIBot (version 5.2A) cohort.</p></sec><sec sec-type="results"><title>Results</title><p>In total, 83 (64.3%) participants in the MIBot (version 5.2A) cohort had used ChatGPT, with 66 (51.2%) using it on a regular basis. Satisfaction with MIBot was significantly lower in the post-ChatGPT cohort (<italic>U</italic>=11,331.0; <italic>P</italic>=.001), driven by a decrease in perceived empathy as measured by the Average Consultation and Relational Empathy Measure (<italic>U</italic>=10,838.0; <italic>P</italic>=.01). Familiarity with ChatGPT was positively correlated with average response length (&#x03C1;=0.181; <italic>P</italic>=.04) and change in perceived importance of quitting smoking (&#x03C1;=0.296; <italic>P</italic>&#x003C;.001).</p></sec><sec sec-type="conclusions"><title>Conclusions</title><p>The widespread reach of ChatGPT has changed how users interact with MIBot. Post-ChatGPT users are less satisfied with MIBot overall, particularly in terms of perceived empathy. However, users with greater familiarity with ChatGPT provide longer responses and demonstrate a greater increase in their perceived importance of quitting smoking after a session with MIBot. 
These findings suggest the need for chatbot developers to adapt to evolving user expectations in the era of advanced generative artificial intelligence.</p></sec></abstract><kwd-group><kwd>chatbot</kwd><kwd>digital health</kwd><kwd>motivational interviewing</kwd><kwd>natural language processing</kwd><kwd>ChatGPT</kwd><kwd>large language models</kwd><kwd>artificial intelligence</kwd><kwd>experimental</kwd><kwd>smoking cessation</kwd><kwd>conversational agent</kwd></kwd-group></article-meta></front><body><sec id="s1" sec-type="intro"><title>Introduction</title><sec id="s1-1"><title>Background</title><p>Generative chatbots are conversational systems that provide synthesized replies using deep learning techniques [<xref ref-type="bibr" rid="ref1">1</xref>]. In recent years, generative chatbots based on large language models (LLMs) have made major advancements in their ability to engage in natural and human-like conversations [<xref ref-type="bibr" rid="ref2">2</xref>]. ChatGPT, a popular LLM-based generative chatbot developed by OpenAI [<xref ref-type="bibr" rid="ref3">3</xref>], has demonstrated significant potential to be applied in public health and medicine for a variety of purposes such as providing health information, supporting patient education, summarizing clinical notes, and assisting in administrative tasks [<xref ref-type="bibr" rid="ref4">4</xref>,<xref ref-type="bibr" rid="ref5">5</xref>]. However, these applications have not typically focused on therapeutic interactions, such as those using motivational interviewing (MI) [<xref ref-type="bibr" rid="ref6">6</xref>] techniques.</p><p>Prior to ChatGPT&#x2019;s worldwide release in November 2022, our team developed MIBot [<xref ref-type="bibr" rid="ref7">7</xref>], a therapeutic chatbot using MI techniques to guide smokers toward the decision to quit smoking. MIBot has a structured conversation flow, using scripted questions and LLM-generated MI-style reflections [<xref ref-type="bibr" rid="ref6">6</xref>]. 
However, the popularity of ChatGPT and its advanced conversational capabilities raise questions about its influence on user interactions and expectations with simpler chatbots such as MIBot. These potential influences may in turn affect our future experiments with newer versions of MIBot, as the measurements used in future versions of MIBot may not be comparable to those in past versions, due to ChatGPT&#x2019;s potential influences on participants.</p></sec><sec id="s1-2"><title>Related Work</title><p>Several recent studies have delved into the realm of generative chatbots, used in a medical or therapeutic context, and explored their effect on users. Perski et al [<xref ref-type="bibr" rid="ref8">8</xref>] quantified the effect of the addition of a supportive chatbot to their smoking cessation application and found that it has increased user engagement and resulted in higher rates of quit success. Boucher et al [<xref ref-type="bibr" rid="ref9">9</xref>] provided a comprehensive review of artificially intelligent chatbots in digital mental health interventions, discussing their acceptability, effects on user engagement and mental health outcomes, as well as their weaknesses and risks at the time, such as language proficiency and understanding. Moilanen et al [<xref ref-type="bibr" rid="ref10">10</xref>] examined the effect of personality traits of a mental health chatbot on user engagement, finding that chatbots with a conscientious personality elicit the most user engagement and that users prefer their chatbot to be informative and confident rather than monotonic. 
Chow et al [<xref ref-type="bibr" rid="ref11">11</xref>] framed ChatGPT as a disruptive technology and explored its impact on medical chatbots, claiming that it has the potential to improve access to health care services while expressing concerns over risk factors such as reliability, transparency, privacy, and bias.</p><p>Together, these findings illustrate the growing influence of generative chatbots on user engagement and expectations in health-related contexts, particularly as advanced chatbots like ChatGPT redefine conversational norms. However, the impact of ChatGPT&#x2019;s widespread use on users&#x2019; perceptions and behaviors toward other chatbots remains underexplored, raising questions about how exposure to such an advanced technology shifts user expectations and affects user behaviors. These findings served as important inspirations and motivations for this study, where we specifically investigate how users of one chatbot (MIBot) would change after being exposed to another chatbot (ChatGPT).</p></sec><sec id="s1-3"><title>Study Objective</title><p>This study aims to investigate how user interactions with MIBot have changed following the release of ChatGPT and examines the relationship between familiarity with ChatGPT and these changes. By comparing dialogue sessions with MIBot conducted before and after ChatGPT&#x2019;s release, this study analyzes metrics such as average response length, satisfaction ratings, and effectiveness of the therapy. Additionally, we assess the relationship between participants&#x2019; familiarity with ChatGPT and these metrics to better understand the impact of ChatGPT on user behaviors and expectations. 
Findings from this study are expected to provide insights into how user expectations have evolved since the release of ChatGPT and inform future development strategies for chatbots in health-related applications.</p></sec></sec><sec id="s2" sec-type="methods"><title>Methods</title><sec id="s2-1"><title>Experiments</title><sec id="s2-1-1"><title>Overview</title><p>An experiment was conducted on November 18, 2022, about 2 weeks before the worldwide introduction of ChatGPT by OpenAI [<xref ref-type="bibr" rid="ref3">3</xref>]. We then repeated that experiment on May 16, 2023, about half a year after ChatGPT was released. The 2 experiments used the exact same version of MIBot [<xref ref-type="bibr" rid="ref7">7</xref>] but on different groups of independently recruited participants. From this part on, we will refer to the first experiment as MIBot (version 5.2) and the second experiment as MIBot (version 5.2A).</p></sec><sec id="s2-1-2"><title>Overall Experiment Flow</title><p>The overall experiment flow strictly followed what was detailed in the original MIBot paper [<xref ref-type="bibr" rid="ref7">7</xref>]. 
Here is a brief overview:</p><list list-type="order"><list-item><p>Recruitment: Participants were recruited through the Prolific [<xref ref-type="bibr" rid="ref12">12</xref>] paid web-based recruitment system after providing consent.</p></list-item><list-item><p>Preconversation surveys: Participants filled out surveys about their smoking habits on a custom website, including metrics used in the filtering process.</p></list-item><list-item><p>Conversation initiation: MIBot initiated with a text chat about smoking, continuing only with participant consent.</p></list-item><list-item><p>Core conversation: The main chatbot conversation about smoking cessation, which contained prescripted questions, responses from the user, and then generated reflections from the chatbot, described in more detail in the Design of MIBot section.</p></list-item><list-item><p>Postconversation: Participants completed another readiness-to-quit survey, the Consultation and Relational Empathy (CARE) Measure [<xref ref-type="bibr" rid="ref13">13</xref>], and additional qualitative questions.</p></list-item><list-item><p>Reporting: Completion of tasks was recorded in the Prolific system [<xref ref-type="bibr" rid="ref12">12</xref>].</p></list-item><list-item><p>One-week-later survey: A week later, participants answered a follow-up survey, also including readiness-to-quit, the completion of which, along with passing a manual data quality review, was required for the participants to receive their payments.</p></list-item></list></sec><sec id="s2-1-3"><title>Design of MIBot</title><p>MIBot asked 2 types of questions. We call the first type &#x201C;main questions&#x201D; (<xref ref-type="other" rid="box1">Textbox 1</xref>) and the second type &#x201C;yes or no questions&#x201D; (<xref ref-type="other" rid="box2">Textbox 2</xref>). 
The main questions were open-ended questions that promoted self-reflection within users about their smoking habits, while yes or no questions were close-ended questions posed after each generated reflection to find out whether or not the generated reflection made sense, was on topic, and was used as a transition to the next main question.</p><boxed-text id="box1"><title> Main questions in MIBot conversations.</title><list list-type="order"><list-item><p>To start, what is the thing you like most about smoking?</p></list-item><list-item><p>What else do you like about smoking?</p></list-item><list-item><p>Now, what is the thing you like least about smoking?</p></list-item><list-item><p>What else do you dislike about smoking?</p></list-item><list-item><p>Now, what is one thing about your smoking that you would like to change?</p></list-item><list-item><p>What will it look like when you have made this change in your smoking addiction?</p></list-item><list-item><p>Finally, what are the steps you need to take to make this change?</p></list-item></list></boxed-text><boxed-text id="box2"><title> Yes or no questions in MIBot conversations.</title><list list-type="order"><list-item><p>Did that make sense?</p></list-item><list-item><p>Did what I said make sense to you?</p></list-item><list-item><p>Does this make sense to you?</p></list-item></list></boxed-text><p>The overall conversation structure was fixed as follows:</p><list list-type="order"><list-item><p>Introductory statement about MIBot and asking for permission to talk about the participant&#x2019;s smoking habits</p></list-item><list-item><p>Five to seven repetitions of</p><list list-type="alpha-lower"><list-item><p>Main question</p></list-item><list-item><p>User response</p></list-item><list-item><p>Generated reflection</p></list-item><list-item><p>Yes or no question</p></list-item><list-item><p>User response</p></list-item></list></list-item><list-item><p>Conclusion and thanking the participant for their 
time</p></list-item></list></sec><sec id="s2-1-4"><title>Smoking Status</title><p>The context of our study requires us to keep track of the smoking status of the participants, measured by the following three metrics:</p><list list-type="order"><list-item><p>User status: A label that denotes if a participant would have passed the screening from their preconversation survey imported from our previous MIBot studies [<xref ref-type="bibr" rid="ref7">7</xref>]. If they have passed the screening, they are denoted as low confidence or discordant; if not, they are instead denoted as high confidence and not discordant.</p></list-item><list-item><p>Heaviness of Smoking Index [<xref ref-type="bibr" rid="ref14">14</xref>]: A validated survey metric calculated from cigarettes per day and time to the first cigarette of the day. Heaviness of Smoking Index is an integer, where a higher value indicates a heavier smoking habit.</p></list-item><list-item><p>Quit attempts made: A binary value that denotes if a participant has made at least 1 quit attempt in the week leading up to the MIBot conversation.</p></list-item></list></sec><sec id="s2-1-5"><title>MIBot Surveys</title><p>There were 3 surveys delivered to the participants from the original MIBot experiment flow: preconversation survey, postconversation survey, and 1-week-later survey. These surveys were used to determine how effective MIBot was in motivating smokers to make the decision to quit smoking as well as how participants felt about the conversation with MIBot.</p><p>The relevant parts of the survey for this study are the following:</p><list list-type="order"><list-item><p>The CARE Measure [<xref ref-type="bibr" rid="ref13">13</xref>] consists of questions regarding the participant&#x2019;s satisfaction with the conversation. Each question asks the participant to rate how well they think MIBot did on a scale from 1 to 5 or 0 if it does not apply. 
For example, participants were asked to evaluate MIBot&#x2019;s ability to &#x201C;make you feel at ease&#x201D; or &#x201C;letting you tell your &#x2018;story&#x2019;&#x201D; back when they were interacting with MIBot. The CARE Measure is only included in the postconversation survey.</p></list-item><list-item><p>The Readiness Ruler [<xref ref-type="bibr" rid="ref15">15</xref>] measures how ready the participant is to quit smoking. It consists of 3 ratings on a 0&#x2010;10 scale: how confident they are about quitting smoking now, how important it is for them to quit smoking, and how ready they feel to quit smoking now. The Readiness Ruler is included in all 3 surveys.</p></list-item><list-item><p>Two additional feedback questions, included only in the postconversation survey:</p><list list-type="alpha-lower"><list-item><p>&#x201C;What are 3 words that you would use to describe the chatbot?&#x201D;</p></list-item><list-item><p>&#x201C;What would you change about the conversation?&#x201D;</p></list-item></list></list-item></list></sec><sec id="s2-1-6"><title>ChatGPT Survey</title><p>To determine the extent of exposure to ChatGPT, for each participant in MIBot (version 5.2A), we included an additional short survey in the 1-week-later survey referred to as the ChatGPT survey. It contained 8 new questions designed to evaluate the participant&#x2019;s knowledge and use of ChatGPT prior to engaging in MIBot (version 5.2A). The full ChatGPT survey can be found in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>.</p></sec><sec id="s2-1-7"><title>Recruitment and Data Inclusion</title><p>The steps taken for recruiting the participants for both MIBot (version 5.2) and MIBot (version 5.2A) were the exact same as detailed in the original MIBot paper [<xref ref-type="bibr" rid="ref7">7</xref>]. 
Participants were recruited through the Prolific [<xref ref-type="bibr" rid="ref12">12</xref>] web-based recruitment system, where they were informed by a recruitment description that they would engage in a text-based conversation with a chatbot designed to promote readiness to quit smoking, provide feedback on their experience, and complete the 1-week-later survey. The study was framed as an opportunity to contribute to research on chatbot-assisted smoking cessation, emphasized the confidentiality of participant data, and clearly stated that participation was voluntary, with the option to opt out if they did not agree to the terms. The entire study was delivered to the participants remotely, and they could participate in the study using their personal computers or mobile devices.</p><p>Notably, participants were screened using Prolific&#x2019;s filters based on the following inclusion criteria: participants could be located in any country, were at least 18 years of age, were fluent in English, had a smoking status defined as either a current smoker (smoking at least 5 cigarettes a day for at least 1 year) or a recent smoker (smoking at least 5 cigarettes a day for less than 1 year), and had a minimum approval rate of 90% on their prior Prolific studies. Additionally, Prolific was set to recruit an equal number of male and female participants. However, due to additional screening conducted after recruitment, the final sample was not perfectly balanced by sex.</p><p>The data collected were manually reviewed for data inclusion following the same criteria as listed in the MIBot paper [<xref ref-type="bibr" rid="ref7">7</xref>] except for 1 major difference. 
In the original MIBot study, we only included participants with either of the following qualities in their Readiness Ruler scores:</p><list list-type="bullet"><list-item><p>Low confidence: confidence level less than or equal to 5</p></list-item><list-item><p>Discordant: importance level more than 5 points below the confidence level</p></list-item></list><p>As the focus of this study is instead about ChatGPT&#x2019;s influence on participants, we decided to include as many valid data entries as possible. Therefore, this filtering was not conducted in this study. As a result, the number of participants we included in this study increased from 100 to 143.</p></sec></sec><sec id="s2-2"><title>Evaluation Metrics</title><p>To evaluate MIBot conversations and user behaviors from various aspects, we designed several evaluation metrics, for which detailed definitions are provided below.</p><sec id="s2-2-1"><title>Response Length</title><p>In this study, the key aspect of user behavior we focused on was the length of their responses to questions prompted by MIBot. Response length is an important indicator of user engagement and willingness to interact with the chatbot. Longer responses suggest that participants are more actively reflecting on the conversation, which aligns with the therapeutic goals of MI sessions.</p><p>We defined response length by its word count, excluding any punctuation. We also categorized the questions MIBot asks into 2 categories and looked at the user responses separately to gain more insight. 
As a result, there are three metrics we applied to measure the lengths of participant responses:</p><list list-type="order"><list-item><p>Average response length: average length of responses to all questions.</p></list-item><list-item><p>Average response length (main): average length of responses to main questions, which are the scripted questions MIBot asks to provoke contemplation of the users&#x2019; smoking habits.</p></list-item><list-item><p>Average response length (yes or no): average length of responses to yes or no questions, which are shown in <xref ref-type="other" rid="box2">Textbox 2</xref>.</p></list-item></list></sec><sec id="s2-2-2"><title>Satisfaction With MIBot</title><p>Satisfaction with MIBot is a metric designed to measure user satisfaction after participating in a conversation with MIBot, a value between 0 and 1, calculated as the mean of the following three quantities:</p><list list-type="order"><list-item><p>Average CARE Measure (integers ranging from 1 to 5, in order of increasing satisfaction with MIBot), excluding answers where does not apply was selected. The mean is then rescaled to a number between 0 and 1 by subtracting 1 from the original value and dividing the result by 4.</p></list-item><list-item><p>Feedback sentiment score, based on answers to the first feedback question, &#x201C;What are 3 words that you would use to describe the chatbot?&#x201D; (integers ranging from 1 to 5, in order of increasing positivity). These scores were generated by automatically measuring the sentiment of the 3 words given by the user as feedback, described in the MIBot Surveys section. 
The sentiment is computed using the neural network bert-base-multilingual-uncased-sentiment [<xref ref-type="bibr" rid="ref16">16</xref>], which provides a score between 0 and 1.</p></list-item><list-item><p>MIBot improvement indicator, a binary value (0 or 1) if the participant indicated (in written feedback) that they would like MIBot improvement in response to the second feedback question, &#x201C;What would you change about the conversation?&#x201D; Responses are individually checked and manually labeled by a human collaborator. Since participants who suggested improvements are assumed to be less satisfied with MIBot, the value (1&#x2212;MIBot improvement indicator) is used in the averaging calculation to get satisfaction with MIBot.</p></list-item></list></sec><sec id="s2-2-3"><title>Effectiveness of MIBot</title><p>The goal of MIBot is to guide participants toward the decision to quit smoking by provoking contemplation. The more effective the conversation was, the more change we should observe in a participant. The effectiveness of MIBot is measured using 3 metrics related to the Readiness Ruler, as described in the MIBot Surveys section. The first of these, confidence change, is calculated as the difference between the confidence level before the conversation and the confidence level measured 1 week later, as recorded on the corresponding Readiness Rulers filled by the participants. Similarly, the importance change and readiness change were determined. As noted in the original MIBot paper [<xref ref-type="bibr" rid="ref7">7</xref>], the primary outcome is the confidence change, as this is the most predictive of smoking cessation success [<xref ref-type="bibr" rid="ref17">17</xref>-<xref ref-type="bibr" rid="ref19">19</xref>].</p></sec><sec id="s2-2-4"><title>Familiarity With ChatGPT</title><p>Familiarity with ChatGPT was given as a score between 0 and 126 (inclusive) to each participant based on their answers to the ChatGPT survey. 
Participants were first given a starting score of either 0 or 1: those who had not heard of ChatGPT were given a score of 0, and those who had were given a score of 1. Among those who had heard of ChatGPT, the score of those who had never used ChatGPT stayed at 1; for those who had used ChatGPT on top of knowing about it, they received an additional score according to the answers they had provided for 3 questions in the ChatGPT survey regarding their past use of ChatGPT. The three questions are as follows: (1) How long ago did you start using ChatGPT? (2) How frequently do you use ChatGPT? (3) On average, how long do your ChatGPT sessions last?</p><p>These 3 questions were presented as multiple-choice questions, the answers to which are presented in an ordered way and assigned a corresponding integer score from 1 to 5, as presented in <xref ref-type="table" rid="table1">Table 1</xref>. The final familiarity score they received was the product of the 3 integer scores, in addition to the 1 they already received. 
As a result, familiarity scores ranged from 0 to 126, with 0 being having never heard of ChatGPT, 1 being having heard of but never used ChatGPT, 2 being having used ChatGPT once a month or less for less than 5 minutes each session starting from less than a week ago, and 126 being having used ChatGPT multiple times per day with each session lasting longer than an hour for the past 5 months.</p><table-wrap id="t1" position="float"><label>Table 1.</label><caption><p>Corresponding description for familiarity score assignment.</p></caption><table id="table1" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Corresponding score</td><td align="left" valign="bottom">Duration of use</td><td align="left" valign="bottom">Frequency of use</td><td align="left" valign="bottom">Length of each session</td></tr></thead><tbody><tr><td align="left" valign="top">1</td><td align="left" valign="top">Less than a week</td><td align="left" valign="top">Once a month or less</td><td align="left" valign="top">Less than 5 minutes</td></tr><tr><td align="left" valign="top">2</td><td align="left" valign="top">Less than a month</td><td align="left" valign="top">Every 2 weeks</td><td align="left" valign="top">Less than 10 minutes</td></tr><tr><td align="left" valign="top">3</td><td align="left" valign="top">1&#x2010;3 months</td><td align="left" valign="top">Every week</td><td align="left" valign="top">10 to 30 minutes</td></tr><tr><td align="left" valign="top">4</td><td align="left" valign="top">3&#x2010;5 months</td><td align="left" valign="top">Every day</td><td align="left" valign="top">30 minutes to 1 hour</td></tr><tr><td align="left" valign="top">5</td><td align="left" valign="top">Over 5 months</td><td align="left" valign="top">Multiple times per day</td><td align="left" valign="top">More than 1 hour</td></tr></tbody></table></table-wrap></sec></sec><sec id="s2-3"><title>Statistical Analysis</title><sec id="s2-3-1"><title>Comparison of Pre- and Post-ChatGPT 
Cohorts</title><p>To capture the differences in behavior between participants in the 2 cohorts&#x2014;November 2022 (MIBot version 5.2) and May 2023 (MIBot version 5.2A)&#x2014;we used the Mann-Whitney <italic>U</italic> test to compare various metrics, such as average response length, satisfaction with MIBot, and changes in Readiness Ruler scores. This nonparametric test provided test statistics and <italic>P</italic> values for each metric, which were used to determine significant differences between the 2 groups. The test was done using the Python programming language (Python Software Foundation) with the pandas [<xref ref-type="bibr" rid="ref20">20</xref>] and SciPy [<xref ref-type="bibr" rid="ref21">21</xref>] libraries.</p></sec><sec id="s2-3-2"><title>Relationships Between Familiarity With ChatGPT and Other Variables</title><p>To examine the impact of familiarity with ChatGPT within the MIBot (version 5.2A) cohort, we performed Spearman rank correlation analysis. This test assessed the relationships between participants&#x2019; familiarity scores (ranging from 0 to 126) and key metrics, such as average response length, satisfaction with MIBot, and changes in Readiness Ruler scores. Spearman rank correlation provided correlation coefficients and <italic>P</italic> values, indicating the strength and significance of each relationship. The test was also done using Python with the pandas [<xref ref-type="bibr" rid="ref20">20</xref>] and SciPy [<xref ref-type="bibr" rid="ref21">21</xref>] libraries.</p></sec></sec><sec id="s2-4"><title>Ethical Considerations</title><p>This research was approved by the University of Toronto Research Ethics Board (protocol # 35567), as amended on June 29, 2022. Participants voluntarily provided informed consent by agreeing to all the terms stated in a consent form presented digitally to all participants during recruitment, fully outlining the study&#x2019;s goals, procedures, potential risks, and privacy guarantees. 
It specified that no personally identifiable information would be collected, and any inadvertent identifiers would be removed prior to analysis or publication. Participants received a total of US $6.25 for MIBot (version 5.2) and US $6.18 for MIBot (version 5.2A) as compensation for completing all tasks in the study, and partial compensation was not provided to those who did not complete all components of the experiment. No identifiable participant information is included in any images or supplementary materials in the manuscript.</p></sec></sec><sec id="s3" sec-type="results"><title>Results</title><sec id="s3-1"><title>Participant Demographic</title><p>Participant demographic data of both MIBot (version 5.2) and MIBot (version 5.2A) are listed in <xref ref-type="table" rid="table2">Tables 2</xref> and <xref ref-type="table" rid="table3">3</xref>, including categorical and continuous variables, respectively. Additional data of the demographics of the participants in both MIBot (version 5.2) and MIBot (version 5.2A) are listed in <xref ref-type="supplementary-material" rid="app2">Multimedia Appendix 2</xref>.</p><table-wrap id="t2" position="float"><label>Table 2.</label><caption><p>Categorical demographic data of participants in cohort MIBot (version 5.2; November 2022, pre-ChatGPT) and MIBot (version 5.2A; May 2023, post-ChatGPT).</p></caption><table id="table2" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom" colspan="2">Characteristic</td><td align="left" valign="bottom">MIBot (version 5.2) (n=143), n (%)</td><td align="left" valign="bottom">MIBot (version 5.2A) (n=129), n (%)</td></tr></thead><tbody><tr><td align="left" valign="top" colspan="4"><bold>Sex</bold></td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Male</td><td align="left" valign="top">72 (50.3)</td><td align="left" valign="top">63 (48.8)</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Female</td><td align="left" 
valign="top">71 (49.7)</td><td align="left" valign="top">66 (51.2)</td></tr><tr><td align="left" valign="top" colspan="4"><bold>User status</bold></td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Low confidence or discordant</td><td align="left" valign="top">100 (69.9)</td><td align="left" valign="top">91 (70.5)</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">High confidence and not discordant</td><td align="left" valign="top">43 (30.1)</td><td align="left" valign="top">38 (29.5)</td></tr><tr><td align="left" valign="top" colspan="4"><bold>Smoking status</bold></td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">I am a current smoker (smoke at least 5 cigarettes a day and have smoked this amount for at least 1 year)</td><td align="left" valign="top">121 (84.6)</td><td align="left" valign="top">107 (82.9)</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">I am a recent smoker (smoke at least 5 cigarettes a day and have smoked this amount for less than 1 year)</td><td align="left" valign="top">22 (15.4)</td><td align="left" valign="top">22 (17.1)</td></tr><tr><td align="left" valign="top" colspan="4"><bold>Quit attempts made</bold></td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Yes</td><td align="left" valign="top">69 (48.3)</td><td align="left" valign="top">46 (35.7)</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">No</td><td align="left" valign="top">74 (51.7)</td><td align="left" valign="top">83 (64.3)</td></tr></tbody></table></table-wrap><table-wrap id="t3" position="float"><label>Table 3.</label><caption><p>Continuous demographic data of participants in cohort MIBot (version 5.2; November 2022, pre-ChatGPT) and MIBot (version 5.2A; May 2023, post-ChatGPT).</p></caption><table id="table3" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Characteristic</td><td align="left" valign="bottom" 
colspan="2">MIBot (version 5.2)</td><td align="left" valign="bottom" colspan="2">MIBot (version 5.2A)</td></tr><tr><td align="left" valign="top"/><td align="left" valign="bottom">Mean (SD)</td><td align="left" valign="bottom">Median (IQR)</td><td align="left" valign="bottom">Mean (SD)</td><td align="left" valign="bottom">Median (IQR)</td></tr></thead><tbody><tr><td align="left" valign="top">Age (years)</td><td align="left" valign="top">29.22 (9.69)</td><td align="left" valign="top">26.00 (23.00&#x2010;33.00)</td><td align="left" valign="top">32.75 (11.36)</td><td align="left" valign="top">29.00 (24.00&#x2010;39.00)</td></tr><tr><td align="left" valign="top">HSI<sup><xref ref-type="table-fn" rid="table3fn1">a</xref></sup></td><td align="left" valign="top">1.45 (1.38)</td><td align="left" valign="top">1.00 (0.00&#x2010;2.00)</td><td align="left" valign="top">1.67 (1.45)</td><td align="left" valign="top">1.00 (0.00&#x2010;3.00)</td></tr><tr><td align="left" valign="top" colspan="5"><bold>Readiness Rulers, preconversation</bold></td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Confidence</td><td align="left" valign="top">4.52 (2.75)</td><td align="left" valign="top">4.00 (2.00&#x2010;7.00)</td><td align="left" valign="top">4.12 (2.60)</td><td align="left" valign="top">4.00 (2.00&#x2010;6.00)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Importance</td><td align="left" valign="top">5.84 (2.84)</td><td align="left" valign="top">6.00 (3.00&#x2010;8.00)</td><td align="left" valign="top">5.60 (2.65)</td><td align="left" valign="top">6.00 (3.00&#x2010;8.00)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Readiness</td><td align="left" valign="top">5.36 (2.83)</td><td align="left" valign="top">5.00 (3.00&#x2010;8.00)</td><td align="left" 
valign="top">4.79 (2.58)</td><td align="left" valign="top">5.00 (3.00&#x2010;7.00)</td></tr></tbody></table><table-wrap-foot><fn id="table3fn1"><p><sup>a</sup>HSI: Heaviness of Smoking Index.</p></fn></table-wrap-foot></table-wrap></sec><sec id="s3-2"><title>Reach of ChatGPT</title><p>The familiarity score, described in the Familiarity With ChatGPT section, provides an estimate of the reach of ChatGPT to the public. <xref ref-type="table" rid="table4">Table 4</xref> provides a more detailed description of the distribution of the familiarity score, where we bin the participants based on familiarity score ranges and assign labels to each score range. &#x201C;Unexposed&#x201D; is the group of participants who have not heard of ChatGPT prior to this study. &#x201C;Aware&#x201D; denotes that the participants have heard of ChatGPT but did not use it in any capacity. People who have used ChatGPT are separated into 3 groups, which are &#x201C;casual user,&#x201D; &#x201C;consistent user,&#x201D; and &#x201C;dedicated user,&#x201D; based on their familiarity score.</p><table-wrap id="t4" position="float"><label>Table 4.</label><caption><p>Distribution of ChatGPT familiarity levels among participants in the MIBot (version 5.2A) cohort.</p></caption><table id="table4" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">ChatGPT familiarity level</td><td align="left" valign="bottom">Count, n (%)</td><td align="left" valign="bottom">Score</td></tr></thead><tbody><tr><td align="left" valign="top">Unexposed</td><td align="char" char="." valign="top">12 (9.3)</td><td align="left" valign="top">0</td></tr><tr><td align="left" valign="top">Aware</td><td align="char" char="." valign="top">34 (26.4)</td><td align="left" valign="top">1</td></tr><tr><td align="left" valign="top">Casual user</td><td align="char" char="." 
valign="top">17 (13.2)</td><td align="left" valign="top">2 to 8</td></tr><tr><td align="left" valign="top">Consistent user</td><td align="char" char="." valign="top">37 (28.7)</td><td align="left" valign="top">9 to 27</td></tr><tr><td align="left" valign="top">Dedicated user</td><td align="char" char="." valign="top">29 (22.5)</td><td align="left" valign="top">28 or higher</td></tr></tbody></table></table-wrap></sec><sec id="s3-3"><title>Comparison of Pre- and Post-ChatGPT Cohorts</title><p><xref ref-type="table" rid="table5">Table 5</xref> shows the Mann-Whitney <italic>U</italic> test results comparing participants from the November 2022 (MIBot version 5.2) and May 2023 (MIBot version 5.2A) cohorts. In terms of average response length, there was no significant difference between the 2 cohorts, whether looking at all responses together or breaking them down into responses to main questions and responses to yes or no questions. Satisfaction with MIBot was significantly higher in MIBot (version 5.2) than in MIBot (version 5.2A; <italic>U</italic>=11,331.0; <italic>P</italic>=.001). Specifically, of the 3 metrics aggregated into satisfaction with MIBot, the Average CARE Measure was the only one showing a significant difference, being significantly higher in MIBot (version 5.2) than in MIBot (version 5.2A; <italic>U</italic>=10,838.0; <italic>P</italic>=.01). 
As for changes in the Readiness Ruler, no significant differences were found between the cohorts in terms of confidence change, importance change, or readiness change.</p><table-wrap id="t5" position="float"><label>Table 5.</label><caption><p>Results of the Mann-Whitney <italic>U</italic> test comparing key metrics between cohort MIBot (version 5.2; pre-ChatGPT) and MIBot (version 5.2A; post-ChatGPT).</p></caption><table id="table5" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom" colspan="2">Variable</td><td align="left" valign="bottom" colspan="2">MIBot (version 5.2)</td><td align="left" valign="bottom" colspan="2">MIBot (version 5.2A)</td><td align="left" valign="bottom">Test statistic (<italic>U</italic>)</td><td align="left" valign="bottom"><italic>P</italic> value</td></tr><tr><td align="left" valign="bottom" colspan="2"/><td align="left" valign="bottom">Mean (SD)</td><td align="left" valign="bottom">Median (IQR)</td><td align="left" valign="bottom">Mean (SD)</td><td align="left" valign="bottom">Median (IQR)</td><td align="left" valign="bottom"/><td align="left" valign="bottom"/></tr></thead><tbody><tr><td align="left" valign="top" colspan="8"><bold>Response length</bold></td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Average response length</td><td align="left" valign="top">4.98 (2.49)</td><td align="left" valign="top">4.46 (3.31&#x2010;5.89)</td><td align="left" valign="top">5.36 (3.54)</td><td align="left" valign="top">4.29 (3.13&#x2010;7.00)</td><td align="left" valign="top">9248.0</td><td align="left" valign="top">.97</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Average response length (main)</td><td align="left" valign="top">8.18 (4.00)</td><td align="left" valign="top">7.60 (5.50&#x2010;9.69)</td><td align="left" valign="top">8.04 (4.71)</td><td align="left" valign="top">6.62 (4.86&#x2010;10.43)</td><td align="left" valign="top">9936.5</td><td align="left" 
valign="top">.27</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Average response length (yes or no)</td><td align="left" valign="top">2.02 (1.91)</td><td align="left" valign="top">1.00 (1.00&#x2010;2.07)</td><td align="left" valign="top">2.44 (3.04)</td><td align="left" valign="top">1.17 (1.00&#x2010;2.80)</td><td align="left" valign="top">8301.5</td><td align="left" valign="top">.13</td></tr><tr><td align="left" valign="top" colspan="8"><bold>Satisfaction scores</bold></td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Satisfaction with MIBot</td><td align="left" valign="top">0.74 (0.22)</td><td align="left" valign="top">0.85 (0.52&#x2010;0.91)</td><td align="left" valign="top">0.66 (0.21)</td><td align="left" valign="top">0.61 (0.49&#x2010;0.85)</td><td align="left" valign="top">11,331.0</td><td align="left" valign="top">.001</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Average CARE<sup><xref ref-type="table-fn" rid="table5fn1">a</xref></sup> Measure</td><td align="left" valign="top">0.77 (0.16)</td><td align="left" valign="top">0.78 (0.66&#x2010;0.90)</td><td align="left" valign="top">0.72 (0.17)</td><td align="left" valign="top">0.74 (0.58&#x2010;0.84)</td><td align="left" valign="top">10,838.0</td><td align="left" valign="top">.01</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">MIBot improvement indicator</td><td align="left" valign="top">0.57 (1.01)</td><td align="left" valign="top">0.00 (0.00&#x2010;1.00)</td><td align="left" valign="top">0.76 (1.12)</td><td align="left" valign="top">0.00 (0.00&#x2010;1.00)</td><td align="left" valign="top">8192.5</td><td align="left" valign="top">.06</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Feedback sentiment score</td><td align="left" valign="top">0.79 (0.15)</td><td align="left" valign="top">0.80 (0.80&#x2010;0.80)</td><td align="left" valign="top">0.76 (0.18)</td><td align="left" 
valign="top">0.80 (0.80&#x2010;0.80)</td><td align="left" valign="top">10,028.0</td><td align="left" valign="top">.15</td></tr><tr><td align="left" valign="top" colspan="8"><bold>Readiness Ruler</bold></td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Confidence change</td><td align="left" valign="top">0.86 (2.32)</td><td align="left" valign="top">1.00 (0.00&#x2010;2.00)</td><td align="left" valign="top">0.60 (2.08)</td><td align="left" valign="top">0.00 (0.00&#x2010;2.00)</td><td align="left" valign="top">9893.0</td><td align="left" valign="top">.29</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Importance change</td><td align="left" valign="top">0.69 (1.85)</td><td align="left" valign="top">0.00 (0.00&#x2010;2.00)</td><td align="left" valign="top">0.40 (1.98)</td><td align="left" valign="top">0.00 (0.00&#x2010;1.00)</td><td align="left" valign="top">10,003.5</td><td align="left" valign="top">.21</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Readiness change</td><td align="left" valign="top">0.35 (1.82)</td><td align="left" valign="top">0.00 (&#x2212;1.00 to 1.00)</td><td align="left" valign="top">0.33 (2.07)</td><td align="left" valign="top">0.00 (&#x2212;1.00 to 1.00)</td><td align="left" valign="top">9260.0</td><td align="left" valign="top">.95</td></tr></tbody></table><table-wrap-foot><fn id="table5fn1"><p><sup>a</sup>CARE: Consultation and Relational Empathy.</p></fn></table-wrap-foot></table-wrap></sec><sec id="s3-4"><title>Relationships Between Familiarity With ChatGPT and Other Variables</title><p><xref ref-type="table" rid="table6">Table 6</xref> shows the Spearman rank correlation results evaluating relationships between familiarity with ChatGPT and various other variables within the MIBot (version 5.2A) cohort. 
In terms of average response length, there was a significant positive correlation between familiarity with ChatGPT and overall average response length (&#x03C1;=0.181; <italic>P</italic>=.04) as well as with average response length for main questions (&#x03C1;=0.180; <italic>P</italic>=.04) and average response length for yes or no questions (&#x03C1;=0.197; <italic>P</italic>=.03). Satisfaction with MIBot had a weak negative correlation with familiarity score, but it was not statistically significant (&#x03C1;=&#x2212;0.171; <italic>P</italic>=.05). Of the 3 metrics aggregated into satisfaction with MIBot, only the MIBot improvement indicator showed a significant positive correlation with familiarity with ChatGPT (&#x03C1;=0.188; <italic>P</italic>=.03). Among the Readiness Ruler changes, a significant positive correlation was observed between familiarity with ChatGPT and importance change (&#x03C1;=0.296; <italic>P</italic>&#x003C;.001) but not for confidence change or readiness change.</p><table-wrap id="t6" position="float"><label>Table 6.</label><caption><p>Spearman rank correlation analysis for the MIBot (version 5.2A) cohort.</p></caption><table id="table6" frame="hsides" rules="groups"><thead><tr><td align="left" valign="top" colspan="2">Variable</td><td align="left" valign="bottom" colspan="2">Familiarity with ChatGPT</td></tr><tr><td align="left" valign="top" colspan="2"/><td align="left" valign="top">&#x03C1;</td><td align="left" valign="top"><italic>P</italic> value</td></tr></thead><tbody><tr><td align="left" valign="top" colspan="4"><bold>Response length</bold></td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Average response length</td><td align="left" valign="top">0.181</td><td align="char" char="." valign="top">.04</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Average response length (main)</td><td align="left" valign="top">0.180</td><td align="char" char="." 
valign="top">.04</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Average response length (yes or no)</td><td align="left" valign="top">0.197</td><td align="char" char="." valign="top">.03</td></tr><tr><td align="left" valign="top" colspan="4"><bold>Satisfaction scores</bold></td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Satisfaction with MIBot</td><td align="left" valign="top">&#x2212;0.171</td><td align="char" char="." valign="top">.05</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Average CARE<sup><xref ref-type="table-fn" rid="table6fn1">a</xref></sup> Measure</td><td align="left" valign="top">&#x2212;0.112</td><td align="char" char="." valign="top">.21</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">MIBot improvement indicator</td><td align="left" valign="top">0.188</td><td align="char" char="." valign="top">.03</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Feedback sentiment score</td><td align="left" valign="top">&#x2212;0.023</td><td align="char" char="." valign="top">.80</td></tr><tr><td align="left" valign="top" colspan="4"><bold>Readiness Ruler</bold></td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Confidence change</td><td align="left" valign="top">0.165</td><td align="char" char="." valign="top">.06</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Importance change</td><td align="left" valign="top">0.296</td><td align="char" char="." valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Readiness change</td><td align="left" valign="top">0.078</td><td align="char" char="." 
valign="top">.38</td></tr></tbody></table><table-wrap-foot><fn id="table6fn1"><p><sup>a</sup>CARE: Consultation and Relational Empathy.</p></fn></table-wrap-foot></table-wrap></sec></sec><sec id="s4" sec-type="discussion"><title>Discussion</title><sec id="s4-1"><title>Principal Findings</title><p>This study aimed to investigate how user interactions with MIBot changed following the release of ChatGPT as well as the relationship between ChatGPT familiarity and these changes. From the results, we found that users interacting with MIBot after the release of ChatGPT were less satisfied with the chatbot, particularly in terms of perceived empathy, but users more familiar with ChatGPT provided longer responses and showed a greater increase in their perceived importance of quitting smoking.</p><p>The premise of this study is that people have been exposed to ChatGPT due to its high popularity, which is supported by the distribution of familiarity scores in the MIBot (version 5.2A) cohort. As shown in <xref ref-type="table" rid="table4">Table 4</xref>, ChatGPT has a widespread reach, with only 12 (9.3%) participants of MIBot (version 5.2A) having never heard of it, and 34 (26.4%) having heard of it but never used it. Collectively, 83 (64.3%) participants have used ChatGPT in at least some capacity, most of whom are consistent or even dedicated users, indicating that the public has received massive exposure to the popular chatbot.</p><p>Using the Mann-Whitney <italic>U</italic> test (<xref ref-type="table" rid="table5">Table 5</xref>) to compare participants from the MIBot (version 5.2) and MIBot (version 5.2A) cohorts, we observed that most variables did not show significant differences between the groups. However, satisfaction with MIBot was significantly lower in the MIBot (version 5.2A) cohort (<italic>U</italic>=11,331.0; <italic>P</italic>=.001), a finding primarily driven by differences in the Average CARE Measure. 
This specific component of the satisfaction score, which reflects perceived empathy in interactions, was significantly higher in the MIBot (version 5.2) cohort (<italic>U</italic>=10,838.0; <italic>P</italic>=.01). These findings suggest that participants in the post-ChatGPT cohort, many of whom were familiar with or at least aware of ChatGPT&#x2019;s advanced conversational capabilities, may have developed higher expectations for chatbot empathy, which MIBot may not fully meet.</p><p>Within the MIBot (version 5.2A) cohort, Spearman rank correlation analysis revealed that familiarity with ChatGPT was positively correlated with average response length across all response types, indicating that more experienced users were likely to engage in longer interactions. However, while users who are more familiar with ChatGPT are more likely to suggest improvements for MIBot (&#x03C1;=0.188; <italic>P</italic>=.03), satisfaction with MIBot as a whole had only a weak, nonsignificant negative correlation with familiarity (&#x03C1;=&#x2212;0.171; <italic>P</italic>=.05), even though the <italic>U</italic> test results showed that satisfaction was significantly lower in the MIBot (version 5.2A) cohort. This discrepancy suggests that while ChatGPT exposure may influence satisfaction overall, familiarity alone does not predict satisfaction levels. It may be that other factors unique to the MIBot (version 5.2A) cohort, such as general exposure to more advanced conversational artificial intelligence or broader trends in technology expectations, are impacting satisfaction with MIBot in a way that the specific familiarity score we designed failed to capture. 
In other words, the drop in satisfaction with MIBot might reflect a general shift in expectations for chatbot performance rather than an effect specific to individual familiarity with ChatGPT.</p><p>Interestingly, although familiarity with ChatGPT appears to make users more critical of MIBot&#x2019;s capabilities, it is also associated with an increase in participants&#x2019; perceived importance of quitting smoking (&#x03C1;=0.296; <italic>P</italic>&#x003C;.001), a key measure of MIBot&#x2019;s effectiveness. This seemingly paradoxical finding could suggest that while exposure to advanced generative chatbots raises expectations for technical quality, it might also enhance users&#x2019; receptiveness to the broader goals of MIBot, such as helping users resolve ambivalence and guiding them toward change, and, as a result, make a less advanced chatbot more effective.</p></sec><sec id="s4-2"><title>Practical Implications</title><p>The findings from this study suggest several practical implications for future chatbot development, especially in health-related applications. The decrease in satisfaction with MIBot among post-ChatGPT users highlights a need for researchers and developers to adapt to higher expectations of chatbots, especially for empathy. Additionally, the tendency of users familiar with ChatGPT to provide longer, more detailed responses suggests that chatbots should be capable of handling more nuanced interactions. 
Finally, the positive correlation between ChatGPT familiarity and MIBot&#x2019;s effectiveness in increasing the perceived importance of quitting smoking implies that users more experienced with advanced generative chatbots may have more trust in the technology and be more receptive to interactions guiding them toward change.</p></sec><sec id="s4-3"><title>Comparison With Prior Works</title><p>Unlike prior studies that examined and reviewed various aspects of chatbots that may affect user engagement and effectiveness in different contexts [<xref ref-type="bibr" rid="ref8">8</xref>-<xref ref-type="bibr" rid="ref10">10</xref>], this study specifically and uniquely investigates how exposure to and familiarity with a more advanced chatbot (ChatGPT) affect user interactions with a simpler chatbot (MIBot). Building on our previous work on MIBot [<xref ref-type="bibr" rid="ref7">7</xref>], our new experiments suggest that MIBot continues to increase users&#x2019; readiness to quit even after the introduction of ChatGPT. Nevertheless, overall user satisfaction has decreased, possibly affected by higher user expectations among those exposed to ChatGPT. This could be a disruptive effect from ChatGPT as predicted by Chow et al [<xref ref-type="bibr" rid="ref11">11</xref>]. Moreover, our findings also provide unique insights not found in related prior works, such as that familiarity with ChatGPT positively correlates with core metrics for user engagement with and effectiveness of MIBot, a simpler chatbot than ChatGPT. This study also presents a measurement, at a specific point in time, of the exposure level to ChatGPT among our recruited participants, which demonstrates the extent of ChatGPT&#x2019;s reach at that time.</p></sec><sec id="s4-4"><title>Limitations</title><p>This study has several limitations. 
Since we followed the same experiment flow as the original MIBot paper [<xref ref-type="bibr" rid="ref7">7</xref>] and used mostly the same evaluation metrics, the limitations of the MIBot experiments documented in the original MIBot paper [<xref ref-type="bibr" rid="ref7">7</xref>] also apply to this study. Moreover, there exists an additional type of sampling bias specific to this study. Because we recruited participants for both of our experiments through Prolific [<xref ref-type="bibr" rid="ref12">12</xref>], a web-based recruitment system, it is possible that these participants are more fluent with technology than the general public and therefore more likely to have been exposed to ChatGPT or to have the effects of ChatGPT manifest in a way that does not fairly represent a more general population. Furthermore, our 2 experiments used different groups of people with some demographic differences, notably with a difference in their average age, which may result in different smoking behaviors and success rates of smoking cessation [<xref ref-type="bibr" rid="ref22">22</xref>,<xref ref-type="bibr" rid="ref23">23</xref>]. Finally, it is important to acknowledge the possibility of confounding factors not accounted for in our study, which may have influenced how participants interacted with MIBot or perceived its effectiveness, along with familiarity with ChatGPT.</p></sec><sec id="s4-5"><title>Conclusions</title><p>Given MIBot, a generative chatbot for smoking cessation less advanced than ChatGPT, this study aimed to find any potential changes to how users interact with MIBot by comparing user interactions before and after ChatGPT&#x2019;s release. We found that post-ChatGPT users are less satisfied with MIBot overall, particularly in terms of perceived empathy. Moreover, as users gain more familiarity with ChatGPT, they provide longer responses and show a greater increase in their perceived importance of quitting smoking. 
These findings suggest the need for continuous innovation in chatbot technology, particularly in digital health, to meet the evolving expectations of users accustomed to more advanced chatbot interactions.</p></sec></sec></body><back><ack><p>The authors acknowledge their long-standing collaboration with the Intrepid Lab of Dr Peter Selby at the Centre for Addiction and Mental Health in Toronto and Professor Matt Ratto in the Faculty of Information at the University of Toronto. This research was funded by a Natural Sciences and Engineering Research Council of Canada Discovery grant (RGPIN-2019-04395) and a New Frontiers in Research Fund grant (NFRFE-2021-00449).</p></ack><notes><sec><title>Data Availability</title><p>The datasets generated and analyzed during this study are available from the corresponding author on reasonable request.</p></sec></notes><fn-group><fn fn-type="con"><p>JZ and JR conceptualized this research work and oversaw project administration in terms of managing, planning, and coordinating the experiments. JZ, AD, CW, MA, and AB contributed to data curation and to developing the chatbot and the scripts. JZ, AD, CW, and SV contributed to conducting all the formal analyses. PS and JR secured funding for the project and provided overall supervision of all the research activities. JZ, AD, CW, and MA did all the investigation work related to the study. JZ, SV, AB, and JR contributed to developing the methodology. JR provided the computing and experimental resources for the study. JZ, AD, and CW contributed to the validation and visualization of the data collected. JZ, AD, CW, and JR were the writers of the original draft, while JZ and JR critically reviewed and edited the manuscript. 
All authors made significant contributions to this work and approved it for publication.</p></fn><fn fn-type="conflict"><p>None declared.</p></fn></fn-group><glossary><title>Abbreviations</title><def-list><def-item><term id="abb1">CARE</term><def><p>Consultation and Relational Empathy</p></def></def-item><def-item><term id="abb2">LLM</term><def><p>large language model</p></def></def-item><def-item><term id="abb3">MI</term><def><p>motivational interviewing</p></def></def-item></def-list></glossary><ref-list><title>References</title><ref id="ref1"><label>1</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Adamopoulou</surname><given-names>E</given-names> </name><name name-style="western"><surname>Moussiades</surname><given-names>L</given-names> </name></person-group><article-title>Chatbots: history, technology, and applications</article-title><source>Mach Learn Appl</source><year>2020</year><month>12</month><volume>2</volume><fpage>100006</fpage><pub-id pub-id-type="doi">10.1016/j.mlwa.2020.100006</pub-id></nlm-citation></ref><ref id="ref2"><label>2</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Shanahan</surname><given-names>M</given-names> </name><name name-style="western"><surname>McDonell</surname><given-names>K</given-names> </name><name name-style="western"><surname>Reynolds</surname><given-names>L</given-names> </name></person-group><article-title>Role play with large language models</article-title><source>Nature</source><year>2023</year><month>11</month><volume>623</volume><issue>7987</issue><fpage>493</fpage><lpage>498</lpage><pub-id pub-id-type="doi">10.1038/s41586-023-06647-8</pub-id><pub-id pub-id-type="medline">37938776</pub-id></nlm-citation></ref><ref id="ref3"><label>3</label><nlm-citation citation-type="web"><article-title>Introducing 
ChatGPT</article-title><source>OpenAI</source><year>2022</year><access-date>2023-12-19</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://openai.com/blog/chatgpt/">https://openai.com/blog/chatgpt/</ext-link></comment></nlm-citation></ref><ref id="ref4"><label>4</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Biswas</surname><given-names>SS</given-names> </name></person-group><article-title>Role of Chat GPT in public health</article-title><source>Ann Biomed Eng</source><year>2023</year><month>05</month><volume>51</volume><issue>5</issue><fpage>868</fpage><lpage>869</lpage><pub-id pub-id-type="doi">10.1007/s10439-023-03172-7</pub-id><pub-id pub-id-type="medline">36920578</pub-id></nlm-citation></ref><ref id="ref5"><label>5</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Thirunavukarasu</surname><given-names>AJ</given-names> </name><name name-style="western"><surname>Ting</surname><given-names>DSJ</given-names> </name><name name-style="western"><surname>Elangovan</surname><given-names>K</given-names> </name><name name-style="western"><surname>Gutierrez</surname><given-names>L</given-names> </name><name name-style="western"><surname>Tan</surname><given-names>TF</given-names> </name><name name-style="western"><surname>Ting</surname><given-names>DSW</given-names> </name></person-group><article-title>Large language models in medicine</article-title><source>Nat Med</source><year>2023</year><month>08</month><volume>29</volume><issue>8</issue><fpage>1930</fpage><lpage>1940</lpage><pub-id pub-id-type="doi">10.1038/s41591-023-02448-8</pub-id><pub-id pub-id-type="medline">37460753</pub-id></nlm-citation></ref><ref id="ref6"><label>6</label><nlm-citation citation-type="book"><person-group person-group-type="author"><name name-style="western"><surname>Miller</surname><given-names>W</given-names> </name><name 
name-style="western"><surname>Rollnick</surname><given-names>S</given-names> </name></person-group><source>Motivational Interviewing: Helping People Change and Grow</source><year>2023</year><publisher-name>The Guilford Press</publisher-name></nlm-citation></ref><ref id="ref7"><label>7</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Brown</surname><given-names>A</given-names> </name><name name-style="western"><surname>Kumar</surname><given-names>AT</given-names> </name><name name-style="western"><surname>Melamed</surname><given-names>O</given-names> </name><etal/></person-group><article-title>A motivational interviewing chatbot with generative reflections for increasing readiness to quit smoking: iterative development study</article-title><source>JMIR Ment Health</source><year>2023</year><month>10</month><day>17</day><volume>10</volume><fpage>e49132</fpage><pub-id pub-id-type="doi">10.2196/49132</pub-id><pub-id pub-id-type="medline">37847539</pub-id></nlm-citation></ref><ref id="ref8"><label>8</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Perski</surname><given-names>O</given-names> </name><name name-style="western"><surname>Crane</surname><given-names>D</given-names> </name><name name-style="western"><surname>Beard</surname><given-names>E</given-names> </name><name name-style="western"><surname>Brown</surname><given-names>J</given-names> </name></person-group><article-title>Does the addition of a supportive chatbot promote user engagement with a smoking cessation app? An experimental study [published correction appears in Digit Health. 
2020 May 22;6:2055207620930958]</article-title><source>Digit Health</source><year>2019</year><month>01</month><volume>5</volume><fpage>2055207619880676</fpage><pub-id pub-id-type="doi">10.1177/2055207619880676</pub-id></nlm-citation></ref><ref id="ref9"><label>9</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Boucher</surname><given-names>EM</given-names> </name><name name-style="western"><surname>Harake</surname><given-names>NR</given-names> </name><name name-style="western"><surname>Ward</surname><given-names>HE</given-names> </name><etal/></person-group><article-title>Artificially intelligent chatbots in digital mental health interventions: a review</article-title><source>Expert Rev Med Devices</source><year>2021</year><month>12</month><volume>18</volume><issue>sup1</issue><fpage>37</fpage><lpage>49</lpage><pub-id pub-id-type="doi">10.1080/17434440.2021.2013200</pub-id><pub-id pub-id-type="medline">34872429</pub-id></nlm-citation></ref><ref id="ref10"><label>10</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>Moilanen</surname><given-names>J</given-names> </name><name name-style="western"><surname>Visuri</surname><given-names>A</given-names> </name><name name-style="western"><surname>Suryanarayana</surname><given-names>SA</given-names> </name><name name-style="western"><surname>Alorwu</surname><given-names>A</given-names> </name><name name-style="western"><surname>Yatani</surname><given-names>K</given-names> </name><name name-style="western"><surname>Hosio</surname><given-names>S</given-names> </name></person-group><article-title>Measuring the effect of mental health chatbot personality on user engagement</article-title><conf-name>MUM 2022: 21st International Conference on Mobile and Ubiquitous Multimedia</conf-name><conf-date>Nov 27-30, 2022</conf-date><conf-loc>Lisbon, Portugal</conf-loc><pub-id 
pub-id-type="doi">10.1145/3568444.3568464</pub-id></nlm-citation></ref><ref id="ref11"><label>11</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Chow</surname><given-names>JCL</given-names> </name><name name-style="western"><surname>Sanders</surname><given-names>L</given-names> </name><name name-style="western"><surname>Li</surname><given-names>K</given-names> </name></person-group><article-title>Impact of ChatGPT on medical chatbots as a disruptive technology</article-title><source>Front Artif Intell</source><year>2023</year><volume>6</volume><pub-id pub-id-type="doi">10.3389/frai.2023.1166014</pub-id></nlm-citation></ref><ref id="ref12"><label>12</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Palan</surname><given-names>S</given-names> </name><name name-style="western"><surname>Schitter</surname><given-names>C</given-names> </name></person-group><article-title>Prolific.ac&#x2014;a subject pool for online experiments</article-title><source>J Behav Exp Finance</source><year>2018</year><month>03</month><volume>17</volume><fpage>22</fpage><lpage>27</lpage><pub-id pub-id-type="doi">10.1016/j.jbef.2017.12.004</pub-id></nlm-citation></ref><ref id="ref13"><label>13</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Mercer</surname><given-names>SW</given-names> </name><name name-style="western"><surname>Maxwell</surname><given-names>M</given-names> </name><name name-style="western"><surname>Heaney</surname><given-names>D</given-names> </name><name name-style="western"><surname>Watt</surname><given-names>GC</given-names> </name></person-group><article-title>The consultation and relational empathy (CARE) measure: development and preliminary validation and reliability of an empathy-based consultation process measure</article-title><source>Fam 
Pract</source><year>2004</year><month>12</month><volume>21</volume><issue>6</issue><fpage>699</fpage><lpage>705</lpage><pub-id pub-id-type="doi">10.1093/fampra/cmh621</pub-id></nlm-citation></ref><ref id="ref14"><label>14</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Heatherton</surname><given-names>TF</given-names> </name><name name-style="western"><surname>Kozlowski</surname><given-names>LT</given-names> </name><name name-style="western"><surname>Frecker</surname><given-names>RC</given-names> </name><name name-style="western"><surname>Rickert</surname><given-names>W</given-names> </name><name name-style="western"><surname>Robinson</surname><given-names>J</given-names> </name></person-group><article-title>Measuring the heaviness of smoking: using self-reported time to the first cigarette of the day and number of cigarettes smoked per day</article-title><source>Br J Addict</source><year>1989</year><month>07</month><volume>84</volume><issue>7</issue><fpage>791</fpage><lpage>799</lpage><pub-id pub-id-type="doi">10.1111/j.1360-0443.1989.tb03059.x</pub-id><pub-id pub-id-type="medline">2758152</pub-id></nlm-citation></ref><ref id="ref15"><label>15</label><nlm-citation citation-type="web"><article-title>Readiness Ruler</article-title><source>Center for Evidence-Based Practices | Case Western Reserve University</source><year>2021</year><access-date>2023-12-19</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://case.edu/socialwork/centerforebp/resources/readiness-ruler">https://case.edu/socialwork/centerforebp/resources/readiness-ruler</ext-link></comment></nlm-citation></ref><ref id="ref16"><label>16</label><nlm-citation citation-type="web"><person-group person-group-type="author"><name name-style="western"><surname>Peirsman</surname><given-names>Y</given-names> </name></person-group><article-title>bert-base-multilingual-uncased-sentiment</article-title><source>Hugging 
Face</source><year>2020</year><access-date>2020-12-19</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://huggingface.co/nlptown/bert-base-multilingual-uncased-sentiment">https://huggingface.co/nlptown/bert-base-multilingual-uncased-sentiment</ext-link></comment></nlm-citation></ref><ref id="ref17"><label>17</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Smit</surname><given-names>ES</given-names> </name><name name-style="western"><surname>Hoving</surname><given-names>C</given-names> </name><name name-style="western"><surname>Schelleman-Offermans</surname><given-names>K</given-names> </name><name name-style="western"><surname>West</surname><given-names>R</given-names> </name><name name-style="western"><surname>de Vries</surname><given-names>H</given-names> </name></person-group><article-title>Predictors of successful and unsuccessful quit attempts among smokers motivated to quit</article-title><source>Addict Behav</source><year>2014</year><month>09</month><volume>39</volume><issue>9</issue><fpage>1318</fpage><lpage>1324</lpage><pub-id pub-id-type="doi">10.1016/j.addbeh.2014.04.017</pub-id><pub-id pub-id-type="medline">24837754</pub-id></nlm-citation></ref><ref id="ref18"><label>18</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Gwaltney</surname><given-names>CJ</given-names> </name><name name-style="western"><surname>Metrik</surname><given-names>J</given-names> </name><name name-style="western"><surname>Kahler</surname><given-names>CW</given-names> </name><name name-style="western"><surname>Shiffman</surname><given-names>S</given-names> </name></person-group><article-title>Self-efficacy and smoking cessation: a meta-analysis</article-title><source>Psychol Addict Behav</source><year>2009</year><month>03</month><volume>23</volume><issue>1</issue><fpage>56</fpage><lpage>66</lpage><pub-id 
pub-id-type="doi">10.1037/a0013529</pub-id><pub-id pub-id-type="medline">19290690</pub-id></nlm-citation></ref><ref id="ref19"><label>19</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Von Ah</surname><given-names>D</given-names> </name><name name-style="western"><surname>Ebert</surname><given-names>S</given-names> </name><name name-style="western"><surname>Ngamvitroj</surname><given-names>A</given-names> </name><name name-style="western"><surname>Park</surname><given-names>N</given-names> </name><name name-style="western"><surname>Kang</surname><given-names>DH</given-names> </name></person-group><article-title>Factors related to cigarette smoking initiation and use among college students</article-title><source>Tob Induc Dis</source><year>2005</year><month>12</month><day>15</day><volume>3</volume><issue>1</issue><fpage>27</fpage><lpage>40</lpage><pub-id pub-id-type="doi">10.1186/1617-9625-3-1-27</pub-id><pub-id pub-id-type="medline">19570288</pub-id></nlm-citation></ref><ref id="ref20"><label>20</label><nlm-citation citation-type="web"><source>pandas&#x2014;Python Data Analysis Library homepage</source><access-date>2024-11-17</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://pandas.pydata.org/">https://pandas.pydata.org/</ext-link></comment></nlm-citation></ref><ref id="ref21"><label>21</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Virtanen</surname><given-names>P</given-names> </name><name name-style="western"><surname>Gommers</surname><given-names>R</given-names> </name><name name-style="western"><surname>Oliphant</surname><given-names>TE</given-names> </name><etal/></person-group><article-title>SciPy 1.0: fundamental algorithms for scientific computing in Python</article-title><source>Nat 
Methods</source><year>2020</year><month>03</month><day>2</day><volume>17</volume><issue>3</issue><fpage>261</fpage><lpage>272</lpage><pub-id pub-id-type="doi">10.1038/s41592-019-0686-2</pub-id></nlm-citation></ref><ref id="ref22"><label>22</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Townsend</surname><given-names>J</given-names> </name><name name-style="western"><surname>Roderick</surname><given-names>P</given-names> </name><name name-style="western"><surname>Cooper</surname><given-names>J</given-names> </name></person-group><article-title>Cigarette smoking by socioeconomic group, sex, and age: effects of price, income, and health publicity</article-title><source>BMJ</source><year>1994</year><month>10</month><day>8</day><volume>309</volume><issue>6959</issue><fpage>923</fpage><lpage>927</lpage><pub-id pub-id-type="doi">10.1136/bmj.309.6959.923</pub-id><pub-id pub-id-type="medline">7950662</pub-id></nlm-citation></ref><ref id="ref23"><label>23</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Fidler</surname><given-names>J</given-names> </name><name name-style="western"><surname>Ferguson</surname><given-names>SG</given-names> </name><name name-style="western"><surname>Brown</surname><given-names>J</given-names> </name><name name-style="western"><surname>Stapleton</surname><given-names>J</given-names> </name><name name-style="western"><surname>West</surname><given-names>R</given-names> </name></person-group><article-title>How does rate of smoking cessation vary by age, gender and social grade? 
Findings from a population survey in England</article-title><source>Addiction</source><year>2013</year><month>09</month><volume>108</volume><issue>9</issue><fpage>1680</fpage><lpage>1685</lpage><pub-id pub-id-type="doi">10.1111/add.12241</pub-id><pub-id pub-id-type="medline">23668684</pub-id></nlm-citation></ref></ref-list><app-group><supplementary-material id="app1"><label>Multimedia Appendix 1</label><p>Questions related to ChatGPT on the week-later survey.</p><media xlink:href="formative_v9i1e56973_app1.docx" xlink:title="DOCX File, 511 KB"/></supplementary-material><supplementary-material id="app2"><label>Multimedia Appendix 2</label><p>Additional demographics data.</p><media xlink:href="formative_v9i1e56973_app2.docx" xlink:title="DOCX File, 20 KB"/></supplementary-material></app-group></back></article>