<?xml version="1.0" encoding="UTF-8"?><!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "journalpublishing.dtd"><article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" dtd-version="2.0" xml:lang="en" article-type="research-article"><front><journal-meta><journal-id journal-id-type="nlm-ta">JMIR Form Res</journal-id><journal-id journal-id-type="publisher-id">formative</journal-id><journal-id journal-id-type="index">27</journal-id><journal-title>JMIR Formative Research</journal-title><abbrev-journal-title>JMIR Form Res</abbrev-journal-title><issn pub-type="epub">2561-326X</issn><publisher><publisher-name>JMIR Publications</publisher-name><publisher-loc>Toronto, Canada</publisher-loc></publisher></journal-meta><article-meta><article-id pub-id-type="publisher-id">v9i1e63257</article-id><article-id pub-id-type="doi">10.2196/63257</article-id><article-categories><subj-group subj-group-type="heading"><subject>Original Paper</subject></subj-group></article-categories><title-group><article-title>Changes in Mental State for Help-Seekers of Lifeline Australia&#x2019;s Online Chat Service: Lexical Analysis Approach</article-title></title-group><contrib-group><contrib contrib-type="author" corresp="yes"><name name-style="western"><surname>Mazzer</surname><given-names>Kelly</given-names></name><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Curll</surname><given-names>Sonia</given-names></name><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Barzinjy</surname><given-names>Hakar</given-names></name><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Goecke</surname><given-names>Roland</given-names></name><xref ref-type="aff" rid="aff2">2</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Larsen</surname><given-names>Mark</given-names></name><xref ref-type="aff" rid="aff3">3</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Batterham</surname><given-names>Philip J</given-names></name><xref ref-type="aff" rid="aff4">4</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Titov</surname><given-names>Nickolai</given-names></name><xref ref-type="aff" rid="aff5">5</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Rickwood</surname><given-names>Debra</given-names></name><xref ref-type="aff" rid="aff1">1</xref></contrib></contrib-group><aff id="aff1"><institution>Faculty of Health, University of Canberra</institution><addr-line>11 Kirinari Street, Bruce</addr-line><addr-line>Canberra</addr-line><country>Australia</country></aff><aff id="aff2"><institution>School of Systems &#x0026; Computing, University of New South Wales</institution><addr-line>Canberra</addr-line><country>Australia</country></aff><aff id="aff3"><institution>Centre for Big Data Research in Health, University of New South Wales</institution><addr-line>Sydney</addr-line><country>Australia</country></aff><aff id="aff4"><institution>Centre for Mental Health Research, Australian National University</institution><addr-line>Canberra</addr-line><country>Australia</country></aff><aff id="aff5"><institution>School of Psychological Sciences, Macquarie University</institution><addr-line>Sydney</addr-line><country>Australia</country></aff><contrib-group><contrib contrib-type="editor"><name name-style="western"><surname>Mavragani</surname><given-names>Amaryllis</given-names></name></contrib></contrib-group><contrib-group><contrib contrib-type="reviewer"><name name-style="western"><surname>Yip</surname><given-names>Paul</given-names></name></contrib></contrib-group><author-notes><corresp>Correspondence to Kelly Mazzer, Faculty of Health, University of Canberra, 11 Kirinari Street, Bruce, Canberra, 2611, Australia, 610262015266; <email>Kelly.Mazzer@canberra.edu.au</email></corresp></author-notes><pub-date pub-type="collection"><year>2025</year></pub-date><pub-date pub-type="epub"><day>20</day><month>6</month><year>2025</year></pub-date><volume>9</volume><elocation-id>e63257</elocation-id><history><date date-type="received"><day>14</day><month>06</month><year>2024</year></date><date date-type="rev-recd"><day>28</day><month>03</month><year>2025</year></date><date date-type="accepted"><day>01</day><month>04</month><year>2025</year></date></history><copyright-statement>&#x00A9; Kelly Mazzer, Sonia Curll, Hakar Barzinjy, Roland Goecke, Mark Larsen, Philip J Batterham, Nickolai Titov, Debra Rickwood. Originally published in JMIR Formative Research (<ext-link ext-link-type="uri" xlink:href="https://formative.jmir.org">https://formative.jmir.org</ext-link>), 20.6.2025. </copyright-statement><copyright-year>2025</copyright-year><license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (<ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">https://creativecommons.org/licenses/by/4.0/</ext-link>), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Formative Research, is properly cited. The complete bibliographic information, a link to the original publication on <ext-link ext-link-type="uri" xlink:href="https://formative.jmir.org">https://formative.jmir.org</ext-link>, as well as this copyright and license information must be included.</p></license><self-uri xlink:type="simple" xlink:href="https://formative.jmir.org/2025/1/e63257"/><abstract><sec><title>Background</title><p>Mental health challenges are escalating globally, with increasing numbers of individuals accessing crisis helplines through various modalities. Despite this growing demand, there is limited understanding of how crisis helplines benefit help-seekers over the course of a conversation. Affective computing has the potential to transform this area of research, yet it remains relatively unexplored, partly due to the scarcity of available helpline data.</p></sec><sec><title>Objective</title><p>This study aimed to explore the feasibility of using lexical analysis to track dynamic changes in the mental state of help-seekers during online chat conversations with a crisis helpline.</p></sec><sec sec-type="methods"><title>Methods</title><p>Lexical analysis was conducted on 6618 deidentified online chat transcripts collected by Lifeline Australia between April and June 2023 using the validated Empath lexical categories of Positive Emotion, Negative Emotion, Suffering, and Optimism. Furthermore, 2 context-specific categories, Distress and Suicidality, were also developed and analyzed to reflect crisis support language. Correlation analyses evaluated the relationships between the 6 lexical categories. One-way ANOVAs assessed changes in each lexical category across 3 conversation phases (beginning, middle, and end). Trend analyses using regression modeling examined the direction and strength of changes in lexical categories across 9 overlapping conversation windows (20% size and 50% step overlap).</p></sec><sec sec-type="results"><title>Results</title><p>Significant changes were observed across conversation phases. The context-specific categories showed the strongest improvements from the beginning to end phase of conversation, with a large reduction in Distress (<italic>d</italic>=0.79) and a moderate reduction in Suicidality (<italic>d</italic>=0.49). The most frequently occurring terms representing Distress were &#x201C;hard,&#x201D; &#x201C;bad,&#x201D; and &#x201C;down,&#x201D; and for Suicidality were &#x201C;suicide,&#x201D; &#x201C;stop,&#x201D; and &#x201C;hurt.&#x201D; The negatively framed Empath categories also significantly reduced, with moderate effect sizes for Suffering (<italic>d=</italic>0.49) and Negative Emotion (<italic>d=</italic>0.39). There were also significant but small reductions in the positively framed Empath categories of Positive Emotion (<italic>d=</italic>0.15) and Optimism (<italic>d=</italic>0.07) from the beginning to end phase of conversation. Correlation coefficients indicated the lexical categories captured related but distinct constructs (<italic>r</italic>=.34 to <italic>r</italic>=0.82). Trend analyses revealed a consistent downward trajectory across most lexical categories. Distress showed the steepest decline (slope=&#x2212;0.15, <italic>R</italic>&#x00B2;=0.97), followed by Suffering (slope=&#x2212;0.11, <italic>R</italic>&#x00B2;=0.96), Negative Emotion (slope=&#x2212;0.10, <italic>R</italic>&#x00B2;=0.69), and Suicidality (slope=&#x2212;0.06, <italic>R</italic>&#x00B2;=0.88). Positive Emotion showed a slight negative trend (slope=&#x2212;0.04, <italic>R</italic>&#x00B2;=0.54), while Optimism remained relatively stable across the conversation windows (slope=0.01, <italic>R</italic>&#x00B2;=0.13).</p></sec><sec sec-type="conclusions"><title>Conclusions</title><p>This study demonstrates the feasibility of using lexical analysis to represent and monitor mental state changes during online crisis support interactions. The findings highlight the potential for integrating affective computing into crisis helplines to enhance service delivery and outcome measurement. Future research should focus on validating these findings and exploring how lexical analysis can be applied to improve real-time support to those in crisis.</p></sec></abstract><kwd-group><kwd>crisis helpline</kwd><kwd>lexical analysis</kwd><kwd>mental health</kwd><kwd>outcomes</kwd><kwd>distress</kwd><kwd>affective computing</kwd><kwd>Lexical</kwd><kwd>suicidal</kwd><kwd>suicide</kwd><kwd>help-seeker</kwd><kwd>help-seeking</kwd><kwd>emotion</kwd><kwd>chat</kwd><kwd>mental state</kwd><kwd>caregivers</kwd><kwd>digital mental health</kwd><kwd>digital health</kwd><kwd>e-health</kwd><kwd>ANOVA</kwd><kwd>feasibility study</kwd><kwd>mental health intervention</kwd><kwd>crisis support</kwd><kwd>online communities</kwd><kwd>support service</kwd><kwd>online support</kwd></kwd-group></article-meta></front><body><sec id="s1" sec-type="intro"><title>Introduction</title><sec id="s1-1"><title>Background</title><p>Crisis helplines are a critical component of mental health care systems, offering immediate, confidential, free, and often 24/7 support to individuals experiencing emotional distress [<xref ref-type="bibr" rid="ref1">1</xref>]. These services are delivered primarily via telephone, with many now offering text and web-based alternatives. Crisis supporters are usually staff members or volunteers trained in crisis and suicide intervention, with the skills and knowledge to provide support to help-seekers (also known as clients or users) and pathways to further care where needed. With the high prevalence of suicide deaths and emotional distress around the world, crisis helplines offer a cost-effective and scalable way to improve the accessibility and responsiveness of mental health and crisis care [<xref ref-type="bibr" rid="ref1">1</xref>,<xref ref-type="bibr" rid="ref2">2</xref>].</p><p>Crisis helplines face significant challenges in meeting the growing demand and diversity of help-seekers. Maintaining consistent, high-quality support across telephone and digital services is vital [<xref ref-type="bibr" rid="ref2">2</xref>], especially as digital services are often used by vulnerable groups including youth and people with disabilities [<xref ref-type="bibr" rid="ref3">3</xref>,<xref ref-type="bibr" rid="ref4">4</xref>]. Crisis helplines also need to ensure they remain flexible and adapt quickly to the evolving communication preferences and needs of help-seekers, as highlighted during the recent COVID-19 pandemic [<xref ref-type="bibr" rid="ref5">5</xref>]. These challenges, compounded by the urgency of crisis support, exacerbate the pressure on a crisis helpline&#x2019;s resources and volunteer workforce [<xref ref-type="bibr" rid="ref6">6</xref>-<xref ref-type="bibr" rid="ref8">8</xref>].</p><p>Conducting research in crisis helpline settings poses multiple challenges, many of which stem from the anonymous and one-off nature of these services [<xref ref-type="bibr" rid="ref2">2</xref>,<xref ref-type="bibr" rid="ref9">9</xref>,<xref ref-type="bibr" rid="ref10">10</xref>]. Most studies have relied on retrospective self-reports by help-seekers [<xref ref-type="bibr" rid="ref11">11</xref>], which can provide valuable insight into subjective experiences but are subject to recall biases and fail to capture fluctuations in mental state during the contact. Moreover, low completion rates (eg, 33% completion rate among chatters in one study [<xref ref-type="bibr" rid="ref3">3</xref>]) indicate potential self-selection bias, whereby help-seekers with more positive outcomes might be more likely to complete a postcontact survey. Alternative approaches, such as crisis supporter assessments, are limited by judgement biases (eg, social desirability concerns) and recall errors, while using external raters tends to be very labor-intensive with consequently small samples [<xref ref-type="bibr" rid="ref12">12</xref>]. Improved approaches are urgently needed to inform strategies aimed at enhancing service delivery [<xref ref-type="bibr" rid="ref2">2</xref>,<xref ref-type="bibr" rid="ref4">4</xref>].</p><p>Integrating affective computing approaches within the crisis helpline context presents an opportunity for a transformative shift from traditional research approaches and holds substantial promise for enhancing mental health interventions [<xref ref-type="bibr" rid="ref13">13</xref>]. Affective computing is concerned with developing systems and devices that can recognize, interpret, process, and simulate human emotions [<xref ref-type="bibr" rid="ref14">14</xref>]. These systems collect and analyze various data on users&#x2019; mental states, including text-based emotional cues, vocal tone, and physiological signals. This information is then used by researchers and service providers to understand and enhance user experience in applications such as psychiatry, teaching, and social media [<xref ref-type="bibr" rid="ref14">14</xref>].</p><p>In the helpline context, these advanced computational methods offer several ethical and practical advantages. Affective computing algorithms can be applied to large datasets, with the ability to detect meaningful patterns and insights difficult or impossible to obtain with traditional methods. Automated data collection techniques such as text or voice analysis can provide more representative and objective data than self-report of human-coded data by mitigating human judgment errors and biases (eg, recall, social desirability, and self-selection). They are also unobtrusive, imposing no additional burden on the help-seeker or crisis supporter. Crucially, affective computing techniques facilitate continuous assessment, opening possibilities for dynamic support tools and informing a deeper understanding of emotional responses and outcomes of accessing a crisis helpline [<xref ref-type="bibr" rid="ref14">14</xref>].</p><p>Natural language processing (NLP) and computational linguistics play an important role in affective computing, especially in systems designed to process and understand emotions through text. These techniques can automatically analyze the words people use to provide insight into their mental states and emotions [<xref ref-type="bibr" rid="ref15">15</xref>,<xref ref-type="bibr" rid="ref16">16</xref>]. For instance, lexical analysis using existing and widely available lexicon-based software, such as Empath and Linguistic Inquiry and Word Count (LIWC) [<xref ref-type="bibr" rid="ref17">17</xref>,<xref ref-type="bibr" rid="ref18">18</xref>], has been applied to electronic health records to detect suicide risk [<xref ref-type="bibr" rid="ref19">19</xref>] and to text-based transcripts from online therapy to predict depression symptom severity [<xref ref-type="bibr" rid="ref20">20</xref>].</p><p>The past 5 years have seen a rapid growth in studies using NLP for mental health interventions [<xref ref-type="bibr" rid="ref16">16</xref>,<xref ref-type="bibr" rid="ref17">17</xref>] and it has now moved into the crisis helpline context, providing initial support for the development of NLP-based tools to provide adjunct assistance to crisis supporters. Recent research has demonstrated the usefulness of NLP to identify and classify self-harm or suicide risk among digital help-seekers [<xref ref-type="bibr" rid="ref21">21</xref>,<xref ref-type="bibr" rid="ref22">22</xref>]. Cognitive overload among digital crisis supporters has also been shown to reduce with support from NLP-based tools, including helping to resolve writer&#x2019;s block and providing real-time information based on conversation content [<xref ref-type="bibr" rid="ref23">23</xref>,<xref ref-type="bibr" rid="ref24">24</xref>]. Furthermore, NLP can support the efficiency of crisis support, with Althoff et al [<xref ref-type="bibr" rid="ref25">25</xref>] determining via NLP techniques that more successful online crisis support involved greater time devoted to exploring solutions, as opposed to defining problems.</p><p>However, few studies so far have applied NLP to understand help-seeker outcomes from crisis support. This is an important area to explore, as developing innovative ways to monitor and evaluate help-seeker outcomes is essential to maintaining quality service provision and informing service improvements [<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref13">13</xref>]. Althoff et al [<xref ref-type="bibr" rid="ref25">25</xref>] applied LIWIC to explore changes in help-seeker sentiment, being the relative proportion of positive to negative words, they demonstrated a trend toward a more positive perspective over the conversation, with a notable increase at the very end of the conversation. Progressing this area of research requires access to data from service providers, which necessitates sensitively and appropriately navigating protective regulations concerning data confidentiality and ethical considerations of help-seeker privacy [<xref ref-type="bibr" rid="ref16">16</xref>,<xref ref-type="bibr" rid="ref26">26</xref>].</p></sec><sec id="s1-2"><title>Current Study</title><p>This study is among the first to apply lexical analysis to explore changes in the frequency and intensity of language associated with mental states used by help-seekers over the duration of a single online chat conversation with a crisis helpline. Implementing lexical analysis overcomes many of the usual barriers to research in helplines. Specifically, it removes the need for human annotation, thereby eliminating the risks of annotator fatigue and bias, avoiding the resource heavy training of annotators, achieving greater efficiency and objectivity, and allowing for the analysis of a much larger amount of data [<xref ref-type="bibr" rid="ref4">4</xref>,<xref ref-type="bibr" rid="ref12">12</xref>,<xref ref-type="bibr" rid="ref27">27</xref>]. This study aims to provide a proof-of-concept for using NLP to monitor the mental state of help-seekers. While some previous research has used NLP to explore broad changes in help-seekers&#x2019; positive and negative sentiment [eg, <xref ref-type="bibr" rid="ref25">25</xref>], in the current study we analyze a wider range of general mental states (Positive Emotion, Negative Emotion, Suffering, and Optimism) and crisis-specific mental states (Distress and Suicidality). In addition, our novel use of Empath allowed us to go beyond frequency (word counts) to examine context and reflect intensity, allowing a richer understanding of changes in help-seeker mental states. Our analyses examined trends across the crisis intervention including over 9 overlapping conversation windows as well as at the beginning, middle and end phases using a large deidentified dataset from Lifeline Australia&#x2019;s online chat service.</p></sec></sec><sec id="s2" sec-type="methods"><title>Methods</title><sec id="s2-1"><title>Data</title><p>For more than 60 years, Lifeline has been operating as Australia&#x2019;s national, free 24-hour telephone crisis support service. In recent years, Lifeline has also expanded its service delivery to also offer 24-hour digital support via text messaging and online chat services with crisis supporters [<xref ref-type="bibr" rid="ref6">6</xref>]. Lifeline Australia provided a census of routinely collected data from all contacts made to their online chat service for 3 months from April to June 2023, totaling 20,569 contacts of varying lengths that were answered by a crisis supporter. Consistent with previous research [<xref ref-type="bibr" rid="ref12">12</xref>], after excluding automated or chatbot messages, all conversations with 10 or more messages from the help-seeker were retained for analysis (N=6618). Data included the date of contact, time of each message, number of messages per conversation, and the content of messages from both the help-seeker and crisis supporter during the conversation. Help-seeker demographics were not available.</p></sec><sec id="s2-2"><title>Preprocessing</title><p>Lifeline Australia does not systematically collect identifiable information; however, any incidental identifying information contained in the messages were scrubbed before access and analysis. Data was divided into help-seeker or crisis supporter messages. Conversations were then split into equal thirds, based on total number of messages in the conversation, to create a beginning, middle, and end phase of each conversation. Conversations were also split into 9 overlapping conversation windows, using a 20% window size with a 50% step overlap, meaning that each subsequent window started at the midpoint of the previous window. Text was converted to lowercase and tokenized into individual words. The Porter Stemmer from The Natural Language Toolkit [<xref ref-type="bibr" rid="ref28">28</xref>] was used to stem words by removing common morphological affixes and reducing words to their root forms, which enabled the capture of various word forms (&#x201C;suicid*&#x201D; to capture &#x201C;suicide&#x201D;, &#x201C;suicidal&#x201D;, &#x201C;suicidality,&#x201D; etc). In addition, n-grams, specifically bigrams, was used to capture meaningful word pairs (2-word phrases) as tokens [<xref ref-type="bibr" rid="ref29">29</xref>], which provided a more accurate representation of the text&#x2019;s semantic content (eg, &#x201C;harm myself&#x201D; as a single Suicidality term). All remaining messages from help-seekers were included in analysis; crisis supporter messages were not analyzed. <xref ref-type="table" rid="table1">Table 1</xref> provides descriptive details of the dataset following preprocessing.</p><table-wrap id="t1" position="float"><label>Table 1.</label><caption><p>Total counts, means, and SDs of help-seeker messages and lexical terms included in the final analyses for each online chat conversation (N=6618) and conversation phase (beginning, middle, and end).</p></caption><table id="table1" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Help-seeker data</td><td align="left" valign="bottom">Total count, n</td><td align="left" valign="bottom">Per conversation, mean (SD)</td><td align="left" valign="bottom">Per third<sup><xref ref-type="table-fn" rid="table1fn1">a</xref></sup>, mean (SD)</td></tr></thead><tbody><tr><td align="left" valign="top">Messages</td><td align="left" valign="top">201,955</td><td align="left" valign="top">30.52 (20.55)</td><td align="left" valign="top">10.17 (6.86)</td></tr><tr><td align="left" valign="top">Terms<sup><xref ref-type="table-fn" rid="table1fn2">b</xref></sup></td><td align="left" valign="top">309,628</td><td align="left" valign="top">46.79 (26.67)</td><td align="left" valign="top">15.60 (10.83)</td></tr></tbody></table><table-wrap-foot><fn id="table1fn1"><p><sup>a</sup>Thirds were created based on number of messages.</p></fn><fn id="table1fn2"><p><sup>b</sup>Terms represent key words used in conversation, also known as tokens.</p></fn></table-wrap-foot></table-wrap></sec><sec id="s2-3"><title>Empath Software</title><p>Empath is an open-source Python (Python Software Foundation) library and text analysis tool that can perform NLP tasks including lexical analysis. Empath contains around 200 data-driven emotional and topical categories, also known as lexicons, which have been validated through a combination of NLP and human validation. Empath uses a large dataset to evaluate text and assign lexical degree scores based on the presence of predefined categories related to emotions, behaviors, and themes [<xref ref-type="bibr" rid="ref17">17</xref>]. Empath lexicons are recognized as highly correlated to LIWC&#x2019;s gold-standard categories (<italic>r</italic>=0.91) [<xref ref-type="bibr" rid="ref17">17</xref>,<xref ref-type="bibr" rid="ref18">18</xref>]. Each category has a large list of member terms (words) that represent the category; for example, the category of Optimism includes terms such as &#x201C;hopeful,&#x201D; &#x201C;perseverance,&#x201D; and &#x201C;progress&#x201D; [<xref ref-type="bibr" rid="ref17">17</xref>]. Refer to <xref ref-type="table" rid="table2">Table 2</xref> for the top 10 frequently occurring member terms for each category used in the current study.</p><table-wrap id="t2" position="float"><label>Table 2.</label><caption><p>Characteristics of the lexical categories used in the analyses, including source, top 10 terms, total terms, total occurrences, and means and SDs of terms per conversation (N=6618).</p></caption><table id="table2" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Category</td><td align="left" valign="bottom">Empath or contextual</td><td align="left" valign="bottom">Top 10 terms<sup><xref ref-type="table-fn" rid="table2fn1">a</xref></sup></td><td align="left" valign="bottom">Total terms<sup><xref ref-type="table-fn" rid="table2fn2">b</xref></sup></td><td align="left" valign="bottom">Total occurrences<sup><xref ref-type="table-fn" rid="table2fn3">c</xref></sup></td><td align="left" valign="bottom">Mean (SD) per conversation</td></tr></thead><tbody><tr><td align="left" valign="top">Negative Emotion</td><td align="left" valign="top">Empath</td><td align="left" valign="top">Want, think, see, hard, bad, care, stop, hurt, scary or scar*, and die</td><td align="left" valign="top">94</td><td align="left" valign="top">73,008</td><td align="left" valign="top">11.03 (7.09)</td></tr><tr><td align="left" valign="top">Positive Emotion</td><td align="left" valign="top">Empath</td><td align="left" valign="top">Feel*, friend*, better, keep, family or famili*, care, love, understand, hope, and happi*</td><td align="left" valign="top">75</td><td align="left" valign="top">43,666</td><td align="left" valign="top">6.60 (4.57)</td></tr><tr><td align="left" valign="top">Suffering</td><td align="left" valign="top">Empath</td><td align="left" valign="top">Feel*, bad, hurt, die, long, depress*, wors*, kill, pain*, and cry or cri*</td><td align="left" valign="top">127</td><td align="left" valign="top">42,125</td><td align="left" valign="top">6.37 (4.28)</td></tr><tr><td align="left" valign="top">Optimism</td><td align="left" valign="top">Empath</td><td align="left" valign="top">Feel*, like, will, thank, sure, better, love, hope*, happy or happi*, and appreci*</td><td align="left" valign="top">81</td><td align="left" valign="top">47,442</td><td align="left" valign="top">7.17 (4.20)</td></tr><tr><td align="left" valign="top">Distress</td><td align="left" valign="top">Contextual</td><td align="left" valign="top">Hard, bad, down, hurt, scary or scar*, struggl*, alon*, depress*, stress*, and wors*</td><td align="left" valign="top">137</td><td align="left" valign="top">53,423</td><td align="left" valign="top">8.07 (5.71)</td></tr><tr><td align="left" valign="top">Suicidality</td><td align="left" valign="top">Contextual</td><td align="left" valign="top">Suicid*, stop*, hurt, die, kill, hate, pain*, plan, harm*, and safe*</td><td align="left" valign="top">163</td><td align="left" valign="top">31,428</td><td align="left" valign="top">4.75 (3.98)</td></tr></tbody></table><table-wrap-foot><fn id="table2fn1"><p><sup>a</sup>Top 10 terms represents 10 most frequently occurring terms in the dataset for each category, ranked in order of frequency.</p></fn><fn id="table2fn2"><p><sup>b</sup>Total terms are the total number of member terms or words representing a category. Count does not include member terms where a single term represents the name of another Empath category. For example, Death is an Empath category as well as a member term of Suffering<italic>;</italic> all of Death&#x2019;s 81 member terms would be identified as instances of Suffering<italic>,</italic> but are not included in the total terms value.</p></fn><fn id="table2fn3"><p><sup>c</sup>Total occurrences are the total count of occurrences of member terms or words in conversations.</p></fn></table-wrap-foot></table-wrap></sec><sec id="s2-4"><title>Lexical Categories</title><sec id="s2-4-1"><title>Empath Categories</title><p>All validated Empath categories were reviewed and 4 were selected for inclusion as they best represented concepts that help-seekers may aim to improve by contacting a crisis helpline like Lifeline. The 4 categories were: Negative Emotion, Positive Emotion, Suffering, and Optimism. Lexical degree scores, ranging from 0 to 1, were assigned to text for the Empath categories of Negative Emotion, Positive Emotion, Suffering, and Optimism. A higher score represents a greater proportion of words present in the text that fall into a category. For example, a degree score of 0.7 for Suffering would indicate a very high occurrence of Suffering-related words in the conversation.</p></sec><sec id="s2-4-2"><title>Contextual Categories</title><p>There is a risk that lexicons designed to understand general linguistic patterns, such as the Empath categories, may not be appropriate for highly domain specific tasks [<xref ref-type="bibr" rid="ref30">30</xref>]. Thus, in addition to the 4 Empath categories, 2 new categories were derived for analysis. The categories of Distress and Suicidality are highly context specific; reducing distress and suicidality are 2 of the highest priority outcomes for help-seekers accessing Lifeline services [<xref ref-type="bibr" rid="ref31">31</xref>].</p><p>Lexical categories representing Distress and Suicidality specific to the crisis helpline context were developed using a multistep process with input from various expert groups, including researchers, service providers, and people with lived experience. First, a team (n=8) of experienced crisis supporters from Lifeline Australia reviewed a sample of 200 online chat and text transcripts from a separate dataset not used in the current study. These crisis supporters received a training session from the research team (KM) on how to identify relevant keywords. They were also provided with written guidelines and examples to ensure consistency in their approach. The keywords identified by the crisis supporters were then collated and reviewed by the research team (KM and SC). The resulting list was then shared with several expert groups for further input and refinement, including Lifeline&#x2019;s lived experience advisory group, online chat service team leaders, and Lifeline&#x2019;s clinical practice team. The research team conducted a final review of all inputs, with any disagreements or ambiguous terms resolved through team discussion. Further refinement of keywords was undertaken using manual annotation of a random sample of 100 transcripts used in the current study (SC).</p><p>The same Empath lexical degree scoring system could not be applied for Distress and Suicidality as they were not pre-existing Empath categories. Instead, the lexical analysis of the contextual categories, Distress and Suicidality, were based on mean counts of terms present within the text. The mean of Distress represented the average number of occurrences of Distress member terms in a conversation.</p><p>The category of Distress had a total of 137 terms that occurred 53,423 times in the dataset; the top 10 Distress terms accounted for 40.26% (n=21,510) of these occurrences with &#x201C;hard&#x201D; being the most frequently occurring term (n=3118), followed by &#x201C;bad&#x201D; (n=2884), and &#x201C;down&#x201D; (n=2411).The Suicidality category had 163 total terms that occurred 31,428 times; the top 10 Suicidality terms accounted for 56.72% (n=17,825) of occurrences with &#x201C;suicid*&#x201D; occurring most frequently (n=2885), followed by &#x201C;stop*&#x201D; (n=2306), and &#x201C;hurt&#x201D; (n=2174).</p></sec></sec><sec id="s2-5"><title>Statistical Analysis</title><p>Pearson correlations were conducted based on the number of term occurrences to determine the strength of relationship between the 6 lexical categories. Lexical analyses were conducted to examine changes in mental state over the phases (beginning, middle, and end) of an online chat conversation with a help-seeker. One-way ANOVA was performed to determine whether the degree of occurrence of each category was significantly different between the start, middle, and end phases of conversation. Post hoc <italic>t</italic> tests were also conducted to determine which phases of conversation were significantly different from one another. Trend analysis and linear regression were then performed on the mean token counts across 9 overlapping conversation windows to determine the direction (slope) and magnitude (<italic>R</italic>&#x00B2;) of change within each lexical category. This method allowed better understanding of the dynamic change across conversations. <xref ref-type="fig" rid="figure1">Figure 1</xref> shows the workflow of analyses and included categories.</p><fig position="float" id="figure1"><label>Figure 1.</label><caption><p>Overview of the design and structure of the study, including the lexical categories and conversation phases used in the analyses.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="formative_v9i1e63257_fig01.png"/></fig></sec><sec id="s2-6"><title>Ethical Considerations</title><p>This study was approved by the University of Canberra&#x2019;s Human Research Ethics Committee (approval no. 4673). The data that were analyzed were collected routinely by Lifeline Australia. Due to the anonymity of Lifeline Australia help-seekers, there was no opportunity to obtain specific consent from individuals to use their data. However, all Lifeline Australia help-seekers are informed that their personal data may be used to conduct research, evaluation, and assurance activities. No identifying information (eg, phone number, email address, or help-seeker name) were provided in the dataset. Deidentified data were stored and analyzed in a secure, Lifeline owned and managed environment.</p></sec></sec><sec id="s3" sec-type="results"><title>Results</title><sec id="s3-1"><title>Overview</title><p>Descriptive statistics of conversation length are presented, followed by correlations between all categories. Results for each of the Empath categories of Negative Emotion, Positive Emotion, Suffering and Optimism, are presented as means and SD of lexical degree scores for all conversations separated into the beginning, middle, and end phases of conversation. The contextual categories of Distress and Suicidality are presented as mean occurrences of terms across all conversations in the beginning, middle, and end phases. Tests of significance are reported for changes in each category over the phases of conversation.</p></sec><sec id="s3-2"><title>Descriptive Statistics</title><p>Conversations included in the final analyses had a range of 10 to 382 help-seeker messages (mean 30.52, SD 20.55; <xref ref-type="table" rid="table1">Table 1</xref>). A total of 309,628 occurrences of terms from all included lexical categories were identified, with a mean of 46.79 (SD 26.67) occurrences of terms per conversation. Negative Emotion had the highest occurrences of terms at 73,008, followed by Distress with 53,423. Note that categories can and do include overlapping member terms; in fact, similarity comparisons are used in Empath&#x2019;s mapping of vocabulary to categories [<xref ref-type="bibr" rid="ref17">17</xref>]. &#x201C;Feel*&#x201D; (feel, feels, feeling, and feelings) was among the most frequently occurring words for many of the emotion-based categories. <xref ref-type="table" rid="table2">Table 2</xref> provides descriptions of the categories and their occurrence at the conversation level.</p></sec><sec id="s3-3"><title>Correlations</title><p><xref ref-type="table" rid="table3">Table 3</xref> presents the correlations between mean number of occurrences across the categories. Positive Emotion and Optimism had the strongest relationship (<italic>r</italic>=0.82), whereby when a help-seeker expresses positive emotions they are also likely to use optimistic language. The next strongest correlations were between Distress with both Suffering (<italic>r</italic>=0.81) and Negative Emotion (<italic>r</italic>=0.77). These indicate that help-seekers experiencing high level of distress are also likely to express a lot of suffering and negative emotion. Correlations between all categories revealed significant, <italic>P</italic>&#x003C;.001, medium, or strong positive relationships (<italic>r</italic>=0.34 to 0.82), likely reflecting the shared foundation of emotion and emotion-related terms that each of these categories is defined by. No categories had correlations higher than <italic>r=</italic>0.82, suggesting each category represented a distinct construct.</p><table-wrap id="t3" position="float"><label>Table 3.</label><caption><p>A correlation matrix showing the relationships between mean lexical category occurrences in help-seeker online chat messages.</p></caption><table id="table3" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Lexical category<sup><xref ref-type="table-fn" rid="table3fn1">a</xref></sup></td><td align="left" valign="bottom">1</td><td align="left" valign="bottom">2</td><td align="left" valign="bottom">3</td><td align="left" valign="bottom">4</td><td align="left" valign="bottom">5</td></tr></thead><tbody><tr><td align="left" valign="top">Negative Emotion</td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top">Positive Emotion</td><td align="left" valign="top">.71</td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top">Suffering</td><td align="left" valign="top">.63</td><td align="left" valign="top">.68</td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top">Optimism</td><td align="left" valign="top">.63</td><td align="left" valign="top">.82</td><td align="left" valign="top">.63</td><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top">Distress</td><td align="left" valign="top">.77</td><td align="left" valign="top">.67</td><td align="left" valign="top">.81</td><td align="left" valign="top">.64</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top">Suicidality</td><td align="left" valign="top">.62</td><td align="left" valign="top">.38</td><td align="left" valign="top">.58</td><td align="left" valign="top">.34</td><td align="left" valign="top">.45</td></tr></tbody></table><table-wrap-foot><fn id="table3fn1"><p><sup>a</sup><italic>P</italic>&#x003C;.001.</p></fn></table-wrap-foot></table-wrap></sec><sec id="s3-4"><title>Changes in Emotions by Phase of Conversation</title><p><xref ref-type="fig" rid="figure2">Figure 2</xref> presents the mean occurrence of terms by category for the beginning, middle, and end phases of the conversation. Except for Optimism, all categories revealed a pattern of reduction in the number of term occurrences from the beginning phase of conversation to the end. Surprisingly, this includes the positively framed category of Positive Emotion<italic>,</italic> which would be expected to increase during a contact with Lifeline&#x2019;s online chat service.</p><fig position="float" id="figure2"><label>Figure 2.</label><caption><p>Mean occurrences of lexical category terms across 3 phases of help-seeker online chat conversation (beginning, middle, and end).</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="formative_v9i1e63257_fig02.png"/></fig></sec><sec id="s3-5"><title>Lexical Analyses</title><sec id="s3-5-1"><title>Empath Categories by Conversation Phase</title><p><xref ref-type="table" rid="table4">Table 4</xref> presents the lexical degree scores for all 4 Empath categories by phase of conversation. Help-seekers most frequently used terms related to Negative Emotion across all 3 phases. Both negative categories, Negative Emotion (<italic>F</italic><sub>19851,2</sub>=273.68, <italic>P</italic>&#x003C;.001) and Suffering (<italic>F</italic><sub>19851,2</sub>=424.30, <italic>P</italic>&#x003C;.001) significantly improved from the beginning, to middle, to end phase of conversation with both demonstrating medium effect sizes from beginning to end of conversation (<italic>d</italic>=0.39 and <italic>d</italic>=0.49, respectively). Surprisingly, Positive Emotion (<italic>F</italic><sub>19851,2</sub>=54.42, <italic>P</italic>&#x003C;.001) and Optimism (<italic>F</italic><sub>19851,2</sub>=70.49, <italic>P</italic>&#x003C;.001) also significantly reduced in the end phase of conversation compared to the beginning, although only with weak effect sizes (<italic>d</italic>=0.15 and <italic>d</italic>=0.07, respectively). Note that the pattern of results based on mean occurrence was similar to the pattern of results based on mean lexical degree score for all categories except Optimism (<xref ref-type="fig" rid="figure2">Figure 2</xref>).</p><table-wrap id="t4" position="float"><label>Table 4.</label><caption><p>One-way ANOVA and post hoc <italic>t</italic> tests comparing lexical degree scores across conversation phases (beginning, middle, and end) for Empath lexical categories.</p></caption><table id="table4" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom" rowspan="2">Lexical category</td><td align="left" valign="bottom" rowspan="2"><italic>F</italic> test (<italic>df</italic>)</td><td align="left" valign="bottom" colspan="3">Mean lexical degree score (SD)<sup><xref ref-type="table-fn" rid="table4fn2">b</xref></sup></td><td align="left" valign="bottom" colspan="3">Cohen <italic>d</italic></td></tr><tr><td align="left" valign="bottom">Beginning</td><td align="left" valign="bottom">Middle</td><td align="left" valign="bottom">End</td><td align="left" valign="bottom">Beginning-middle</td><td align="left" valign="bottom">Middle-end</td><td align="left" valign="bottom">Beginning-end</td></tr></thead><tbody><tr><td align="left" valign="top">Negative Emotion</td><td align="left" valign="top">273.68<sup><xref ref-type="table-fn" rid="table4fn1">a</xref></sup> (19851,2)</td><td align="left" valign="top">0.0248<sup><xref ref-type="table-fn" rid="table4fn2">b</xref></sup> (0.0224)</td><td align="left" valign="top">0.0228<sup><xref ref-type="table-fn" rid="table4fn3">c</xref></sup> (0.0210)</td><td align="left" valign="top">0.0166<sup><xref ref-type="table-fn" rid="table4fn4">d</xref></sup> (0.0198)</td><td align="left" valign="top">0.09</td><td align="left" valign="top">0.31</td><td align="left" valign="top">0.39</td></tr><tr><td align="left" valign="top">Positive Emotion</td><td align="left" valign="top">54.42<sup><xref ref-type="table-fn" rid="table4fn1">a</xref></sup> (19851,2)</td><td align="left" valign="top">0.0129<sup><xref ref-type="table-fn" rid="table4fn2">b</xref></sup>(0.0153)</td><td align="left" valign="top">0.0107<sup><xref ref-type="table-fn" rid="table4fn3">c</xref></sup> (0.0130)</td><td align="left" valign="top">0.0106<sup><xref ref-type="table-fn" rid="table4fn3">c</xref></sup> (0.0147)</td><td align="left" valign="top">0.15</td><td align="left" valign="top">0.01</td><td align="left" valign="top">0.15</td></tr><tr><td align="left" valign="top">Suffering</td><td align="left" valign="top">424.30<sup><xref ref-type="table-fn" rid="table4fn1">a</xref></sup> (19851,2)</td><td align="left" valign="top">0.0134<sup><xref ref-type="table-fn" rid="table4fn2">b</xref></sup> (0.0162)</td><td align="left" valign="top">0.0090<sup><xref ref-type="table-fn" rid="table4fn3">c</xref></sup> (0.0131)</td><td align="left" valign="top">0.0065<sup><xref ref-type="table-fn" rid="table4fn4">d</xref></sup> (0.0118)</td><td align="left" valign="top">0.30</td><td align="left" valign="top">0.20</td><td align="left" valign="top">0.49</td></tr><tr><td align="left" valign="top">Optimism</td><td align="left" valign="top">70.49<sup><xref ref-type="table-fn" rid="table4fn1">a</xref></sup> (19851,2)</td><td align="left" valign="top">0.0077<sup><xref ref-type="table-fn" rid="table4fn2">b</xref></sup> (0.0121)</td><td align="left" valign="top">0.0054<sup><xref ref-type="table-fn" rid="table4fn3">c</xref></sup> (0.0094)</td><td align="left" valign="top">0.0068<sup><xref ref-type="table-fn" rid="table4fn4">d</xref></sup> (0.0120)</td><td align="left" valign="top">0.21</td><td align="left" valign="top">&#x2013;0.13</td><td align="left" valign="top">0.07</td></tr></tbody></table><table-wrap-foot><fn id="table4fn1"><p><sup>a</sup><italic>P</italic>&#x003C;.001.</p></fn><fn id="table4fn2"><p><sup>b</sup>Differing (b,c,d) superscripts represents differences at <italic>P</italic>&#x003C;.001 between conversation phases. Where the same superscript is shown across row (b,b), the conversation phases did not differ significantly.</p></fn><fn id="table4fn3"><p><sup>c</sup>Differing (b,c,d) superscripts represents differences at <italic>P</italic>&#x003C;.001 between conversation phases. Where the same superscript is shown (c,c), the conversation phases did not differ significantly.</p></fn><fn id="table4fn4"><p><sup>d</sup>Differing (b,c,d) superscripts represents differences at <italic>P</italic>&#x003C;.001 between conversation phases.</p></fn></table-wrap-foot></table-wrap></sec><sec id="s3-5-2"><title>Contextual Categories by Conversation Phase</title><p><xref ref-type="table" rid="table5">Table 5</xref> presents changes in Distress and Suicidality based on the mean number of occurrences of terms. Both contextual categories significantly improved from the beginning, to middle, to end phase of conversation (Distress <italic>F</italic><sub>19851,2</sub>=1338.07, <italic>P</italic>&#x003C;.001 and Suicidality <italic>F</italic><sub>19851,2</sub>=421.45, <italic>P</italic>&#x003C;.001). Distress had the strongest effect size of any category (Cohen <italic>d</italic>=0.79), in its reduction from the beginning to the end of the conversation. Suicidality was also among the strongest effects of all categories with Cohen <italic>d</italic>=0.49 from the beginning to the end of the conversation.</p><table-wrap id="t5" position="float"><label>Table 5.</label><caption><p>One-way ANOVA and post hoc <italic>t</italic> tests comparing mean number of occurrences across conversation phases (beginning, middle, and end) for contextual lexical categories.</p></caption><table id="table5" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom" rowspan="2">Category</td><td align="left" valign="bottom" rowspan="2"><italic>F</italic><sup><xref ref-type="table-fn" rid="table5fn1">a</xref></sup> test (<italic>df</italic>)</td><td align="left" valign="bottom" colspan="3">Mean (SD)<sup><xref ref-type="table-fn" rid="table5fn2">b</xref></sup></td><td align="left" valign="bottom" colspan="3">Cohen <italic>d</italic></td></tr><tr><td align="left" valign="bottom">Beginning</td><td align="left" valign="bottom">Middle</td><td align="left" valign="bottom">End</td><td align="left" valign="bottom">Beginning-middle</td><td align="left" valign="bottom">Middle-end</td><td align="left" valign="bottom">Beginning-end</td></tr></thead><tbody><tr><td align="left" valign="top">Distress</td><td align="left" valign="top">1338.07<sup><xref ref-type="table-fn" rid="table5fn1">a</xref></sup> (19851,2)</td><td align="left" valign="top">3.64<sup><xref ref-type="table-fn" rid="table5fn2">b</xref></sup> (2.89)</td><td align="left" valign="top">2.73<sup><xref ref-type="table-fn" rid="table5fn3">c</xref></sup> (2.45)</td><td align="left" valign="top">1.70<sup><xref ref-type="table-fn" rid="table5fn4">d</xref></sup> (1.93)</td><td align="left" valign="top">0.34</td><td align="left" valign="top">0.47</td><td align="left" valign="top">0.79</td></tr><tr><td align="left" valign="top">Suicidality</td><td align="left" valign="top">421.45<sup><xref ref-type="table-fn" rid="table5fn1">a</xref></sup> (19851,2)</td><td align="left" valign="top">1.93<sup><xref ref-type="table-fn" rid="table5fn2">b</xref></sup> (1.98)</td><td align="left" valign="top">1.73<sup><xref ref-type="table-fn" rid="table5fn3">c</xref></sup> (1.81)</td><td align="left" valign="top">1.08<sup><xref ref-type="table-fn" rid="table5fn4">d</xref></sup> (1.46)</td><td align="left" valign="top">0.11</td><td align="left" valign="top">0.40</td><td align="left" valign="top">0.49</td></tr></tbody></table><table-wrap-foot><fn id="table5fn1"><p><sup>a</sup><italic>P</italic>&#x003C;.001.</p></fn><fn id="table5fn2"><p><sup>b</sup>Differing (b,c,d) superscripts represents differences at <italic>P</italic>&#x003C;.001 between conversation phases. Where the same superscript is shown acros row (b,b), the conversation phases did not differ significantly.</p></fn><fn id="table5fn3"><p><sup>c</sup>Differing (b,c,d) superscripts represents differences at <italic>P</italic>&#x003C;.001 between conversation phases.</p></fn><fn id="table5fn4"><p><sup>d</sup>Differing (b,c,d) superscripts represents differences at <italic>P</italic>&#x003C;.001 between conversation phases.</p></fn></table-wrap-foot></table-wrap></sec></sec><sec id="s3-6"><title>Trend Analyses</title><p>Regression results indicated a consistent downward trajectory for Distress (slope=&#x2212;0.1471, <italic>R</italic>&#x00B2;=0.9741), Suicidality (slope=&#x2212;0.0636, <italic>R</italic>&#x00B2;=0.8821), Negative Emotion (slope=&#x2212;0.1017, <italic>R</italic>&#x00B2;=0.6937), and Suffering (slope=&#x2212;0.1053, <italic>R</italic>&#x00B2;=0.9644), suggesting a steady decline in the expression of these categories over the course of the conversations (<xref ref-type="fig" rid="figure3">Figure 3</xref>). Among these, Distress maintained the steepest decline, aligning with findings from previous analyses demonstrating significant reductions in distress-related language.</p><fig position="float" id="figure3"><label>Figure 3.</label><caption><p>Trend of mean occurrences for negative lexical categories (Negative Emotion, Distress, Suffering, Suicidality) across 9 overlapping conversation windows.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="formative_v9i1e63257_fig03.png"/></fig><p>Positive Emotion also displayed a slight negative trend (slope=&#x2212;0.0359, <italic>R</italic>&#x00B2;=0.5372), but its decline was less pronounced compared with the negatively framed categories. On the other hand, optimism remained relatively stable, with a weak positive slope (slope=0.0080, <italic>R</italic>&#x00B2;=0.1253), which indicates minimal variation across the conversation windows (<xref ref-type="fig" rid="figure4">Figure 4</xref>).</p><fig position="float" id="figure4"><label>Figure 4.</label><caption><p>Trend of mean occurrences for positive lexical categories (Positive Emotion, and Optimism) across 9 overlapping conversation windows.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="formative_v9i1e63257_fig04.png"/></fig><p>The strength of the regression models varied across categories. Distress, Suicidality, and Suffering, had high <italic>R</italic>&#x00B2; values, indicating strong model fit and predictable changes over time. In contrast, Optimism had the lowest explanatory power, suggesting that its variations may be influenced by additional conversational factors not captured by the linear model. Table S1 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref> provides means and SD for each category across the 9 windows.</p></sec></sec><sec id="s4" sec-type="discussion"><title>Discussion</title><sec id="s4-1"><title>Principal Findings</title><p>In this study, lexical analysis was combined with traditional statistical techniques to detect changes in language associated with the mental state of help-seekers accessing a chat-based national crisis helpline. Results provide meaningful new insights into how people interact with crisis chat helplines. Crucially, this research is the first to demonstrate the feasibility of a novel methodological approach that may facilitate unobtrusive, objective, and real-time assessment of help-seeker outcomes, with the potential to enhance the effectiveness and efficiency of crisis helplines globally.</p><p>Use of negative language reduced across each phase of the crisis chat conversation, from beginning, middle, to end. This pattern was evident across all categories representing negative mental states (Negative Emotion, Suffering, Distress, and Suicidality). Trend analyses across 9 overlapping conversation windows showed a small increase in use of negative language from the first to second window, followed by decreases across the remaining windows. These findings are consistent with meta-analytical evidence for the overall effectiveness of crisis helplines in reducing emotional distress and risk of suicide [<xref ref-type="bibr" rid="ref9">9</xref>,<xref ref-type="bibr" rid="ref13">13</xref>], providing validation for our approach. Specific to the chat modality, previous evidence based on help-seeker self-report has found that experiences of distress and feeling suicidal reduced pre-post contact [<xref ref-type="bibr" rid="ref3">3</xref>]. The current findings strengthen support for this outcome by demonstrating a similar decline in distress and suicidality during the conversation, using an approach unaffected by selection bias (ie, that only help-seekers who felt better or less suicidal completed the postcontact measures). Reducing distress is a core pillar of crisis helplines and has been identified as the most important outcome for help-seekers [<xref ref-type="bibr" rid="ref31">31</xref>]. Distress had the largest reduction over the conversations in the current study, showing a welcome marker of the effectiveness of crisis helplines.</p><p>The reduction in suicidality-related words is also encouraging and aligns with suicide prevention as a key objective of service delivery for crisis helplines [<xref ref-type="bibr" rid="ref31">31</xref>]. More than 90% of conversations in the current study involved suicidality-related content. Disclosures and discussions about suicide in a helpline context can occur at different stages of the contact depending on the needs of the help-seeker. While any immediate risk of suicide is addressed as soon as it is identified (beginning stage), for other help-seekers the sensitivity of the issue means it may be better discussed after rapport has been established (middle stage) [<xref ref-type="bibr" rid="ref32">32</xref>]. That the largest reduction in suicidality-related words occurred in the end phase of the conversation in this study supports this notion. The trend analysis further confirms this finding, as Suicidality maintained a downward trajectory across the conversation windows, indicating that the largest reduction in suicidality-related words occurred toward the later stages of the conversation. However, it is important to consider that these aggregate results mask individual variations. The timing of disclosure might also vary between telephone versus digital services, with previous research suggesting greater digital disclosure of sensitive and stigmatized issues among youth [<xref ref-type="bibr" rid="ref33">33</xref>]. Future studies exploring typical patterns in how and when suicidality is disclosed and discussed across different modalities are needed.</p><p>Contrary to expectations, there was a trend toward less expression of positive language across the conversation. Positive Emotion was higher in the beginning, compared with the middle and end phases, although these effects were weak. Findings based on lexical degree scores indicated that optimism was also highest in the beginning, although average word use was highest in the end phase of the conversation. Trend analyses across 9 overlapping segments also showed a slight decline in Positive Emotion, while Optimism was relatively stable. Unlike simple word occurrence counts, lexical degree scores account for term associations and strengths within a category, and hence these approaches can show some, though not substantive, divergence of results across conversation phases. Rather than indicating ineffectiveness, we suggest the heightened initial positive mental state may reflect hope or relief from deciding to seek help. In addition, the crisis supporter&#x2019;s model of practice is to, first, establish a connection with the help-seeker and then, second, explore their concerns, at which stage an understandable reduction in positive language may occur. Moreover, previous research indicates that most help-seekers do not access crisis support to achieve a positive emotional state but to alleviate an intensely negative one [<xref ref-type="bibr" rid="ref31">31</xref>,<xref ref-type="bibr" rid="ref34">34</xref>]. We suggest that while tracking positive mental states may be useful for understanding the complex dynamics of crisis helpline conversations, care should be taken when using positive emotions as outcomes or an indicator of service effectiveness.</p></sec><sec id="s4-2"><title>Implications for Research and Practice</title><p>This proof-of-concept study answers recent calls for innovative approaches to data collection in the crisis helpline context [<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref25">25</xref>]. The capacity of lexical analysis and advanced affective computing approaches to automatically detect and analyze emotion-based language in large datasets (and potentially in real-time) has the potential to transform crisis helpline research. Affective computing approaches hold promise for improved training instruments, quality assessment, and tools to help crisis supporters understand and respond to help-seekers&#x2019; needs.</p><p>The practical implications of our findings are considerable. By tracking help-seeker mental states in real-time, lexical analysis&#x2013;based tools may be able to enhance crisis supporter responsiveness, through methods such as visual aids or dashboards that support risk assessment and emotion detection. Such tools might be especially useful in the text and chat contexts where emotion recognition is more challenging due to the absence of vocal cues [<xref ref-type="bibr" rid="ref35">35</xref>,<xref ref-type="bibr" rid="ref36">36</xref>]. Similar tools could also be used for professional development and to enhance crisis supporter motivation and satisfaction, thus improving volunteer retention and reducing the risk and impact of negative well-being and burnout. Stronger evidence for crisis helpline effectiveness will facilitate funding opportunities and support more tailored service delivery.</p><p>The current findings were based on online chat data and other modalities, like telephone or SMS text message services, may show a different pattern of results. For example, some research shows that help-seekers accessing online crisis helplines have higher levels of suicidality than those accessing telephone helplines [<xref ref-type="bibr" rid="ref37">37</xref>]. As such, it will be important for future studies to conduct comparative analyses across modalities and to cross-validate NLP methods for monitoring user outcomes with real-time data.</p><p>The potential real-time application of lexical analysis-based tools in crisis helplines raises practical and ethical challenges that warrant careful consideration [<xref ref-type="bibr" rid="ref38">38</xref>,<xref ref-type="bibr" rid="ref39">39</xref>]. From a practical perspective, ongoing validation of context-specific categories with real-world data will be critical to maintaining accuracy and responsiveness. Language evolves rapidly, particularly in digital environments, with new slang, cultural references, and mental health terminology varying across social contexts [<xref ref-type="bibr" rid="ref30">30</xref>]. Future research could explore the development of automated methods for continuous learning to detect and incorporate new keywords, enhancing the adaptability of these tools. Ethically, there is a risk of over-reliance on automated tools at the expense of human judgment, potentially comprising the quality of crisis support. Furthermore, the use of these tools must be balanced with the paramount importance of help-seeker confidentiality and privacy. To navigate these ethical challenges, crisis helplines could consider implementing informed consent processes or opt-in mechanisms to provide users with choice and control over the use of artificial intelligence&#x2013;assisted tools in their interactions. To ensure transparency and maintain the trust of help-seekers, crisis supporters, and the broader community, crisis helplines should develop and publish clear policies on the role of artificial intelligence in crisis interventions, detailing how these tools are used, what data is collected, and how it is protected. Regular evaluation of the risks and benefits, together with robust safeguarding procedures, can help ensure new tools enhance rather than compromise the quality and ethics of crisis intervention delivery. As this field of research grows, it is vital to develop frameworks that ensure research rigor and integrity, including ways to facilitate the safe and ethical sharing of highly sensitive data between service providers and researchers [<xref ref-type="bibr" rid="ref2">2</xref>,<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref40">40</xref>].</p></sec><sec id="s4-3"><title>Limitations</title><p>This investigation revealed several interesting patterns in crisis chat conversations. The use of both pre-existing Empath categories alongside newly developed, context-specific categories, which both showed a similar pattern of results, strengthens the reliability of our findings [<xref ref-type="bibr" rid="ref41">41</xref>]. However, there are important limitations to note.</p><p>A well-known limitation of lexicon-based approaches is their inability to account for context (contextual agnosticism). For example, the use of the word suicide in a chat does not indicate whether the help-seeker is talking about suicide generally or expressing their own suicidality. Similarly, this approach is unable to account for sarcasm, negations, or misspellings. This deficit may be particularly problematic when analyzing crisis online chat conversations, where the language used is often fragmented and ambiguous [<xref ref-type="bibr" rid="ref4">4</xref>], and may have additional variations associated with computer-mediated communication norms (eg, emojis and abbreviations). To help overcome this limitation, future research could integrate lexical analysis with other approaches, such as sentiment analysis, topic modeling, and deep-learning features such as contextualized embeddings (eg, RoBERTa) [<xref ref-type="bibr" rid="ref42">42</xref>]. However, more complex approaches would sacrifice the transparency and interpretability of lexicon-based methods [<xref ref-type="bibr" rid="ref16">16</xref>,<xref ref-type="bibr" rid="ref43">43</xref>].</p><p>Another limitation of lexical-based approaches is the correlation within categories, that is, the overlap between different but related emotional categories. Specifically, the same lexical term, &#x201C;feel&#x201D;, represented the top occurring term in multiple categories (Positive Emotion, Suffering, and Optimism). This overlap may hide nuanced shifts in specific mental states, with patterns across categories appearing similar due to their shared expressions [<xref ref-type="bibr" rid="ref43">43</xref>]. Notably, correlations between the categories included in the current formative study were not exceedingly high and indicated sufficient variance to represent different constructs. Moreover, some overlap in terms and language used to express various emotions is to be expected. Future research may benefit from exploring those relationships between emotions using an approach such as network analysis.</p><p>Furthermore, data limitations constrain the generalizability of our findings. Analyzing data from a single helpline (Lifeline Australia), modality (online chat), and time period (3 months) increases risks of bias [<xref ref-type="bibr" rid="ref44">44</xref>]. A common challenge in crisis helpline research is the lack of access to demographic information about help-seekers due to the anonymous nature of service engagement, which limits understanding of variations across groups [<xref ref-type="bibr" rid="ref5">5</xref>]. Thus, it remains unclear whether the changes in mental states identified in this study would generalize to other helpline settings, temporal contexts, or service modalities.</p><p>Our formative approach of dividing the chats into thirds based on the total number of messages, as well as 9 overlapping windows, in the conversation used 2 methods to enhance comparability across chats of varying pace and length and allowed sufficient data in each segment for meaningful analysis. The use of 9 overlapping windows provides a more nuanced understanding of lexical shifts as it captures subtle fluctuations that may be obscured when dividing conversations into discrete phases (as in beginning, middle, and end). However, it is important to acknowledge that the unique and dynamic nature of each help-seeking process may not be entirely captured by the quantity of text exchanged. Future research may benefit from a dynamic and integrated approach that combines timestamps with message counts to identify more meaningful conversation stages. This could potentially capture both the temporal aspects and content progression of crisis chat interactions.</p><p>Finally, our approach assumes that the words used by help-seekers in the conversations reflect key help-seeker outcomes (changes in mental state and suicide risk). While this is likely the case, the validity of using lexical analysis to measure such outcomes needs to be further tested. For example, studies could compare the results of automated text analysis to expert human coding of the same conversations to determine concordance, or triangulate lexical results with self-report measures.</p></sec><sec id="s4-4"><title>Conclusions</title><p>A large dataset of crisis chats from Australia&#x2019;s national helpline demonstrated how NLP techniques can be used to track language associated with help-seeker mental states. Pending positive results from future validation studies, lexical analysis has the potential to be a valuable tool in monitoring and evaluating outcomes for help-seekers accessing a crisis chat service. The findings should be viewed as a successful test for the feasibility of approach rather than a real-world tool. We hope this formative research and initial step encourages further research toward the development and implementation of tools that can help crisis helplines meet the expanding needs of help-seekers in crisis.</p></sec></sec></body><back><ack><p>This work was conducted by the University of Canberra as part of a National Health and Medical Research Council (NHMRC) Partnership Grant with Lifeline Australia (GNT1153481). The NHMRC had no involvement in the conduct of this research or the preparation of this article. The authors would like to thank Lifeline Australia for their provision of the data analyzed in this study and support for this project.</p></ack><notes><sec><title>Data Availability</title><p>The datasets generated or analyzed during this study are not publicly available to protect the privacy and maintain the confidentiality of help-seekers but aggregate data are available from the corresponding author on reasonable request. Access to the aggregate data is contingent on obtaining permission from Lifeline Australia.</p></sec></notes><fn-group><fn fn-type="con"><p>ML, PJB, NT, RJ, DR, and KM contributed to conceptualizations. SC and KM handled writing&#x2013;original draft. HB and KM managed formal analysis and data curation. RG, HB, DR, and KM conducted methodology. DR handled funding acquisition. SC, ML, PJB, NT, RJ, DR, and KM performed writing&#x2013;review and editing.</p></fn><fn fn-type="conflict"><p>ML has collaborated with, and received funding managed by, Lifeline Australia for an unrelated project on preventing suicides in public places.</p></fn></fn-group><glossary><title>Abbreviations</title><def-list><def-item><term id="abb1">LIWC</term><def><p>Linguistic Inquiry and Word Count</p></def></def-item><def-item><term id="abb2">NLP</term><def><p>natural language processing</p></def></def-item></def-list></glossary><ref-list><title>References</title><ref id="ref1"><label>1</label><nlm-citation citation-type="web"><article-title>Preventing suicide: a resource for establishing a crisis line</article-title><source>World Health Organization</source><year>2018</year><access-date>2024-05-13</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://apps.who.int/iris/bitstream/handle/10665/311295/WHO-MSD-MER-18.4-eng.pdf">https://apps.who.int/iris/bitstream/handle/10665/311295/WHO-MSD-MER-18.4-eng.pdf</ext-link></comment></nlm-citation></ref><ref id="ref2"><label>2</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Zabelski</surname><given-names>S</given-names> </name><name name-style="western"><surname>Kaniuka</surname><given-names>AR</given-names> </name><name name-style="western"><surname>A Robertson</surname><given-names>R</given-names> </name><name name-style="western"><surname>Cramer</surname><given-names>RJ</given-names> </name></person-group><article-title>Crisis lines: current status and recommendations for research and policy</article-title><source>Psychiatr Serv</source><year>2023</year><month>05</month><day>1</day><volume>74</volume><issue>5</issue><fpage>505</fpage><lpage>512</lpage><pub-id pub-id-type="doi">10.1176/appi.ps.20220294</pub-id><pub-id pub-id-type="medline">36475827</pub-id></nlm-citation></ref><ref id="ref3"><label>3</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Gould</surname><given-names>MS</given-names> </name><name name-style="western"><surname>Chowdhury</surname><given-names>S</given-names> </name><name name-style="western"><surname>Lake</surname><given-names>AM</given-names> </name><etal/></person-group><article-title>National suicide prevention lifeline crisis chat interventions: evaluation of chatters&#x2019; perceptions of effectiveness</article-title><source>Suicide Life Threat Behav</source><year>2021</year><month>12</month><volume>51</volume><issue>6</issue><fpage>1126</fpage><lpage>1137</lpage><pub-id pub-id-type="doi">10.1111/sltb.12795</pub-id><pub-id pub-id-type="medline">34331471</pub-id></nlm-citation></ref><ref id="ref4"><label>4</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Mokkenstorm</surname><given-names>JK</given-names> </name><name name-style="western"><surname>Eikelenboom</surname><given-names>M</given-names> </name><name name-style="western"><surname>Huisman</surname><given-names>A</given-names> </name><etal/></person-group><article-title>Evaluation of the 113 online suicide prevention crisis chat service: outcomes, helper behaviors and comparison to telephone hotlines</article-title><source>Suicide &#x0026; Life Threat Behav</source><year>2017</year><month>06</month><volume>47</volume><issue>3</issue><fpage>282</fpage><lpage>296</lpage><comment><ext-link ext-link-type="uri" xlink:href="https://onlinelibrary.wiley.com/toc/1943278x/47/3">https://onlinelibrary.wiley.com/toc/1943278x/47/3</ext-link></comment><pub-id pub-id-type="doi">10.1111/sltb.12286</pub-id></nlm-citation></ref><ref id="ref5"><label>5</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Turkington</surname><given-names>R</given-names> </name><name name-style="western"><surname>Mulvenna</surname><given-names>M</given-names> </name><name name-style="western"><surname>Bond</surname><given-names>R</given-names> </name><etal/></person-group><article-title>Behavior of callers to a crisis helpline before and during the COVID-19 pandemic: quantitative data analysis</article-title><source>JMIR Ment Health</source><year>2020</year><month>11</month><day>6</day><volume>7</volume><issue>11</issue><fpage>e22984</fpage><pub-id pub-id-type="doi">10.2196/22984</pub-id><pub-id pub-id-type="medline">33112759</pub-id></nlm-citation></ref><ref id="ref6"><label>6</label><nlm-citation citation-type="web"><article-title>Annual report: 2022-2023</article-title><source>Lifeline Australia</source><year>2023</year><access-date>2024-05-13</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.lifeline.org.au/media/quvfglvm/233-017-lifeline-annual-report-2023-v8-lr-1.pdf">https://www.lifeline.org.au/media/quvfglvm/233-017-lifeline-annual-report-2023-v8-lr-1.pdf</ext-link></comment></nlm-citation></ref><ref id="ref7"><label>7</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kitchingman</surname><given-names>TA</given-names> </name><name name-style="western"><surname>Caputi</surname><given-names>P</given-names> </name><name name-style="western"><surname>Woodward</surname><given-names>A</given-names> </name><name name-style="western"><surname>Wilson</surname><given-names>CJ</given-names> </name><name name-style="western"><surname>Wilson</surname><given-names>I</given-names> </name></person-group><article-title>The impact of their role on telephone crisis support workers&#x2019; psychological wellbeing and functioning: Quantitative findings from a mixed methods investigation</article-title><source>PLoS ONE</source><year>2018</year><volume>13</volume><issue>12</issue><fpage>e0207645</fpage><pub-id pub-id-type="doi">10.1371/journal.pone.0207645</pub-id><pub-id pub-id-type="medline">30566435</pub-id></nlm-citation></ref><ref id="ref8"><label>8</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Willems</surname><given-names>R</given-names> </name><name name-style="western"><surname>Drossaert</surname><given-names>C</given-names> </name><name name-style="western"><surname>Vuijk</surname><given-names>P</given-names> </name><name name-style="western"><surname>Bohlmeijer</surname><given-names>E</given-names> </name></person-group><article-title>Impact of crisis line volunteering on mental wellbeing and the associated factors: a systematic review</article-title><source>Int J Environ Res Public Health</source><year>2020</year><month>03</month><day>3</day><volume>17</volume><issue>5</issue><fpage>1641</fpage><pub-id pub-id-type="doi">10.3390/ijerph17051641</pub-id><pub-id pub-id-type="medline">32138360</pub-id></nlm-citation></ref><ref id="ref9"><label>9</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Mazzer</surname><given-names>K</given-names> </name><name name-style="western"><surname>O&#x2019;Riordan</surname><given-names>M</given-names> </name><name name-style="western"><surname>Woodward</surname><given-names>A</given-names> </name><name name-style="western"><surname>Rickwood</surname><given-names>D</given-names> </name></person-group><article-title>A systematic review of user expectations and outcomes of crisis support services</article-title><source>Crisis</source><year>2021</year><month>11</month><volume>42</volume><issue>6</issue><fpage>465</fpage><lpage>473</lpage><pub-id pub-id-type="doi">10.1027/0227-5910/a000745</pub-id><pub-id pub-id-type="medline">33275048</pub-id></nlm-citation></ref><ref id="ref10"><label>10</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Trail</surname><given-names>K</given-names> </name><name name-style="western"><surname>Baptiste</surname><given-names>PJ</given-names> </name><name name-style="western"><surname>Hunt</surname><given-names>T</given-names> </name><name name-style="western"><surname>Brooks</surname><given-names>A</given-names> </name></person-group><article-title>Conducting research in crisis helpline settings</article-title><source>Crisis</source><year>2022</year><month>07</month><volume>43</volume><issue>4</issue><fpage>263</fpage><lpage>269</lpage><pub-id pub-id-type="doi">10.1027/0227-5910/a000858</pub-id><pub-id pub-id-type="medline">35438001</pub-id></nlm-citation></ref><ref id="ref11"><label>11</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Tyson</surname><given-names>P</given-names> </name><name name-style="western"><surname>Law</surname><given-names>C</given-names> </name><name name-style="western"><surname>Reed</surname><given-names>S</given-names> </name><name name-style="western"><surname>Johnsey</surname><given-names>E</given-names> </name><name name-style="western"><surname>Aruna</surname><given-names>O</given-names> </name><name name-style="western"><surname>Hall</surname><given-names>S</given-names> </name></person-group><article-title>Preventing suicide and self-harm</article-title><source>Crisis</source><year>2016</year><month>09</month><volume>37</volume><issue>5</issue><fpage>353</fpage><lpage>360</lpage><pub-id pub-id-type="doi">10.1027/0227-5910/a000390</pub-id><pub-id pub-id-type="medline">27278572</pub-id></nlm-citation></ref><ref id="ref12"><label>12</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lake</surname><given-names>AM</given-names> </name><name name-style="western"><surname>Niederkrotenthaler</surname><given-names>T</given-names> </name><name name-style="western"><surname>Aspden</surname><given-names>R</given-names> </name><etal/></person-group><article-title>Lifeline crisis chat: coding form development and findings on chatters&#x2019; risk status and counselor behaviors</article-title><source>Suicide Life Threat Behav</source><year>2022</year><month>06</month><volume>52</volume><issue>3</issue><fpage>452</fpage><lpage>466</lpage><pub-id pub-id-type="doi">10.1111/sltb.12835</pub-id><pub-id pub-id-type="medline">35112387</pub-id></nlm-citation></ref><ref id="ref13"><label>13</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Hoffberg</surname><given-names>AS</given-names> </name><name name-style="western"><surname>Stearns-Yoder</surname><given-names>KA</given-names> </name><name name-style="western"><surname>Brenner</surname><given-names>LA</given-names> </name></person-group><article-title>The effectiveness of crisis line services: a systematic review</article-title><source>Front Public Health</source><year>2019</year><volume>7</volume><issue>17</issue><fpage>399</fpage><pub-id pub-id-type="doi">10.3389/fpubh.2019.00399</pub-id><pub-id pub-id-type="medline">32010655</pub-id></nlm-citation></ref><ref id="ref14"><label>14</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Wang</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Song</surname><given-names>W</given-names> </name><name name-style="western"><surname>Tao</surname><given-names>W</given-names> </name><etal/></person-group><article-title>A systematic review on affective computing: emotion models, databases, and recent advances</article-title><source>Information Fusion</source><year>2022</year><month>07</month><volume>83-84</volume><issue>83</issue><fpage>19</fpage><lpage>52</lpage><pub-id pub-id-type="doi">10.1016/j.inffus.2022.03.009</pub-id></nlm-citation></ref><ref id="ref15"><label>15</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Nandwani</surname><given-names>P</given-names> </name><name name-style="western"><surname>Verma</surname><given-names>R</given-names> </name></person-group><article-title>A review on sentiment analysis and emotion detection from text</article-title><source>Soc Netw Anal Min</source><year>2021</year><volume>11</volume><issue>1</issue><fpage>81</fpage><pub-id pub-id-type="doi">10.1007/s13278-021-00776-6</pub-id><pub-id pub-id-type="medline">34484462</pub-id></nlm-citation></ref><ref id="ref16"><label>16</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Malgaroli</surname><given-names>M</given-names> </name><name name-style="western"><surname>Hull</surname><given-names>TD</given-names> </name><name name-style="western"><surname>Zech</surname><given-names>JM</given-names> </name><name name-style="western"><surname>Althoff</surname><given-names>T</given-names> </name></person-group><article-title>Natural language processing for mental health interventions: a systematic review and research framework</article-title><source>Transl Psychiatry</source><year>2023</year><month>10</month><day>6</day><volume>13</volume><issue>1</issue><fpage>309</fpage><pub-id pub-id-type="doi">10.1038/s41398-023-02592-2</pub-id><pub-id pub-id-type="medline">37798296</pub-id></nlm-citation></ref><ref id="ref17"><label>17</label><nlm-citation citation-type="other"><person-group person-group-type="author"><name name-style="western"><surname>Fast</surname><given-names>E</given-names> </name><name name-style="western"><surname>Chen</surname><given-names>B</given-names> </name><name name-style="western"><surname>Bernstein</surname><given-names>M</given-names> </name></person-group><article-title>Empath: understanding topic signals in large-scale text</article-title><source>ArXiv Preprint posted online on February 22, 2023</source><access-date>2025-06-11</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://arxiv.org/abs/1602.06979">https://arxiv.org/abs/1602.06979</ext-link></comment></nlm-citation></ref><ref id="ref18"><label>18</label><nlm-citation citation-type="web"><person-group person-group-type="author"><name name-style="western"><surname>Pennebaker</surname><given-names>JW</given-names> </name><name name-style="western"><surname>Francis</surname><given-names>ME</given-names> </name><name name-style="western"><surname>Booth</surname><given-names>RJ</given-names> </name></person-group><article-title>LIWC 2015 operator&#x2019;s manual</article-title><source>Linguistic Inquiry and Word Count: LIWC 2015</source><year>2015</year><access-date>2024-05-13</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.liwc.app/help/psychometrics-manuals">https://www.liwc.app/help/psychometrics-manuals</ext-link></comment></nlm-citation></ref><ref id="ref19"><label>19</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Bittar</surname><given-names>A</given-names> </name><name name-style="western"><surname>Velupillai</surname><given-names>S</given-names> </name><name name-style="western"><surname>Roberts</surname><given-names>A</given-names> </name><name name-style="western"><surname>Dutta</surname><given-names>R</given-names> </name></person-group><article-title>Using general-purpose sentiment lexicons for suicide risk assessment in electronic health records: corpus-based analysis</article-title><source>JMIR Med Inform</source><year>2021</year><month>04</month><day>13</day><volume>9</volume><issue>4</issue><fpage>e22397</fpage><pub-id pub-id-type="doi">10.2196/22397</pub-id><pub-id pub-id-type="medline">33847595</pub-id></nlm-citation></ref><ref id="ref20"><label>20</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>Howes</surname><given-names>C</given-names> </name><name name-style="western"><surname>Purver</surname><given-names>M</given-names> </name><name name-style="western"><surname>McCabe</surname><given-names>R</given-names> </name></person-group><article-title>Linguistic indicators of severity and progress in online text-based therapy for depression</article-title><access-date>2025-06-11</access-date><conf-name>Proceedings of the Workshop on Computational Linguistics and Clinical Psychology</conf-name><conf-date>Jun 27, 2014</conf-date><conf-loc>Baltimore, Maryland, USA</conf-loc><fpage>17145831</fpage><comment><ext-link ext-link-type="uri" xlink:href="http://aclweb.org/anthology/W14-32">http://aclweb.org/anthology/W14-32</ext-link></comment><pub-id pub-id-type="doi">10.3115/v1/W14-3202</pub-id></nlm-citation></ref><ref id="ref21"><label>21</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Broadbent</surname><given-names>M</given-names> </name><name name-style="western"><surname>Medina Grespan</surname><given-names>M</given-names> </name><name name-style="western"><surname>Axford</surname><given-names>K</given-names> </name><etal/></person-group><article-title>A machine learning approach to identifying suicide risk among text-based crisis counseling encounters</article-title><source>Front Psychiatry</source><year>2023</year><volume>14</volume><issue>14</issue><fpage>1110527</fpage><pub-id pub-id-type="doi">10.3389/fpsyt.2023.1110527</pub-id><pub-id pub-id-type="medline">37032952</pub-id></nlm-citation></ref><ref id="ref22"><label>22</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Xu</surname><given-names>Z</given-names> </name><name name-style="western"><surname>Chan</surname><given-names>CS</given-names> </name><name name-style="western"><surname>Zhang</surname><given-names>Q</given-names> </name><etal/></person-group><article-title>Network-based prediction of the disclosure of ideation about self-harm and suicide in online counseling sessions</article-title><source>Commun Med (Lond)</source><year>2022</year><month>12</month><day>6</day><volume>2</volume><issue>1</issue><fpage>156</fpage><pub-id pub-id-type="doi">10.1038/s43856-022-00222-4</pub-id><pub-id pub-id-type="medline">36474010</pub-id></nlm-citation></ref><ref id="ref23"><label>23</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Salmi</surname><given-names>S</given-names> </name><name name-style="western"><surname>M&#x00E9;relle</surname><given-names>S</given-names> </name><name name-style="western"><surname>Gilissen</surname><given-names>R</given-names> </name><name name-style="western"><surname>Brinkman</surname><given-names>WP</given-names> </name></person-group><article-title>Content-based recommender support system for counselors in a suicide prevention chat helpline: design and evaluation study</article-title><source>J Med Internet Res</source><year>2021</year><month>01</month><day>7</day><volume>23</volume><issue>1</issue><fpage>e21690</fpage><pub-id pub-id-type="doi">10.2196/21690</pub-id><pub-id pub-id-type="medline">33410755</pub-id></nlm-citation></ref><ref id="ref24"><label>24</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>Dinakar</surname><given-names>K</given-names> </name><name name-style="western"><surname>Chen</surname><given-names>J</given-names> </name><name name-style="western"><surname>Lieberman</surname><given-names>H</given-names> </name><name name-style="western"><surname>Picard</surname><given-names>R</given-names> </name><name name-style="western"><surname>Filbin</surname><given-names>R</given-names> </name></person-group><article-title>Mixed-initiative real-time topic modeling &#x0026; visualization for crisis counseling</article-title><conf-name>IUI '15: Proceedings of the 20th International Conference on Intelligent User Interfaces</conf-name><conf-date>May 18, 2015</conf-date><conf-loc>Atlanta Georgia USA</conf-loc><fpage>417</fpage><lpage>426</lpage><pub-id pub-id-type="doi">10.1145/2678025.2701395</pub-id></nlm-citation></ref><ref id="ref25"><label>25</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Althoff</surname><given-names>T</given-names> </name><name name-style="western"><surname>Clark</surname><given-names>K</given-names> </name><name name-style="western"><surname>Leskovec</surname><given-names>J</given-names> </name></person-group><article-title>Large-scale analysis of counseling conversations: an application of natural language processing to mental health</article-title><source>Trans Assoc Comput Linguist</source><year>2016</year><volume>4</volume><issue>4</issue><fpage>463</fpage><lpage>476</lpage><pub-id pub-id-type="doi">10.1162/tacl_a_00111</pub-id><pub-id pub-id-type="medline">28344978</pub-id></nlm-citation></ref><ref id="ref26"><label>26</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Raveau</surname><given-names>MP</given-names> </name><name name-style="western"><surname>Go&#x00F1;i</surname><given-names>JI</given-names> </name><name name-style="western"><surname>Rodr&#x00ED;guez</surname><given-names>JF</given-names> </name><etal/></person-group><article-title>Natural language processing analysis of the psychosocial stressors of mental health disorders during the pandemic</article-title><source>NPJ Ment Health Res</source><year>2023</year><month>10</month><day>5</day><volume>2</volume><issue>1</issue><fpage>17</fpage><pub-id pub-id-type="doi">10.1038/s44184-023-00039-6</pub-id><pub-id pub-id-type="medline">38609516</pub-id></nlm-citation></ref><ref id="ref27"><label>27</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>&#x00D6;hman</surname><given-names>E</given-names> </name></person-group><article-title>The validity of lexicon-based sentiment analysis in interdisciplinary research</article-title><access-date>2025-06-11</access-date><conf-name>Proceedings of the Workshop on Natural Language Processing for Digital Humanities</conf-name><conf-date>Dec 16-19, 2021</conf-date><conf-loc>Silchar, Assam, India</conf-loc><comment><ext-link ext-link-type="uri" xlink:href="https://aclanthology.org/2021.nlp4dh-1.2/">https://aclanthology.org/2021.nlp4dh-1.2/</ext-link></comment></nlm-citation></ref><ref id="ref28"><label>28</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Porter</surname><given-names>MF</given-names> </name></person-group><article-title>An algorithm for suffix stripping</article-title><source>Program</source><year>1980</year><month>03</month><day>1</day><volume>14</volume><issue>3</issue><fpage>130</fpage><lpage>137</lpage><pub-id pub-id-type="doi">10.1108/eb046814</pub-id></nlm-citation></ref><ref id="ref29"><label>29</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Brown</surname><given-names>PF</given-names> </name><name name-style="western"><surname>Della Pietra</surname><given-names>VJ</given-names> </name><name name-style="western"><surname>Desouza</surname><given-names>PV</given-names> </name><name name-style="western"><surname>Lai</surname><given-names>JC</given-names> </name><name name-style="western"><surname>Mercer</surname><given-names>RL</given-names> </name></person-group><article-title>Class-based n-gram models of natural language</article-title><source>Comp Linguist</source><year>1992</year><access-date>2025-06-11</access-date><volume>18</volume><issue>4</issue><fpage>467</fpage><lpage>480</lpage><comment><ext-link ext-link-type="uri" xlink:href="https://aclanthology.org/J92-4003/">https://aclanthology.org/J92-4003/</ext-link></comment></nlm-citation></ref><ref id="ref30"><label>30</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Hamilton</surname><given-names>WL</given-names> </name><name name-style="western"><surname>Clark</surname><given-names>K</given-names> </name><name name-style="western"><surname>Leskovec</surname><given-names>J</given-names> </name><name name-style="western"><surname>Jurafsky</surname><given-names>D</given-names> </name></person-group><article-title>Inducing domain-specific sentiment lexicons from unlabeled corpora</article-title><source>Proc Conf Empir Methods Nat Lang Process</source><year>2016</year><month>11</month><volume>2016</volume><fpage>595</fpage><lpage>605</lpage><pub-id pub-id-type="doi">10.18653/v1/D16-1057</pub-id><pub-id pub-id-type="medline">28660257</pub-id></nlm-citation></ref><ref id="ref31"><label>31</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Curll</surname><given-names>S</given-names> </name><name name-style="western"><surname>Mazzer</surname><given-names>K</given-names> </name><name name-style="western"><surname>Rickwood</surname><given-names>D</given-names> </name></person-group><article-title>The development of a core outcome set for crisis helplines: a three-panel Delphi study</article-title><source>Journal of Affective Disorders Reports</source><year>2024</year><month>04</month><volume>16</volume><issue>16</issue><fpage>100763</fpage><pub-id pub-id-type="doi">10.1016/j.jadr.2024.100763</pub-id></nlm-citation></ref><ref id="ref32"><label>32</label><nlm-citation citation-type="book"><person-group person-group-type="author"><name name-style="western"><surname>Woodward</surname><given-names>A</given-names> </name><name name-style="western"><surname>Wyllie</surname><given-names>C</given-names> </name></person-group><person-group person-group-type="editor"><name name-style="western"><surname>O&#x2019;Connor</surname><given-names>R</given-names> </name><name name-style="western"><surname>Pirkis</surname><given-names>J</given-names> </name></person-group><article-title>Helplines, tele&#x2010;web support services, and suicide prevention</article-title><source>The International Handbook of Suicide Prevention</source><year>2016</year><publisher-name>Wiley-Blackwell</publisher-name><fpage>490</fpage><lpage>504</lpage><pub-id pub-id-type="doi">10.1002/9781118903223</pub-id><pub-id pub-id-type="other">9781118903223</pub-id></nlm-citation></ref><ref id="ref33"><label>33</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Rickwood</surname><given-names>D</given-names> </name><name name-style="western"><surname>Bradford</surname><given-names>S</given-names> </name></person-group><article-title>Putting young people at the forefront of their mental health care through technology for holistic assessment and routine outcome tracking</article-title><source>iproc</source><year>2016</year><volume>2</volume><issue>1</issue><fpage>e40</fpage><pub-id pub-id-type="doi">10.2196/iproc.6049</pub-id></nlm-citation></ref><ref id="ref34"><label>34</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>O&#x2019;Riordan</surname><given-names>M</given-names> </name><name name-style="western"><surname>Ma</surname><given-names>JS</given-names> </name><name name-style="western"><surname>Mazzer</surname><given-names>K</given-names> </name><etal/></person-group><article-title>Help-seeker expectations and outcomes of a crisis support service: comparison of suicide-related and non-suicide-related contacts to lifeline Australia</article-title><source>Health Soc Care Community</source><year>2022</year><month>11</month><volume>30</volume><issue>6</issue><fpage>e4535</fpage><lpage>e4544</lpage><pub-id pub-id-type="doi">10.1111/hsc.13857</pub-id><pub-id pub-id-type="medline">35676830</pub-id></nlm-citation></ref><ref id="ref35"><label>35</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Bambling</surname><given-names>M</given-names> </name><name name-style="western"><surname>King</surname><given-names>R</given-names> </name><name name-style="western"><surname>Reid</surname><given-names>W</given-names> </name><name name-style="western"><surname>Wegner</surname><given-names>K</given-names> </name></person-group><article-title>Online counselling: the experience of counsellors providing synchronous single&#x2010;session counselling to young people</article-title><source>Couns and Psychother Res</source><year>2008</year><month>06</month><volume>8</volume><issue>2</issue><fpage>110</fpage><lpage>116</lpage><pub-id pub-id-type="doi">10.1080/14733140802055011</pub-id></nlm-citation></ref><ref id="ref36"><label>36</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Moylan</surname><given-names>CA</given-names> </name><name name-style="western"><surname>Carlson</surname><given-names>ML</given-names> </name><name name-style="western"><surname>Campbell</surname><given-names>R</given-names> </name><name name-style="western"><surname>Fedewa</surname><given-names>T</given-names> </name></person-group><article-title>&#x201C;It&#x2019;s hard to show empathy in a text&#x201D;: developing a web-based sexual assault hotline in a college setting</article-title><source>J Interpers Violence</source><year>2022</year><month>09</month><volume>37</volume><issue>17-18</issue><fpage>NP16037</fpage><lpage>NP16059</lpage><pub-id pub-id-type="doi">10.1177/08862605211025036</pub-id><pub-id pub-id-type="medline">34134570</pub-id></nlm-citation></ref><ref id="ref37"><label>37</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Gilat</surname><given-names>I</given-names> </name><name name-style="western"><surname>Shahar</surname><given-names>G</given-names> </name></person-group><article-title>Emotional first aid for a suicide crisis: comparison between telephonic hotline and internet</article-title><source>Psychiatry (Abingdon)</source><year>2007</year><volume>70</volume><issue>1</issue><fpage>12</fpage><lpage>18</lpage><pub-id pub-id-type="doi">10.1521/psyc.2007.70.1.12</pub-id><pub-id pub-id-type="medline">17492908</pub-id></nlm-citation></ref><ref id="ref38"><label>38</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Ma</surname><given-names>JS</given-names> </name><name name-style="western"><surname>O&#x2019;Riordan</surname><given-names>M</given-names> </name><name name-style="western"><surname>Mazzer</surname><given-names>K</given-names> </name><etal/></person-group><article-title>Consumer perspectives on the use of artificial intelligence technology and automation in crisis support services: mixed methods study</article-title><source>JMIR Hum Factors</source><year>2022</year><month>08</month><day>5</day><volume>9</volume><issue>3</issue><fpage>e34514</fpage><pub-id pub-id-type="doi">10.2196/34514</pub-id><pub-id pub-id-type="medline">35930334</pub-id></nlm-citation></ref><ref id="ref39"><label>39</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Hopkins</surname><given-names>D</given-names> </name><name name-style="western"><surname>Rickwood</surname><given-names>DJ</given-names> </name><name name-style="western"><surname>Hallford</surname><given-names>DJ</given-names> </name><name name-style="western"><surname>Watsford</surname><given-names>C</given-names> </name></person-group><article-title>Structured data vs. unstructured data in machine learning prediction models for suicidal behaviors: a systematic review and meta-analysis</article-title><source>Front Digit Health</source><year>2022</year><volume>4</volume><issue>4</issue><fpage>945006</fpage><pub-id pub-id-type="doi">10.3389/fdgth.2022.945006</pub-id><pub-id pub-id-type="medline">35983407</pub-id></nlm-citation></ref><ref id="ref40"><label>40</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Pisani</surname><given-names>AR</given-names> </name><name name-style="western"><surname>Kanuri</surname><given-names>N</given-names> </name><name name-style="western"><surname>Filbin</surname><given-names>B</given-names> </name><etal/></person-group><article-title>Protecting user privacy and rights in academic data-sharing partnerships: principles from a pilot program at crisis text line</article-title><source>J Med Internet Res</source><year>2019</year><month>01</month><day>17</day><volume>21</volume><issue>1</issue><fpage>e11507</fpage><pub-id pub-id-type="doi">10.2196/11507</pub-id><pub-id pub-id-type="medline">30664452</pub-id></nlm-citation></ref><ref id="ref41"><label>41</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Czarnek</surname><given-names>G</given-names> </name><name name-style="western"><surname>Stillwell</surname><given-names>D</given-names> </name></person-group><article-title>Two is better than one: using a single emotion lexicon can lead to unreliable conclusions</article-title><source>PLoS ONE</source><year>2022</year><volume>17</volume><issue>10</issue><fpage>e0275910</fpage><pub-id pub-id-type="doi">10.1371/journal.pone.0275910</pub-id><pub-id pub-id-type="medline">36240202</pub-id></nlm-citation></ref><ref id="ref42"><label>42</label><nlm-citation citation-type="other"><person-group person-group-type="author"><name name-style="western"><surname>Laricheva</surname><given-names>M</given-names> </name><name name-style="western"><surname>Zhang</surname><given-names>C</given-names> </name><name name-style="western"><surname>Liu</surname><given-names>Y</given-names> </name><etal/></person-group><article-title>Automated utterance labeling of conversations using natural language processing</article-title><source>ArXiv Preprint posted online on Aug 2, 2022</source><access-date>2025-06-11</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://arxiv.org/abs/2208.06525">https://arxiv.org/abs/2208.06525</ext-link></comment></nlm-citation></ref><ref id="ref43"><label>43</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lekkas</surname><given-names>D</given-names> </name><name name-style="western"><surname>Jacobson</surname><given-names>NC</given-names> </name></person-group><article-title>The hidden depths of suicidal discourse: network analysis and natural language processing unmask uncensored expression</article-title><source>Digit Health</source><year>2023</year><volume>9</volume><issue>9</issue><fpage>20552076231210714</fpage><pub-id pub-id-type="doi">10.1177/20552076231210714</pub-id><pub-id pub-id-type="medline">37928333</pub-id></nlm-citation></ref><ref id="ref44"><label>44</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Linthicum</surname><given-names>KP</given-names> </name><name name-style="western"><surname>Schafer</surname><given-names>KM</given-names> </name><name name-style="western"><surname>Ribeiro</surname><given-names>JD</given-names> </name></person-group><article-title>Machine learning in suicide science: applications and ethics</article-title><source>Behav Sci Law</source><year>2019</year><month>05</month><volume>37</volume><issue>3</issue><fpage>214</fpage><lpage>222</lpage><pub-id pub-id-type="doi">10.1002/bsl.2392</pub-id><pub-id pub-id-type="medline">30609102</pub-id></nlm-citation></ref></ref-list><app-group><supplementary-material id="app1"><label>Multimedia Appendix 1</label><p>Means and SDs of token counts for each category across the 9 windows.</p><media xlink:href="formative_v9i1e63257_app1.docx" xlink:title="DOCX File, 17 KB"/></supplementary-material></app-group></back></article>