<?xml version="1.0" encoding="UTF-8"?><!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "journalpublishing.dtd"><article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" dtd-version="2.0" xml:lang="en" article-type="research-article"><front><journal-meta><journal-id journal-id-type="nlm-ta">JMIR Form Res</journal-id><journal-id journal-id-type="publisher-id">formative</journal-id><journal-id journal-id-type="index">27</journal-id><journal-title>JMIR Formative Research</journal-title><abbrev-journal-title>JMIR Form Res</abbrev-journal-title><issn pub-type="epub">2561-326X</issn><publisher><publisher-name>JMIR Publications</publisher-name><publisher-loc>Toronto, Canada</publisher-loc></publisher></journal-meta><article-meta><article-id pub-id-type="publisher-id">v10i1e76808</article-id><article-id pub-id-type="doi">10.2196/76808</article-id><article-categories><subj-group subj-group-type="heading"><subject>Original Paper</subject></subj-group></article-categories><title-group><article-title>Knowledge Graphs Based on Meta-Analysis Papers Improve the Quality of Case Formulation: Mixed Methods Design</article-title></title-group><contrib-group><contrib contrib-type="author" corresp="yes"><name name-style="western"><surname>Yokotani</surname><given-names>Kenji</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff1">1</xref><xref ref-type="aff" rid="aff2">2</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Jikihara</surname><given-names>Yasumitsu</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff3">3</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Koiwa</surname><given-names>Kohei</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff4">4</xref></contrib></contrib-group><aff id="aff1"><institution>Graduate School of Technology, Industrial and Social Sciences, Tokushima University</institution><addr-line>1-1, Minamijosanjima-cho</addr-line><addr-line>Tokushima</addr-line><country>Japan</country></aff><aff id="aff2"><institution>Department of Data Science, PsychoBit Inc.</institution><addr-line>Kobe</addr-line><country>Japan</country></aff><aff id="aff3"><institution>Graduate School of Human Sciences, The University of Osaka</institution><addr-line>Suita</addr-line><country>Japan</country></aff><aff id="aff4"><institution>Graduate School of Education, Hokkaido University of Education</institution><addr-line>Sapporo</addr-line><country>Japan</country></aff><contrib-group><contrib contrib-type="editor"><name name-style="western"><surname>Mavragani</surname><given-names>Amaryllis</given-names></name></contrib><contrib contrib-type="editor"><name name-style="western"><surname>Steenstra</surname><given-names>Ivan</given-names></name></contrib></contrib-group><contrib-group><contrib contrib-type="reviewer"><name name-style="western"><surname>Bhasuran</surname><given-names>Balu</given-names></name></contrib></contrib-group><author-notes><corresp>Correspondence to Kenji Yokotani, PhD, Graduate School of Technology, Industrial and Social Sciences, Tokushima University, 1-1, Minamijosanjima-cho, Tokushima, 770-8502, Japan, 81 88-656-7000; <email>yokotanikenji@tokushima-u.ac.jp</email></corresp></author-notes><pub-date pub-type="collection"><year>2026</year></pub-date><pub-date pub-type="epub"><day>30</day><month>6</month><year>2026</year></pub-date><volume>10</volume><elocation-id>e76808</elocation-id><history><date date-type="received"><day>01</day><month>05</month><year>2025</year></date><date date-type="rev-recd"><day>05</day><month>03</month><year>2026</year></date><date date-type="accepted"><day>06</day><month>03</month><year>2026</year></date></history><copyright-statement>&#x00A9; Kenji Yokotani, Yasumitsu Jikihara, Kohei Koiwa. Originally published in JMIR Formative Research (<ext-link ext-link-type="uri" xlink:href="https://formative.jmir.org">https://formative.jmir.org</ext-link>), 30.6.2026. </copyright-statement><copyright-year>2026</copyright-year><license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (<ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">https://creativecommons.org/licenses/by/4.0/</ext-link>), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Formative Research, is properly cited. The complete bibliographic information, a link to the original publication on <ext-link ext-link-type="uri" xlink:href="https://formative.jmir.org">https://formative.jmir.org</ext-link>, as well as this copyright and license information must be included.</p></license><self-uri xlink:type="simple" xlink:href="https://formative.jmir.org/2026/1/e76808"/><abstract><sec><title>Background</title><p>Case formulation (CF) is a core skill for therapists; however, creating high-quality CFs requires considerable time.</p></sec><sec><title>Objective</title><p>This study aims to demonstrate that providing a knowledge graph based on meta-analytic literature can enhance CF quality.</p></sec><sec sec-type="methods"><title>Methods</title><p>Five groups were established, including 4 large language model groups and 1 human expert group, each generating 25 CFs based on 25 vignettes. The control group with Claude (Sonnet 3.7; Anthropic) produced 25 CFs. The personalization group served as the control group with additional personalization prompts. The knowledge graph group used a large language model that generated 25 CFs, which was provided with a meta-analysis knowledge graph. Further incorporation of additional personalization prompts then comprised the knowledge graph with personalization group. Finally, the expert group consisted of 25 CFs generated by a human expert. These 125 CFs in total were evaluated for general quality (ie, correctness, completeness, feasibility, and consistency) using a 7-point scale and 18 essential elements with binary scores (0 or 1) by another human expert. The CFs were also qualitatively analyzed.</p></sec><sec sec-type="results"><title>Results</title><p>The knowledge graph and knowledge graph with personalization groups scored significantly higher than the control group in terms of correctness, completeness, and feasibility. The expert group scored significantly higher on consistency than the machine-generated groups. Additionally, there was no significant difference in the feasibility scores among the knowledge graph, knowledge graph with personalization, and expert groups. The qualitative evaluation suggested that human CFs narrow the text to content that is easy for the client to read, whereas machine CFs are more likely to include expressions that are unnatural to the client.</p></sec><sec sec-type="conclusions"><title>Conclusions</title><p>These results indicate that providing knowledge graphs to novice therapists increases the correctness, completeness, and feasibility of CF. Providing experienced therapists with knowledge graphs is suggested to improve the quality of their CF and mental health services.</p></sec></abstract><kwd-group><kwd>case formulation</kwd><kwd>knowledge graph</kwd><kwd>family therapy</kwd><kwd>large language model</kwd><kwd>LLM</kwd><kwd>reframing</kwd></kwd-group></article-meta></front><body><sec id="s1" sec-type="intro"><title>Introduction</title><p>Case formulation (CF), or case conceptualization, is a hypothesis collaboratively developed by the therapist and the client to address the client&#x2019;s psychological difficulties [<xref ref-type="bibr" rid="ref1">1</xref>,<xref ref-type="bibr" rid="ref2">2</xref>]. It influences both the choice of therapeutic approach [<xref ref-type="bibr" rid="ref3">3</xref>] and treatment outcomes [<xref ref-type="bibr" rid="ref4">4</xref>]. CF is a core skill for therapists [<xref ref-type="bibr" rid="ref5">5</xref>]; however, extensive training is required to develop high-quality CF [<xref ref-type="bibr" rid="ref6">6</xref>]. CF involves not only the diagnosis of mental disorders but also the comprehensive assessment of the client&#x2019;s psychological difficulties and associated risks [<xref ref-type="bibr" rid="ref7">7</xref>]. Consequently, it is a time-consuming process, with previous research indicating that the development of a single CF requires an average of approximately 52 minutes [<xref ref-type="bibr" rid="ref8">8</xref>]. In recent years, the automated generation of CF through a large language model (LLM) has been used as an auxiliary tool for therapists to create high-quality CF. It has been suggested that by using this CF, therapists can produce high-quality CF within a relatively short training period [<xref ref-type="bibr" rid="ref1">1</xref>]. This study demonstrates that by incorporating the collection of meta-analysis evidence as a knowledge graph into LLM [<xref ref-type="bibr" rid="ref9">9</xref>,<xref ref-type="bibr" rid="ref10">10</xref>], a high-quality CF can be generated. High-quality CF could serve as an auxiliary clinical tool for therapists to develop their CF skills [<xref ref-type="bibr" rid="ref11">11</xref>].</p><p>The theoretical model of this study is an evidence-based CF model [<xref ref-type="bibr" rid="ref12">12</xref>], which emphasizes the incorporation of findings from previous research&#x2014;that is, evidence&#x2014;into CF. Evidence-based CF is currently considered the most reasonable approach [<xref ref-type="bibr" rid="ref13">13</xref>]. Although therapists understand the importance of citing evidence, it has been pointed out that, in practice, CF is conducted without using evidence because of the time-consuming nature of literature searches [<xref ref-type="bibr" rid="ref14">14</xref>]. However, theoretically, evidence-based assessments and CFs refine CFs and gradually improve their quality. [<xref ref-type="bibr" rid="ref15">15</xref>].</p><p>Knowledge graphs are used to retrieve evidence collections. A knowledge graph is a network that systematically connects various pieces of knowledge [<xref ref-type="bibr" rid="ref16">16</xref>] and represents them in a graph structure (<xref ref-type="fig" rid="figure1">Figure 1</xref>); knowledge graphs have been constructed from clinical trials [<xref ref-type="bibr" rid="ref17">17</xref>], medical records [<xref ref-type="bibr" rid="ref18">18</xref>], and research papers [<xref ref-type="bibr" rid="ref16">16</xref>]. Decision-making for therapists can be supported by such knowledge graphs [<xref ref-type="bibr" rid="ref19">19</xref>]. Furthermore, by incorporating a knowledge graph into the LLM, more accurate diagnoses [<xref ref-type="bibr" rid="ref10">10</xref>] and higher-quality diagnostic report generation [<xref ref-type="bibr" rid="ref9">9</xref>] become possible.</p><fig position="float" id="figure1"><label>Figure 1.</label><caption><p>Examples of nodes and edges in a knowledge graph based on meta-analytic studies of parenting stress.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="formative_v10i1e76808_fig01.png"/></fig><p>Based on previous findings [<xref ref-type="bibr" rid="ref9">9</xref>,<xref ref-type="bibr" rid="ref10">10</xref>], as well as the premise that an accurate diagnosis is an essential component of high-quality CF [<xref ref-type="bibr" rid="ref20">20</xref>], it is posited that augmenting an LLM with a knowledge graph would result in the generation of high-quality CF. Furthermore, CF is personalized through collaboration with the client [<xref ref-type="bibr" rid="ref21">21</xref>], and personalized CF has been suggested to be more effective in treatment than nonpersonalized CF [<xref ref-type="bibr" rid="ref4">4</xref>]. Based on these previous studies, this study also investigated the personalization of CF.</p><p>As indices of CF general quality, 4 indicators (ie, correctness, completeness, consistency, and feasibility) that were used in previous research [<xref ref-type="bibr" rid="ref1">1</xref>] were used. In addition, as an index of the individual components of CF, 18 key components derived from previous research [<xref ref-type="bibr" rid="ref2">2</xref>] were used to examine their presence or absence. Moreover, a qualitative evaluation was conducted to examine CFs from multiple perspectives [<xref ref-type="bibr" rid="ref22">22</xref>]. Standardized evaluation metrics for CF were not used in this study because their reliability and validity have not yet been sufficiently established [<xref ref-type="bibr" rid="ref23">23</xref>].</p><p>The hypotheses of this study are as follows: the LLM augmented with both the knowledge graph and personalization (knowledge graph and personalization group) is expected to generate a higher-quality CF than an LLM with no augmentation (control group). For comparison, this study also created a group with an LLM augmented with a knowledge graph only (knowledge graph&#x2013;only group), a group with an LLM augmented with personalization only (personalization-only group), and a group of human therapists (expert group).</p></sec><sec id="s2" sec-type="methods"><title>Methods</title><sec id="s2-1"><title>Construction of 25 Vignettes</title><p>Clinical psychologist A, who is the sole author of a book on CF in family therapy [<xref ref-type="bibr" rid="ref24">24</xref>], created 25 fictional parenting stress vignettes. Various episodes were extracted from parenting blogs on <italic>Ameba Blog</italic>, a popular blogging platform in Japan [<xref ref-type="bibr" rid="ref25">25</xref>]. Each episode was summarized after removing personal information and commercial content (prior confirmation was obtained from the administrators of the <italic>Ameba Blog</italic>, indicating there were no issues with such usage). An example of a vignette is shown in <xref ref-type="other" rid="box1">Textbox 1</xref>. Two additional fictional parenting stress vignettes were created using the same method as that used for the preliminary datasets in order to develop the evaluation criteria.</p><boxed-text id="box1"><title> Example of a vignette.</title><p>I&#x2019;m in my 40s, raising my first son born in 2018 and my second son born in 2020 who has autism and severe intellectual disability. I'&#x2019;ve been completely exhausted from caring for my second son and have been seeing a psychiatrist. Recently, when I consulted with Child Protection Services about short-stay respite care due to parental fatigue, unexpectedly my second son was taken into temporary protective custody the very next day.</p><p>Initially, I just wanted to communicate that I was at my limit with exhaustion and needed temporary childcare. However, as I explained my situation in detail, I ended up confessing that I had been so desperate that the terrifying thought, "&#x201C;Would I feel relief if I killed my child...." had crossed my mind. I also mentioned that I had run out of my prescribed medication. This became a serious issue, and protective custody was decided that same day.</p><p>When I explained the situation to my husband, I thought he would be angry, but he just quietly cried. Seeing him like that, I felt overwhelmingly guilty. I realized I had caused a terrible situation.... I felt so sorry for my second son as well.</p><p>About a month after my son was taken into protective custody, discussions about ending the protection finally began. The conditions include arranging visiting nurses and helpers for me, and most importantly, securing regular short-stay respite care. However, although the city office had told us that finding short-stay facilities was the parents'&#x2019; responsibility, it turned out this should have been handled by the consultation service office. The city office&#x2019;s incorrect information was one factor that led to this situation.</p><p>Currently, nearby facilities are full, and we'&#x2019;re searching for short-stay options throughout the entire prefecture. I understand there may be criticism for writing this blog, but I hope my experience can be helpful to others in similar situations, so I plan to continue sharing my story.</p></boxed-text></sec><sec id="s2-2"><title>Construction of the Knowledge Graph</title><p>Semantic Scholar [<xref ref-type="bibr" rid="ref26">26</xref>] was used to search for research studies related to the following 10 phrases: &#x201C;maternal anxiety meta-analysis,&#x201D; &#x201C;parental anxiety meta-analysis,&#x201D; &#x201C;maternal depression meta-analysis,&#x201D; &#x201C;parental depression meta-analysis,&#x201D; &#x201C;autism spectrum disorder parenting meta-analysis,&#x201D; &#x201C;attention deficit hyperactivity disorder parenting meta-analysis,&#x201D; &#x201C;developmental disorder parenting meta-analysis,&#x201D; &#x201C;intellectual disabilities parenting meta-analysis,&#x201D; &#x201C;parenting child with chronic illness meta-analysis,&#x201D; and &#x201C;parenting child with chronic medical problem meta-analysis.&#x201D; Up to 500 studies were retrieved per phrase, resulting in a total of 4251 studies. Subsequently, duplicate studies based on the article IDs were removed. Additionally, studies whose titles did not include both &#x201C;meta&#x201D; and &#x201C;analysis&#x201D; were excluded, resulting in 2233 selected studies. Finally, studies without available abstracts were excluded, leaving 1544 studies. The text used in the titles and abstracts of these studies (410,654 words) served as the corpus for constructing the knowledge graph.</p><p>Next, each sentence within this corpus was translated into relational data for the knowledge graph using an LLM called Claude (Sonnet 3.5; &#x201C;Claude-3&#x2010;5-sonnet-20240620&#x201D;; Anthropic) [<xref ref-type="bibr" rid="ref27">27</xref>], which has been frequently used in clinical contexts [<xref ref-type="bibr" rid="ref28">28</xref>]. The relational data in a knowledge graph explicitly indicates the relationships between entities. For example, the sentence &#x201C;Parent Distress was positively associated with their Child Distress&#x201D; translates into relational data as &#x201C;[Parent Distress] -[:ASSOCIATED_WITH]-&#x003E; [Child Distress],&#x201D; illustrating 2 entities and their connecting relationship. This resulted in the extraction of 7740 entities and 2348 relationships. The constructed knowledge graph is depicted in <xref ref-type="fig" rid="figure1">Figure 1</xref>, where individual nodes represent entities and the edges connecting these nodes represent relationships. Knowledge graphs have also been used in clinical contexts [<xref ref-type="bibr" rid="ref19">19</xref>].</p></sec><sec id="s2-3"><title>Generation of CFs Across 5 Groups</title><p>First, for the control group, an LLM named Claude (Sonnet 3.7; &#x201C;Claude-3&#x2010;7-sonnet-20250219&#x201D;) [<xref ref-type="bibr" rid="ref27">27</xref>], which has also been used in clinical contexts [<xref ref-type="bibr" rid="ref29">29</xref>], was used with a basic prompt. It read the 25 vignettes (<xref ref-type="other" rid="box1">Textbox 1</xref>) and generated 25 CFs (<xref ref-type="fig" rid="figure2">Figure 2</xref>). Next, the personalization group incorporated a personalization prompt into the basic prompt; otherwise, the procedure was identical to that of the control group (<xref ref-type="fig" rid="figure2">Figure 2</xref>). For the knowledge graph group, the Japanese text was translated into English via Claude (Sonnet 3.7), and the previously constructed knowledge graph was queried using this translated English text. Based on prior studies [<xref ref-type="bibr" rid="ref30">30</xref>,<xref ref-type="bibr" rid="ref31">31</xref>], the similarity threshold was set at 0.9. Clinical psychologist A also judged the literature citations retrieved using this threshold to be appropriate. Relationships with similarity scores exceeding 0.9 between the English sentences and the relational data were extracted, compiled, and summarized as prior study findings (Table S1 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). These findings were used for the knowledge graph group. Additionally, the knowledge graph group used a knowledge graph prompt alongside the 25 vignettes to generate 25 CFs (<xref ref-type="fig" rid="figure2">Figure 2</xref>). In the knowledge graph and personalization groups, a personalization prompt was added to the knowledge graph group&#x2019;s prompt. Otherwise, the procedures matched those of the knowledge graph group. Finally, clinical psychologist B, a human expert who has presented as a symposium speaker on CF in family therapy [<xref ref-type="bibr" rid="ref32">32</xref>], read basic prompts, excuse prompts, and 25 vignettes, and then generated 25 CFs (<xref ref-type="fig" rid="figure2">Figure 2</xref>). Each of the 5 groups performed 25 CFs for the 25 vignettes, producing 125 CFs (5&#x00D7;25).</p><fig position="float" id="figure2"><label>Figure 2.</label><caption><p>Comparison of prompts, input, and output across 5 groups.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="formative_v10i1e76808_fig02.png"/></fig></sec><sec id="s2-4"><title>Evaluation of CFs</title><p>Clinical psychologist C, a Japanese expert who validated the assessment tools for stepfamilies in Japan [<xref ref-type="bibr" rid="ref33">33</xref>], evaluated the previously created preliminary datasets (2 vignettes) across the 5 groups. These expert CFs were conducted only for the preliminary datasets by clinical psychologist A, rather than by clinical psychologist B, and were not used in the main evaluation of the 25 vignettes. The evaluation criteria consisted of 4 items assessing the general quality of CFs (on a 7-point scale) [<xref ref-type="bibr" rid="ref1">1</xref>] and 18 items evaluating key components (presence or absence, coded as 0 or 1) [<xref ref-type="bibr" rid="ref2">2</xref>]. Based on this evaluation, clinical psychologist A suggested adjustments to ensure broader variability in general quality scores and recommended broadly defining the presence of the 18 key components. Clinical psychologist C agreed with these recommendations. Using these criteria, clinical psychologist C evaluated the 125 CFs, which were presented randomly to ensure that clinical psychologist C remained unaware of the group assignments, thus ensuring a single-blind condition.</p></sec><sec id="s2-5"><title>Statistics</title><p>A one-factor ANOVA was performed to determine the effects of the 5 groups on the quality of the CF. The Tukey multiple comparison test was used for comparisons between groups.</p></sec><sec id="s2-6"><title>Ethical Considerations</title><p>This study did not involve experimental participants, nor did it include personal data; therefore, an ethical review of personal data was not required.</p></sec></sec><sec id="s3" sec-type="results"><title>Results</title><sec id="s3-1"><title>Comparison of Text Style Among the 5 Groups</title><p>Before testing our hypotheses, we compared the length of the CF texts across the 5 groups (<xref ref-type="table" rid="table1">Table 1</xref>). As shown in <xref ref-type="table" rid="table1">Table 1</xref>, the number of characters in CFs produced by human experts was significantly lower than that of the 4 LLM conditions. Although the evaluator was blinded to the source of each CF, it is possible that the evaluator inferred human authorship based on text length. Therefore, the results should be interpreted with caution.</p><table-wrap id="t1" position="float"><label>Table 1.</label><caption><p>Comparison of sentence structure, general quality, and individual key components of the 25 case formulations across the 5 groups. The significant differences in evaluation indicators were confirmed by multiple comparisons using the Tukey test.</p></caption><table id="table1" frame="hsides" rules="groups"><thead><tr><td align="left" valign="top" rowspan="2"/><td align="left" valign="top" rowspan="2">Control, mean (SD)</td><td align="left" valign="top" rowspan="2">Personalization, mean (SD)</td><td align="left" valign="top" rowspan="2">KG<sup><xref ref-type="table-fn" rid="table1fn1">a</xref></sup>, mean (SD)</td><td align="left" valign="top" rowspan="2">KG_P<sup><xref ref-type="table-fn" rid="table1fn2">b</xref></sup>, mean (SD)</td><td align="left" valign="top" rowspan="2">Expert, mean (SD)</td><td align="left" valign="top" colspan="2">Statistics</td></tr><tr><td align="left" valign="top">F test (<italic>df</italic>)</td><td align="left" valign="top"><italic>P</italic> value</td></tr><tr><td align="left" valign="top" colspan="8">Sentence structure</td></tr></thead><tbody><tr><td align="left" valign="top">&#x2003;Number of characters<sup><xref ref-type="table-fn" rid="table1fn3">c</xref></sup></td><td align="left" valign="top">885.4 (143.1)</td><td align="left" valign="top">1002.3 (142.6)</td><td align="left" valign="top">1040.2 (135.0)</td><td align="left" valign="top">1218.8 (155.1)</td><td align="left" valign="top">542.0 (182.2)</td><td align="left" valign="top">68.01 (4, 120)</td><td align="left" valign="top">&#x003C;.001<sup><xref ref-type="table-fn" rid="table1fn4">d</xref></sup></td></tr><tr><td align="left" valign="top" colspan="8">General qualities</td></tr><tr><td align="left" valign="top">&#x2003;Consistency<sup><xref ref-type="table-fn" rid="table1fn5">e</xref></sup></td><td align="left" valign="top">5.36 (0.81)</td><td align="left" valign="top">5.72 (0.46)</td><td align="left" valign="top">5.64 (0.49)</td><td align="left" valign="top">5.80 (0.50)</td><td align="left" valign="top">6.20 (0.91)</td><td align="left" valign="top">5.28 (4, 120)</td><td align="left" valign="top">.001<sup><xref ref-type="table-fn" rid="table1fn4">d</xref></sup></td></tr><tr><td align="left" valign="top">&#x2003;Correctness<sup><xref ref-type="table-fn" rid="table1fn6">f</xref></sup></td><td align="left" valign="top">4.56 (0.77)</td><td align="left" valign="top">5.16 (0.99)</td><td align="left" valign="top">5.96 (0.73)</td><td align="left" valign="top">6.00 (0.91)</td><td align="left" valign="top">5.12 (1.01)</td><td align="left" valign="top">11.88 (4, 120)</td><td align="left" valign="top">&#x003C;.001<sup><xref ref-type="table-fn" rid="table1fn4">d</xref></sup></td></tr><tr><td align="left" valign="top">&#x2003;Completeness<sup><xref ref-type="table-fn" rid="table1fn7">g</xref></sup></td><td align="left" valign="top">4.60 (0.76)</td><td align="left" valign="top">5.28 (0.74)</td><td align="left" valign="top">6.12 (0.60)</td><td align="left" valign="top">5.92 (0.91)</td><td align="left" valign="top">4.32 (0.90)</td><td align="left" valign="top">24.95 (4, 120)</td><td align="left" valign="top">&#x003C;.001<sup><xref ref-type="table-fn" rid="table1fn4">d</xref></sup></td></tr><tr><td align="left" valign="top">&#x2003;Feasibility<sup><xref ref-type="table-fn" rid="table1fn8">h</xref></sup></td><td align="left" valign="top">4.76 (1.01)</td><td align="left" valign="top">5.32 (0.56)</td><td align="left" valign="top">5.48 (0.51)</td><td align="left" valign="top">5.56 (0.92)</td><td align="left" valign="top">5.12 (0.88)</td><td align="left" valign="top">4.00 (4, 120)</td><td align="left" valign="top">.004<sup><xref ref-type="table-fn" rid="table1fn9">i</xref></sup></td></tr><tr><td align="left" valign="top" colspan="8">Individual key components</td></tr><tr><td align="left" valign="top">&#x2003;List of problems</td><td align="left" valign="top">0.04 (0.20)</td><td align="left" valign="top">0.04 (0.20)</td><td align="left" valign="top">0.08 (0.28)</td><td align="left" valign="top">0.16 (0.37)</td><td align="left" valign="top">0.12 (0.33)</td><td align="left" valign="top">0.84 (4, 120)</td><td align="left" valign="top">.51</td></tr><tr><td align="left" valign="top">&#x2003;Sociocultural factors</td><td align="left" valign="top">0.04 (0.20)</td><td align="left" valign="top">0.00 (0.00)</td><td align="left" valign="top">0.00 (0.00)</td><td align="left" valign="top">0.00 (0.00)</td><td align="left" valign="top">0.00 (0.00)</td><td align="left" valign="top">1.00 (4, 120)</td><td align="left" valign="top">.41</td></tr><tr><td align="left" valign="top">&#x2003;Tailored language and metaphors</td><td align="left" valign="top">0.08 (0.28)</td><td align="left" valign="top">0.36 (0.49)</td><td align="left" valign="top">0.20 (0.41)</td><td align="left" valign="top">0.08 (0.28)</td><td align="left" valign="top">0.12 (0.33)</td><td align="left" valign="top">2.60 (4, 120)</td><td align="left" valign="top">.04<sup><xref ref-type="table-fn" rid="table1fn10">j</xref></sup></td></tr><tr><td align="left" valign="top">&#x2003;Perpetuating factors</td><td align="left" valign="top">0.04 (0.20)</td><td align="left" valign="top">0.00 (0.00)</td><td align="left" valign="top">0.00 (0.00)</td><td align="left" valign="top">0.08 (0.28)</td><td align="left" valign="top">0.04 (0.20)</td><td align="left" valign="top">0.89 (4, 120)</td><td align="left" valign="top">.47</td></tr><tr><td align="left" valign="top">&#x2003;Protective factors</td><td align="left" valign="top">0.44 (0.51)</td><td align="left" valign="top">0.28 (0.46)</td><td align="left" valign="top">0.36 (0.49)</td><td align="left" valign="top">0.44 (0.51)</td><td align="left" valign="top">0.36 (0.49)</td><td align="left" valign="top">0.47 (4, 120)</td><td align="left" valign="top">.76</td></tr><tr><td align="left" valign="top">&#x2003;Personal meaning</td><td align="left" valign="top">0.16 (0.37)</td><td align="left" valign="top">0.08 (0.28)</td><td align="left" valign="top">0.08 (0.28)</td><td align="left" valign="top">0.08 (0.28)</td><td align="left" valign="top">0.04 (0.20)</td><td align="left" valign="top">0.59 (4, 120)</td><td align="left" valign="top">.67</td></tr><tr><td align="left" valign="top">&#x2003;Accessible language<sup><xref ref-type="table-fn" rid="table1fn11">k</xref></sup></td><td align="left" valign="top">0.64 (0.49)</td><td align="left" valign="top">0.76 (0.44)</td><td align="left" valign="top">0.80 (0.41)</td><td align="left" valign="top">0.64 (0.49)</td><td align="left" valign="top">1.00 (0.00)</td><td align="left" valign="top">3.27 (4, 120)</td><td align="left" valign="top">.01<sup><xref ref-type="table-fn" rid="table1fn10">j</xref></sup></td></tr><tr><td align="left" valign="top">&#x2003;Physiological effects</td><td align="left" valign="top">0.00 (0.00)</td><td align="left" valign="top">0.00 (0.00)</td><td align="left" valign="top">0.04 (0.20)</td><td align="left" valign="top">0.08 (0.28)</td><td align="left" valign="top">0.00 (0.00)</td><td align="left" valign="top">1.37 (4, 120)</td><td align="left" valign="top">.25</td></tr><tr><td align="left" valign="top">&#x2003;Organic causes</td><td align="left" valign="top">0.08 (0.28)</td><td align="left" valign="top">0.04 (0.20)</td><td align="left" valign="top">0.08 (0.28)</td><td align="left" valign="top">0.16 (0.37)</td><td align="left" valign="top">0.04 (0.20)</td><td align="left" valign="top">0.80 (4, 120)</td><td align="left" valign="top">.53</td></tr><tr><td align="left" valign="top">&#x2003;Recent history</td><td align="left" valign="top">0.00 (0.00)</td><td align="left" valign="top">0.00 (0.00)</td><td align="left" valign="top">0.00 (0.00)</td><td align="left" valign="top">0.00 (0.00)</td><td align="left" valign="top">0.00 (0.00)</td><td align="left" valign="top">&#x2014;<sup><xref ref-type="table-fn" rid="table1fn12">l</xref></sup></td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top">&#x2003;Coping strategies<sup><xref ref-type="table-fn" rid="table1fn13">m</xref></sup></td><td align="left" valign="top">0.44 (0.51)</td><td align="left" valign="top">0.36 (0.49)</td><td align="left" valign="top">0.52 (0.51)</td><td align="left" valign="top">0.32 (0.48)</td><td align="left" valign="top">0.04 (0.20)</td><td align="left" valign="top">4.07 (4, 120)</td><td align="left" valign="top">.004<sup><xref ref-type="table-fn" rid="table1fn9">i</xref></sup></td></tr><tr><td align="left" valign="top">&#x2003;Maintenance patterns</td><td align="left" valign="top">0.08 (0.28)</td><td align="left" valign="top">0.00 (0.00)</td><td align="left" valign="top">0.08 (0.28)</td><td align="left" valign="top">0.08 (0.28)</td><td align="left" valign="top">0.12 (0.33)</td><td align="left" valign="top">0.71 (4, 120)</td><td align="left" valign="top">.59</td></tr><tr><td align="left" valign="top">&#x2003;Relationship dynamics</td><td align="left" valign="top">0.28 (0.46)</td><td align="left" valign="top">0.20 (0.41)</td><td align="left" valign="top">0.32 (0.48)</td><td align="left" valign="top">0.28 (0.46)</td><td align="left" valign="top">0.32 (0.48)</td><td align="left" valign="top">0.29 (4, 120)</td><td align="left" valign="top">.89</td></tr><tr><td align="left" valign="top">&#x2003;Strengths and achievements</td><td align="left" valign="top">0.72 (0.46)</td><td align="left" valign="top">0.72 (0.46)</td><td align="left" valign="top">0.80 (0.41)</td><td align="left" valign="top">0.68 (0.48)</td><td align="left" valign="top">0.68 (0.48)</td><td align="left" valign="top">0.29 (4, 120)</td><td align="left" valign="top">.89</td></tr><tr><td align="left" valign="top">&#x2003;Childhood history</td><td align="left" valign="top">0.00 (0.00)</td><td align="left" valign="top">0.00 (0.00)</td><td align="left" valign="top">0.00 (0.00)</td><td align="left" valign="top">0.00 (0.00)</td><td align="left" valign="top">0.00 (0.00)</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top">&#x2003;Cognitive schemas</td><td align="left" valign="top">0.04 (0.20)</td><td align="left" valign="top">0.00 (0.00)</td><td align="left" valign="top">0.00 (0.00)</td><td align="left" valign="top">0.04 (0.20)</td><td align="left" valign="top">0.08 (0.28)</td><td align="left" valign="top">0.89 (4, 120)</td><td align="left" valign="top">.47</td></tr><tr><td align="left" valign="top">&#x2003;Meaning making<sup><xref ref-type="table-fn" rid="table1fn14">n</xref></sup></td><td align="left" valign="top">0.20 (0.41)</td><td align="left" valign="top">0.48 (0.51)</td><td align="left" valign="top">0.24 (0.44)</td><td align="left" valign="top">0.36 (0.49)</td><td align="left" valign="top">0.12 (0.33)</td><td align="left" valign="top">2.59 (4, 120)</td><td align="left" valign="top">.04<sup><xref ref-type="table-fn" rid="table1fn10">j</xref></sup></td></tr><tr><td align="left" valign="top">&#x2003;Perceived support</td><td align="left" valign="top">0.00 (0.00)</td><td align="left" valign="top">0.00 (0.00)</td><td align="left" valign="top">0.00 (0.00)</td><td align="left" valign="top">0.04 (0.20)</td><td align="left" valign="top">0.04 (0.20)</td><td align="left" valign="top">0.75 (4, 120)</td><td align="left" valign="top">0.56</td></tr></tbody></table><table-wrap-foot><fn id="table1fn1"><p><sup>a</sup>KG: knowledge graph.</p></fn><fn id="table1fn2"><p><sup>b</sup>KG_P: knowledge graph with personalization.</p></fn><fn id="table1fn3"><p><sup>c</sup>&#x201C;Control &#x003C; expert: <italic>P</italic>&#x003C;.001; control &#x003C; KG_P: <italic>P</italic>=.004; expert&#x003C; KG: <italic>P</italic>&#x003C;.001; expert &#x003C; KG_P: <italic>P</italic>&#x003C;.001; expert &#x003C; personalization: <italic>P</italic>=.006; and KG_P &#x003C; personalization: <italic>P</italic>&#x003C;.001. </p></fn><fn id="table1fn4"><p><sup>d</sup>***<italic>P</italic>&#x003C;.001.</p></fn><fn id="table1fn5"><p><sup>e</sup>Control &#x003C; expert: <italic>P</italic>=.002 and KG &#x003C; expert: <italic>P</italic>=.03. </p></fn><fn id="table1fn6"><p><sup>f</sup>Control &#x003C; KG: <italic>P</italic>&#x003C;.001; control &#x003C; KG_P: <italic>P</italic>&#x003C;.001; expert &#x003C; KG: <italic>P</italic>=.01; expert &#x003C; KG_P: <italic>P</italic>=.006; personalization &#x003C; KG: <italic>P</italic>=.02; and personalization &#x003C; KG_P: <italic>P</italic>=.01. </p></fn><fn id="table1fn7"><p><sup>g</sup>Control &#x003C; KG: <italic>P</italic>&#x003C;.001; control &#x003C; KG_P: <italic>P</italic>&#x003C;.001; control &#x003C; personalization: <italic>P</italic>=.02; expert &#x003C; KG: <italic>P</italic>&#x003C;.001; expert&#x003C;KG_P: <italic>P</italic>&#x003C;.001; expert &#x003C; personalization: <italic>P</italic>=.003; personalization &#x003C; KG: <italic>P</italic>=.002; and personalization &#x003C; KG_P: <italic>P</italic>=.04. </p></fn><fn id="table1fn8"><p><sup>h</sup>Control &#x003C; KG: <italic>P</italic>=.02 and control &#x003C; KG_P: <italic>P</italic>=.005. </p></fn><fn id="table1fn9"><p><sup>i</sup>**<italic>P</italic>&#x003C;.01.</p></fn><fn id="table1fn10"><p><sup>j</sup>*<italic>P</italic>&#x003C;.05.</p></fn><fn id="table1fn11"><p><sup>k</sup>Control &#x003C; expert: <italic>P</italic>=.02 and KG_P &#x003C; expert: <italic>P</italic>=.02. </p></fn><fn id="table1fn12"><p><sup>l</sup>Not applicable.</p></fn><fn id="table1fn13"><p><sup>m</sup>Expert &#x003C; control: <italic>P</italic>=.02&#x201D; and &#x201C;expert &#x003C; KG: <italic>P</italic>=.003. </p></fn><fn id="table1fn14"><p><sup>n</sup>Expert &#x003C; personalization: <italic>P</italic>=.04.  </p></fn></table-wrap-foot></table-wrap></sec><sec id="s3-2"><title>Evaluation of the General Quality of CF</title><p>The general quality of CF was evaluated (<xref ref-type="table" rid="table1">Table 1</xref>). Regarding consistency, the expert CFs showed significantly higher scores than the machine-generated CFs (<xref ref-type="fig" rid="figure3">Figure 3A</xref>). Regarding correctness, both the knowledge graph group and the knowledge graph with personalization group demonstrated significantly higher scores than the control group (<xref ref-type="fig" rid="figure3">Figure 3D</xref>). Surprisingly, the correctness scores of the knowledge graph and knowledge graph with personalization groups were significantly higher than those of the expert group (<xref ref-type="table" rid="table1">Table 1</xref>). Similar results were confirmed for completeness, indicating that both the knowledge graph group and the knowledge graph with personalization group had significantly higher completeness scores than the control group (<xref ref-type="fig" rid="figure3">Figure 3C</xref>). The completeness scores of these 2 groups were also significantly higher than those of the expert group (<xref ref-type="table" rid="table1">Table 1</xref>). Regarding feasibility, the knowledge graph group and the knowledge graph with personalization group showed significantly higher scores than the control group (<xref ref-type="fig" rid="figure3">Figure 3B</xref>). However, there was no significant difference in feasibility between the 2 groups. These results suggest that the correctness and completeness of CF can be improved by incorporating a meta-analysis knowledge graph. Although the consistency of the machine-generated CF did not reach human expert levels, providing machines with knowledge graphs allowed the feasibility to reach levels comparable to those of experts.</p><fig position="float" id="figure3"><label>Figure 3.</label><caption><p>Impact of the knowledge graph (KG) on the general quality of the case formulation. (A) Consistency; (B) Feasibility; (C) Completeness; (D) Correctness. KG: knowledge gap; KG_P: Knowledge graph with personalization.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="formative_v10i1e76808_fig03.png"/></fig></sec><sec id="s3-3"><title>Evaluation of Key Components in CF</title><p>The key components of CF were compared (<xref ref-type="table" rid="table1">Table 1</xref>). For the accessible language component, the expert group scored significantly higher than the control group and the knowledge graph with personalization group (<xref ref-type="fig" rid="figure4">Figure 4A</xref>). Regarding the mean-making component, the personalization group scored significantly higher than the expert group (<xref ref-type="fig" rid="figure4">Figure 4B</xref>). These findings suggest that human experts are more likely to use accessible language than machines and that personalization prompts might increase the mean-making components within the CF.</p><fig position="float" id="figure4"><label>Figure 4.</label><caption><p>Group comparisons for accessible language (A) and mean-making (B) components in the case formulation. KG: knowledge graph; KG_P: knowledge graph with personalization. *<italic>P</italic>&#x003C;.05.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="formative_v10i1e76808_fig04.png"/></fig></sec><sec id="s3-4"><title>Qualitative Analysis of CF</title><p>A qualitative analysis of the CFs from the 5 groups based on the vignette in <xref ref-type="other" rid="box1">Textbox 1</xref> was conducted (<xref ref-type="table" rid="table2">Table 2</xref>). Concerning the use of prior study findings, citations were present in the knowledge graph and the knowledge graph with personalization groups, but absent in the control, personalization, and expert groups (<xref ref-type="table" rid="table2">Table 2</xref>). Considering that human experts typically require more time to conduct literature searches, leading to fewer citations during CF [<xref ref-type="bibr" rid="ref14">14</xref>], it is possible that the control, personalization, and expert groups did not perform adequate literature searches during CF creation. In contrast, the knowledge graph and knowledge graph with personalization groups were provided with a list of relevant prior study findings in advance (<xref ref-type="fig" rid="figure2">Figure 2</xref>; Table S1 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>), facilitating easier use of prior study findings.</p><table-wrap id="t2" position="float"><label>Table 2.</label><caption><p>Comparison of evidence use and reframing practices among the 5 groups.</p></caption><table id="table2" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom"/><td align="left" valign="bottom">Control</td><td align="left" valign="bottom">Personalization</td><td align="left" valign="bottom">KG<sup><xref ref-type="table-fn" rid="table2fn1">a</xref></sup></td><td align="left" valign="bottom">KG_P<sup><xref ref-type="table-fn" rid="table2fn2">b</xref></sup></td><td align="left" valign="bottom">Expert</td></tr></thead><tbody><tr><td align="left" valign="top">Use of prior study findings</td><td align="left" valign="top">None</td><td align="left" valign="top">None</td><td align="left" valign="top">&#x201C;Insights from research<break/>indicates that parental stress, anxiety, and depression can also impact a child&#x2019;s condition. Thus, caring for yourself is crucial for your child&#x2019;s well-being as well. Parents of children with developmental disabilities are particularly prone to experiencing high stress levels, and early support has been shown to positively affect the health of both parents and children.&#x201D;</td><td align="left" valign="top"><list list-type="bullet"><list-item><p>&#x201C;However, research clearly shows that such thoughts arise from extreme fatigue and stress, and parental stress closely relates to a child&#x2019;s condition.&#x201D;</p></list-item><list-item><p>&#x201C;Research indicates that paternal depression also affects children&#x2019;s behavior.&#x201D;</p></list-item><list-item><p>&#x201C;Research shows autism spectrum disorder (ASD) is associated with restricted and repetitive behaviors.&#x201D;</p></list-item></list></td><td align="left" valign="top">None</td></tr><tr><td align="left" valign="top">Content reframing the client&#x2019;s self-blame</td><td align="left" valign="top">&#x201C;First, reaching out to the Child Guidance Center for help was a very courageous and appropriate decision. Recognizing your limits and seeking support is a sign of being a good parent. The resulting temporary protective custody may have been unexpected, but it was likely a necessary step to ensure the safety of yourself, your younger son, and your entire family.&#x201D;</td><td align="left" valign="top">Raising a child with autism and severe intellectual disabilities involves unimaginable difficulties. You seem to be blaming yourself for having had the thought, &#x2019;Wouldn&#x2019;t it be easier if I killed my child?&#x2019; However, please remember that this was a temporary thought arising from extreme exhaustion and overwhelming stress&#x2014;it does not make you a bad parent. Rather, seeking help when these thoughts occurred was an incredibly brave action on your part.&#x201D;</td><td align="left" valign="top">&#x201C;You might be experiencing guilt and regret because your consultation with the Child Guidance Center unexpectedly led to temporary protective custody. However, this situation is not a &#x2018;failure&#x2019; on your part. Rather, seeking help when you felt overwhelmed demonstrates responsible parenting.&#x201D;</td><td align="left" valign="top"><list list-type="bullet"><list-item><p>&#x201C;Let go of the self-blame (&#x2018;It&#x2019;s my fault this happened&#x2018;). Instead, recognize that your decision to seek help was an essential first step toward receiving future support.<italic>&#x201D;</italic></p></list-item></list></td><td align="left" valign="top">&#x201C;I think it is very meaningful that you have put your experiences into words and shared them up to this point. Particularly, the thought, &#x2018;Wouldn&#x2019;t it be easier if I killed my child&#x2026;?&#x2019; is something that must have been incredibly difficult for anyone to say out loud. Nevertheless, honestly expressing this was an essential SOS&#x2014;a significant signal that you were hurting and needed help. The fact that you had the strength to send this SOS is extremely important.</td></tr><tr><td align="left" valign="top">Client expressions used during reframing</td><td align="left" valign="top">None</td><td align="left" valign="top">&#x201C;Wouldn&#x2019;t it be easier if I killed my child?&#x201D;</td><td align="left" valign="top">&#x201C;Failure&#x201D;</td><td align="left" valign="top"><list list-type="bullet"><list-item><p>&#x201C;It&#x2019;s my fault this happened&#x201D;</p></list-item></list></td><td align="left" valign="top">&#x201C;Wouldn&#x2019;t it be easier if I killed my child&#x2026;?&#x201D;</td></tr><tr><td align="left" valign="top">Comments after response and evaluation</td><td align="left" valign="top" colspan="4">&#x201C;While evaluating, I felt that the KG and KG_P models were highly comprehensive and accurate, and thus suitable for comparative purposes during the training process of psychologists. I believe they can be sufficiently utilized. Additionally, although some expressions appeared slightly unnatural if directly returned to the client, and these issues could be resolved if humans modify the outputs as necessary. Therefore, even for experienced psychologists, the use of these models might serve as supportive tools in preventing omissions.&#x201D; (Evaluator, clinical psychologist C)</td><td align="left" valign="top">&#x201C;When creating the CF, I was particularly mindful of the client&#x2019;s perspective, anticipating that they would read it. Due to the significant amount of information, I was concerned whether clients could fully absorb it, so I selectively included content that I deemed manageable for the current client and omitted content that might be less accessible. Particularly in severe cases, while a diagnostic impression existed, there were instances where I was uncertain whether directly confronting the client with such information was appropriate.&#x201D; (Respondent, clinical psychologist B)</td></tr></tbody></table><table-wrap-foot><fn id="table2fn1"><p><sup>a</sup>KG: Knowledge graph.</p></fn><fn id="table2fn2"><p><sup>b</sup>KG_P: Knowledge graph with personalization.</p></fn></table-wrap-foot></table-wrap><p>The CFs were also examined from a reframing perspective. Reframing involves therapists actively attempting to transform their clients&#x2019; thoughts, which is a common technique in family therapy [<xref ref-type="bibr" rid="ref34">34</xref>]. The vignette in <xref ref-type="other" rid="box1">Textbox 1</xref> depicts a mother expressing self-blame, making reframing particularly applicable [<xref ref-type="bibr" rid="ref35">35</xref>]. All 5 groups applied reframing to this aspect (<xref ref-type="table" rid="table2">Table 2</xref>). While reframing recommends directly using client phrases [<xref ref-type="bibr" rid="ref36">36</xref>], only the expert, personalization, and knowledge graph with personalization groups adhered to this recommendation (<xref ref-type="table" rid="table2">Table 2</xref>). The control group did not use client expressions during reframing and the knowledge graph group used only single words, suggesting that they did not fully adhere to this recommendation (<xref ref-type="table" rid="table2">Table 2</xref>). This analysis indicates that personalization prompts facilitate the extraction of client-specific expressions, enhancing mean-making within CF.</p><p><xref ref-type="table" rid="table2">Table 2</xref> also includes comments from the experts following their responses and evaluations. The responding expert (clinical psychologist B) indicated a deliberate practice of writing only content considered easily acceptable to the recipient rather than exhaustively documenting the entirety of the CF. This practice is thought to contribute to the higher consistency observed in human-generated CFs compared to those generated by machines. Furthermore, an evaluation expert (clinical psychologist C) pointed out the unnatural expressions present in machine-generated CFs when directly returned to clients. This observation aligns with the lower scores for accessible language found in machine-generated CFs compared to human-generated CFs.</p></sec></sec><sec id="s4" sec-type="discussion"><title>Discussion</title><sec id="s4-1"><title>Main Findings</title><p>This study demonstrates that the correctness and completeness of CF increase when using a knowledge graph based on meta-analyses. In addition, the use of a knowledge graph resulted in the feasibility of CF reaching a level comparable to that of human experts. These findings support the validity of the evidence-based CF model [<xref ref-type="bibr" rid="ref12">12</xref>]. Incorporating the findings of meta-analytic studies into CF has 3 advantages. First, integrating academic findings enhances the accuracy of CF content [<xref ref-type="bibr" rid="ref12">12</xref>]. Second, the inclusion of diverse academic findings increases CF completeness [<xref ref-type="bibr" rid="ref15">15</xref>]. Third, because meta-analyses often include specific therapeutic methods, their incorporation into CF enhances feasibility [<xref ref-type="bibr" rid="ref13">13</xref>]. This study provides concrete data to support the validity of the evidence-based CF model [<xref ref-type="bibr" rid="ref12">12</xref>]. This study is valuable in that it enhances CF by incorporating a knowledge graph derived from meta-analytic findings into an LLM. Although previous studies have applied knowledge graphs to diagnostic assessment [<xref ref-type="bibr" rid="ref30">30</xref>,<xref ref-type="bibr" rid="ref31">31</xref>], research using knowledge graphs specifically for CF remains scarce. This study is novel in demonstrating that the use of a knowledge graph can improve the quality of CF. Furthermore, previous CF research has predominantly focused on cognitive-behavioral therapy in Western countries [<xref ref-type="bibr" rid="ref2">2</xref>,<xref ref-type="bibr" rid="ref23">23</xref>]; incorporating Asian family therapy has expanded the cultural diversity of CF research [<xref ref-type="bibr" rid="ref1">1</xref>].</p></sec><sec id="s4-2"><title>Strengths of Human Experts</title><p>Regarding consistency, the influence of the knowledge graph was minimal, and human expert CF generally scored higher than machine-generated CF. Human experts summarized the content in paragraphs rather than bullet points, potentially contributing to their higher consistency scores. In addition, human experts included more elements of accessible language than machines. Although the machines were prompted to use simple language and adhere to these instructions, the human experts still exhibited more explicit emotional expressions. The experts effectively combined the expressions presented in the vignettes to convey nuanced meanings. Nuanced expression is a difficult area for LLMs. Although LLMs may have an advantage over the general population [<xref ref-type="bibr" rid="ref37">37</xref>], human experts currently show an advantage, and a similar trend arises in a variety of specialties [<xref ref-type="bibr" rid="ref38">38</xref>].</p></sec><sec id="s4-3"><title>Effects of Personalization</title><p>Personalization had a limited impact on the general quality or specific key components of CF, which is inconsistent with previous findings [<xref ref-type="bibr" rid="ref4">4</xref>,<xref ref-type="bibr" rid="ref21">21</xref>]. However, qualitative analysis indicated that personalization facilitates the extraction of client-specific expressions, promoting mean-making within CF. During vignette creation, writer-specific expressions were likely diminished because of the removal of proper nouns, potentially obscuring the personalization effect. Individual-specific expressions may also have been lost during the summarization process. One previous study has demonstrated that a 2-stage approach&#x2014;first summarizing individual-specific characteristics and subsequently performing diagnostic reasoning&#x2014;yields higher diagnostic accuracy in LLMs than direct diagnosis alone [<xref ref-type="bibr" rid="ref28">28</xref>]. Accordingly, adopting a 2-stage approach in which individual-specific expressions are first extracted and then used to generate CFs may facilitate the development of CFs that better capture individual-specific characteristics. Future research should use longer vignettes with more writer-specific expressions and a 2-stage approach to better examine personalization effects [<xref ref-type="bibr" rid="ref4">4</xref>].</p></sec><sec id="s4-4"><title>Practical Implications</title><p>This study has 2 practical implications. First, knowledge of graph-generated CF can be used to train novice therapists [<xref ref-type="bibr" rid="ref11">11</xref>]. Novice therapists can compare their CFs with machine-generated CFs based on knowledge graphs, which helps them identify missing perspectives or components in their formulations [<xref ref-type="bibr" rid="ref39">39</xref>]. Second, knowledge of graph-generated CFs can support expert therapists. Experts often lack time for literature searches, resulting in limited citations of previous research [<xref ref-type="bibr" rid="ref14">14</xref>]. Machines can automatically extract meta-analytic literature data and present experts with current evidence, thereby improving CF quality through the timely integration of such evidence [<xref ref-type="bibr" rid="ref15">15</xref>]. Since the knowledge extracted from meta-analyses may remain at a relatively superficial level, and even when the cited knowledge is accurate, its application in practice requires careful consideration to avoid placing undue burden on clients [<xref ref-type="bibr" rid="ref30">30</xref>,<xref ref-type="bibr" rid="ref31">31</xref>]. Therefore, when such knowledge is used in clinical settings, professional experience and ethical judgment are essential [<xref ref-type="bibr" rid="ref28">28</xref>]. Indeed, the clinician involved in this study reported intentionally reducing the length of the CF to minimize the client&#x2019;s burden. Because CF generation by machines is less time-consuming and more cost-effective [<xref ref-type="bibr" rid="ref8">8</xref>], appropriately reviewing machine-generated CFs by human experts could contribute to improving the quality of CFs produced by humans.</p></sec><sec id="s4-5"><title>Limitations</title><p>This study has 4 limitations. First, there was a potential bias in the constructed data, as only 1 individual was involved in vignette creation, 1 in response, and 1 in evaluation. Because this study used only a single evaluator, interrater reliability could not be calculated. The scores used as the evaluation metric could not be examined in relation to other external measures, and thus the validity of the metric was not established. In addition, because test-retest assessments were not conducted for this measure, test-retest reliability could not be calculated. To ensure the reliability and validity of these measures, future research should incorporate test-retest evaluations and CF measures with established validity [<xref ref-type="bibr" rid="ref8">8</xref>]. Securing multiple vignette creators, respondents, and evaluators can prevent such bias [<xref ref-type="bibr" rid="ref2">2</xref>]. Second, human experts&#x2019; CFs differed significantly from machine-generated CFs in style and length, potentially enabling evaluators to infer human authorship despite the blinded condition. Evaluators may have identified and preferentially rated the machine responses negatively [<xref ref-type="bibr" rid="ref40">40</xref>]. Because the CFs produced by human experts were shorter, the evaluator may have recognized them as being authored by human experts. This recognition may have contributed to the higher consistency ratings observed for the human expert condition. Future research should standardize the length and style of responses to ensure more robust blinding. Third, vignette-style presentation may not be the optimal way to present clinical cases. Presenting clinical cases in a vignette style reportedly resulted in lower diagnostic accuracy among human experts compared with presentations that list symptoms alone [<xref ref-type="bibr" rid="ref41">41</xref>]. Similarly, when LLMs evaluate cases presented in a vignette style, they tend to generate an excessive number of diagnoses [<xref ref-type="bibr" rid="ref42">42</xref>]. Therefore, future studies should examine the quality of CF using a format in which symptoms are presented solely as structured lists. Fourth, qualitative analysis in this study did not use thematic analysis [<xref ref-type="bibr" rid="ref43">43</xref>]. In future research, more comprehensive qualitative analyses could be achieved by conducting thematic analysis and ensuring transparency in the coding process.</p></sec><sec id="s4-6"><title>Conclusions</title><p>Despite these limitations, our study demonstrated the effectiveness of knowledge graphs in enhancing the general quality of CF, which is consistent with studies showing the usefulness of knowledge graphs in the clinical domain [<xref ref-type="bibr" rid="ref9">9</xref>,<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref16">16</xref>-<xref ref-type="bibr" rid="ref19">19</xref>]. A comparison of human and machine-generated CFs also highlighted human strengths in terms of clarity and machine strengths in terms of completeness and correctness. Future studies should demonstrate improvements in the quality of therapist-generated CFs by presenting machine-generated CFs with meta-analysis knowledge graphs to novice and expert therapists [<xref ref-type="bibr" rid="ref5">5</xref>]. Using machines as supplementary tools to enhance CF quality will enable therapists to rapidly produce high-quality CFs [<xref ref-type="bibr" rid="ref3">3</xref>], ultimately improving the mental health services provided to many individuals [<xref ref-type="bibr" rid="ref20">20</xref>].</p></sec></sec></body><back><ack><p>This study was partially presented in Japanese as a poster at the 89th Annual Convention of the Japanese Psychological Association in 2025. In this study, ChatGPT (GPT-5) was used to assist with computer-program code generation and the translation of Japanese manuscripts into English. All artificial intelligence (AI)-assisted outputs were subsequently reviewed and substantially revised by the authors. The authors declare the use of generative AI in the research and writing process. According to the GAIDeT taxonomy (2026) [<xref ref-type="bibr" rid="ref44">44</xref>], the following tasks were delegated to generative AI (GAI) tools under full human supervision: code generation, code optimization, data collection, and translation. The GAI tools used were: ChatGPT (GPT-4.1, GPT-5, GPT-5.1, GPT-5.2, GPT-5.3, and GPT-5.4) and Claude (Sonnet 3.5 and Sonnet 3.7). The responsibility for the final manuscript lies entirely with the authors. GAI tools are not listed as authors and do not bear responsibility for the final outcomes.</p></ack><notes><sec><title>Funding</title><p>This study was financially supported by the Japan Society for the Promotion of Science (grant 23H00080).</p></sec><sec><title>Data Availability</title><p>Data supporting the findings of this study are available from the corresponding author (KY) upon reasonable request.</p></sec></notes><fn-group><fn fn-type="con"><p>Conceptualization: KY</p><p>Data curation: KY</p><p>Formal analysis: KY</p><p>Funding acquisition: KY</p><p>Investigation: KY, YJ, KK</p><p>Methodology: KY</p><p>Project administration: KY</p><p>Resources: YJ, KK</p><p>Software: KY</p><p>Validation: KY</p><p>Visualization: KY</p><p>Writing &#x2013; original draft: KY</p><p>Writing &#x2013; review &#x0026; editing: KY</p></fn><fn fn-type="conflict"><p>None declared.</p></fn></fn-group><glossary><title>Abbreviations</title><def-list><def-item><term id="abb1">CF</term><def><p>case formulation</p></def></def-item><def-item><term id="abb2">LLM</term><def><p>large language model</p></def></def-item></def-list></glossary><ref-list><title>References</title><ref id="ref1"><label>1</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Hsieh</surname><given-names>LH</given-names> </name><name name-style="western"><surname>Liao</surname><given-names>WC</given-names> </name><name name-style="western"><surname>Liu</surname><given-names>EY</given-names> </name></person-group><article-title>Feasibility assessment of using ChatGPT for training case conceptualization skills in psychological counseling</article-title><source>Comput Hum Behav Artif Hum</source><year>2024</year><month>08</month><volume>2</volume><issue>2</issue><fpage>100083</fpage><pub-id pub-id-type="doi">10.1016/j.chbah.2024.100083</pub-id></nlm-citation></ref><ref id="ref2"><label>2</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Thrower</surname><given-names>NE</given-names> </name><name name-style="western"><surname>Bucci</surname><given-names>S</given-names> </name><name name-style="western"><surname>Morris</surname><given-names>L</given-names> </name><name name-style="western"><surname>Berry</surname><given-names>K</given-names> </name></person-group><article-title>The key components of a clinical psychology formulation: a consensus study</article-title><source>Br J Clin Psychol</source><year>2024</year><month>06</month><volume>63</volume><issue>2</issue><fpage>213</fpage><lpage>226</lpage><pub-id pub-id-type="doi">10.1111/bjc.12455</pub-id><pub-id pub-id-type="medline">38235902</pub-id></nlm-citation></ref><ref id="ref3"><label>3</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Easden</surname><given-names>MH</given-names> </name><name name-style="western"><surname>Kazantzis</surname><given-names>N</given-names> </name></person-group><article-title>Case conceptualization research in cognitive behavior therapy: a state of the science review</article-title><source>J Clin Psychol</source><year>2018</year><month>03</month><volume>74</volume><issue>3</issue><fpage>356</fpage><lpage>384</lpage><pub-id pub-id-type="doi">10.1002/jclp.22516</pub-id><pub-id pub-id-type="medline">28776663</pub-id></nlm-citation></ref><ref id="ref4"><label>4</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lundkvist-Houndoumadi</surname><given-names>I</given-names> </name><name name-style="western"><surname>Thastum</surname><given-names>M</given-names> </name><name name-style="western"><surname>Hougaard</surname><given-names>E</given-names> </name></person-group><article-title>Effectiveness of an individualized case formulation&#x2013;based CBT for non-responding youths with anxiety disorders</article-title><source>J Child Fam Stud</source><year>2016</year><month>02</month><volume>25</volume><issue>2</issue><fpage>503</fpage><lpage>517</lpage><pub-id pub-id-type="doi">10.1007/s10826-015-0225-4</pub-id></nlm-citation></ref><ref id="ref5"><label>5</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kendjelic</surname><given-names>EM</given-names> </name><name name-style="western"><surname>Eells</surname><given-names>TD</given-names> </name></person-group><article-title>Generic psychotherapy case formulation training improves formulation quality</article-title><source>Psychotherapy (Chic)</source><year>2007</year><volume>44</volume><issue>1</issue><fpage>66</fpage><lpage>77</lpage><pub-id pub-id-type="doi">10.1037/0033-3204.44.1.66</pub-id><pub-id pub-id-type="medline">22122169</pub-id></nlm-citation></ref><ref id="ref6"><label>6</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Dudley</surname><given-names>R</given-names> </name><name name-style="western"><surname>Ingham</surname><given-names>B</given-names> </name><name name-style="western"><surname>Sowerby</surname><given-names>K</given-names> </name><name name-style="western"><surname>Freeston</surname><given-names>M</given-names> </name></person-group><article-title>The utility of case formulation in treatment decision making; the effect of experience and expertise</article-title><source>J Behav Ther Exp Psychiatry</source><year>2015</year><month>09</month><volume>48</volume><fpage>66</fpage><lpage>74</lpage><pub-id pub-id-type="doi">10.1016/j.jbtep.2015.01.009</pub-id><pub-id pub-id-type="medline">25748793</pub-id></nlm-citation></ref><ref id="ref7"><label>7</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Mohtashemi</surname><given-names>R</given-names> </name><name name-style="western"><surname>Stevens</surname><given-names>J</given-names> </name><name name-style="western"><surname>Jackson</surname><given-names>PG</given-names> </name><name name-style="western"><surname>Weatherhead</surname><given-names>S</given-names> </name></person-group><article-title>Psychiatrists&#x2019; understanding and use of psychological formulation: a qualitative exploration</article-title><source>BJPsych Bull</source><year>2016</year><month>08</month><volume>40</volume><issue>4</issue><fpage>212</fpage><lpage>216</lpage><pub-id pub-id-type="doi">10.1192/pb.bp.115.051342</pub-id><pub-id pub-id-type="medline">27512592</pub-id></nlm-citation></ref><ref id="ref8"><label>8</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Abbas</surname><given-names>MJ</given-names> </name><name name-style="western"><surname>Fosker</surname><given-names>H</given-names> </name><name name-style="western"><surname>Dudson</surname><given-names>H</given-names> </name><name name-style="western"><surname>Ramewal</surname><given-names>S</given-names> </name></person-group><article-title>A comparison of the quality of integrated case formulations produced by UK psychiatric trainees and an artificial intelligence-assisted application</article-title><source>BJPsych Bull</source><year>2025</year><month>10</month><day>13</day><fpage>1</fpage><lpage>6</lpage><pub-id pub-id-type="doi">10.1192/bjb.2025.10160</pub-id><pub-id pub-id-type="medline">41077965</pub-id></nlm-citation></ref><ref id="ref9"><label>9</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Gao</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Li</surname><given-names>R</given-names> </name><name name-style="western"><surname>Croxford</surname><given-names>E</given-names> </name><etal/></person-group><article-title>Leveraging medical knowledge graphs into large language models for diagnosis prediction: design and application study</article-title><source>JMIR AI</source><year>2025</year><month>02</month><day>24</day><volume>4</volume><fpage>e58670</fpage><pub-id pub-id-type="doi">10.2196/58670</pub-id><pub-id pub-id-type="medline">39993309</pub-id></nlm-citation></ref><ref id="ref10"><label>10</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Jia</surname><given-names>M</given-names> </name><name name-style="western"><surname>Duan</surname><given-names>J</given-names> </name><name name-style="western"><surname>Song</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Wang</surname><given-names>J</given-names> </name></person-group><article-title>MedIKAL: integrating knowledge graphs as assistants of llms for enhanced clinical diagnosis on EMRS</article-title><source>Proceedings of the 31st International Conference on Computational Linguistics</source><year>2025</year><access-date>2026-03-17</access-date><fpage>9278</fpage><lpage>9298</lpage><comment><ext-link ext-link-type="uri" xlink:href="https://aclanthology.org/2025.coling-main.624.pdf">https://aclanthology.org/2025.coling-main.624.pdf</ext-link></comment></nlm-citation></ref><ref id="ref11"><label>11</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Abbas</surname><given-names>M</given-names> </name><name name-style="western"><surname>Walton</surname><given-names>R</given-names> </name><name name-style="western"><surname>Johnston</surname><given-names>A</given-names> </name><name name-style="western"><surname>Chikoore</surname><given-names>M</given-names> </name></person-group><article-title>Evaluation of teaching an integrated case formulation approach on the quality of case formulations: randomised controlled trial</article-title><source>Psychiatrist</source><year>2012</year><month>04</month><volume>36</volume><issue>4</issue><fpage>140</fpage><lpage>145</lpage><pub-id pub-id-type="doi">10.1192/pb.bp.110.033746</pub-id></nlm-citation></ref><ref id="ref12"><label>12</label><nlm-citation citation-type="book"><person-group person-group-type="author"><name name-style="western"><surname>Eells</surname><given-names>TD</given-names> </name><name name-style="western"><surname>Lombart</surname><given-names>KG</given-names> </name></person-group><article-title>Theoretical and evidence-based approaches to case formulation</article-title><source>Forensic Case Formulation</source><year>2011</year><publisher-name>John Wiley &#x0026; Sons, Ltd</publisher-name><fpage>1</fpage><lpage>32</lpage><pub-id pub-id-type="other">9781119977018</pub-id></nlm-citation></ref><ref id="ref13"><label>13</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Pachankis</surname><given-names>JE</given-names> </name><name name-style="western"><surname>Soulliard</surname><given-names>ZA</given-names> </name><name name-style="western"><surname>Morris</surname><given-names>F</given-names> </name><name name-style="western"><surname>Seager van Dyk</surname><given-names>I</given-names> </name></person-group><article-title>A model for adapting evidence-based interventions to be LGBQ-affirmative: putting minority stress principles and case conceptualization into clinical research and practice</article-title><source>Cogn Behav Pract</source><year>2023</year><month>02</month><volume>30</volume><issue>1</issue><fpage>1</fpage><lpage>17</lpage><pub-id pub-id-type="doi">10.1016/j.cbpra.2021.11.005</pub-id></nlm-citation></ref><ref id="ref14"><label>14</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Huisman</surname><given-names>P</given-names> </name><name name-style="western"><surname>Kangas</surname><given-names>M</given-names> </name></person-group><article-title>Evidence-based practices in cognitive behaviour therapy (CBT) case formulation: what do practitioners believe is important, and what do they do?</article-title><source>Behav change</source><year>2018</year><month>04</month><volume>35</volume><issue>1</issue><fpage>1</fpage><lpage>21</lpage><pub-id pub-id-type="doi">10.1017/bec.2018.5</pub-id></nlm-citation></ref><ref id="ref15"><label>15</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Christon</surname><given-names>LM</given-names> </name><name name-style="western"><surname>McLeod</surname><given-names>BD</given-names> </name><name name-style="western"><surname>Jensen-Doss</surname><given-names>A</given-names> </name></person-group><article-title>Evidence-based assessment meets evidence-based treatment: an approach to science-informed case conceptualization</article-title><source>Cogn Behav Pract</source><year>2015</year><month>02</month><volume>22</volume><issue>1</issue><fpage>36</fpage><lpage>48</lpage><pub-id pub-id-type="doi">10.1016/j.cbpra.2013.12.004</pub-id></nlm-citation></ref><ref id="ref16"><label>16</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Alam</surname><given-names>F</given-names> </name><name name-style="western"><surname>Giglou</surname><given-names>HB</given-names> </name><name name-style="western"><surname>Malik</surname><given-names>KM</given-names> </name></person-group><article-title>Automated clinical knowledge graph generation framework for evidence based medicine</article-title><source>Expert Syst Appl</source><year>2023</year><month>12</month><volume>233</volume><fpage>120964</fpage><pub-id pub-id-type="doi">10.1016/j.eswa.2023.120964</pub-id></nlm-citation></ref><ref id="ref17"><label>17</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Chen</surname><given-names>Z</given-names> </name><name name-style="western"><surname>Peng</surname><given-names>B</given-names> </name><name name-style="western"><surname>Ioannidis</surname><given-names>VN</given-names> </name><name name-style="western"><surname>Li</surname><given-names>M</given-names> </name><name name-style="western"><surname>Karypis</surname><given-names>G</given-names> </name><name name-style="western"><surname>Ning</surname><given-names>X</given-names> </name></person-group><article-title>A knowledge graph of clinical trials ([formula: see text])</article-title><source>Sci Rep</source><year>2022</year><month>03</month><day>18</day><volume>12</volume><issue>1</issue><fpage>4724</fpage><pub-id pub-id-type="doi">10.1038/s41598-022-08454-z</pub-id><pub-id pub-id-type="medline">35304504</pub-id></nlm-citation></ref><ref id="ref18"><label>18</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Rotmensch</surname><given-names>M</given-names> </name><name name-style="western"><surname>Halpern</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Tlimat</surname><given-names>A</given-names> </name><name name-style="western"><surname>Horng</surname><given-names>S</given-names> </name><name name-style="western"><surname>Sontag</surname><given-names>D</given-names> </name></person-group><article-title>Learning a health knowledge graph from electronic medical records</article-title><source>Sci Rep</source><year>2017</year><month>07</month><day>20</day><volume>7</volume><issue>1</issue><fpage>5994</fpage><pub-id pub-id-type="doi">10.1038/s41598-017-05778-z</pub-id><pub-id pub-id-type="medline">28729710</pub-id></nlm-citation></ref><ref id="ref19"><label>19</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lyu</surname><given-names>K</given-names> </name><name name-style="western"><surname>Tian</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Shang</surname><given-names>Y</given-names> </name><etal/></person-group><article-title>Causal knowledge graph construction and evaluation for clinical decision support of diabetic nephropathy</article-title><source>J Biomed Inform</source><year>2023</year><month>03</month><volume>139</volume><fpage>104298</fpage><pub-id pub-id-type="doi">10.1016/j.jbi.2023.104298</pub-id><pub-id pub-id-type="medline">36731730</pub-id></nlm-citation></ref><ref id="ref20"><label>20</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Macneil</surname><given-names>CA</given-names> </name><name name-style="western"><surname>Hasty</surname><given-names>MK</given-names> </name><name name-style="western"><surname>Conus</surname><given-names>P</given-names> </name><name name-style="western"><surname>Berk</surname><given-names>M</given-names> </name></person-group><article-title>Is diagnosis enough to guide interventions in mental health? Using case formulation in clinical practice</article-title><source>BMC Med</source><year>2012</year><month>09</month><day>27</day><volume>10</volume><fpage>111</fpage><pub-id pub-id-type="doi">10.1186/1741-7015-10-111</pub-id><pub-id pub-id-type="medline">23016556</pub-id></nlm-citation></ref><ref id="ref21"><label>21</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>van den Bergh</surname><given-names>R</given-names> </name><name name-style="western"><surname>Olthof</surname><given-names>M</given-names> </name><name name-style="western"><surname>Goldbeck</surname><given-names>F</given-names> </name><etal/></person-group><article-title>The content of personalised network&#x2013;based case formulations</article-title><source>J Contemp Psychother</source><year>2024</year><month>09</month><volume>54</volume><issue>3</issue><fpage>181</fpage><lpage>192</lpage><pub-id pub-id-type="doi">10.1007/s10879-023-09613-7</pub-id></nlm-citation></ref><ref id="ref22"><label>22</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Spencer</surname><given-names>HM</given-names> </name><name name-style="western"><surname>Dudley</surname><given-names>R</given-names> </name><name name-style="western"><surname>Johnston</surname><given-names>L</given-names> </name><name name-style="western"><surname>Freeston</surname><given-names>MH</given-names> </name><name name-style="western"><surname>Turkington</surname><given-names>D</given-names> </name><name name-style="western"><surname>Tully</surname><given-names>S</given-names> </name></person-group><article-title>Case formulation-a vehicle for change? Exploring the impact of cognitive behavioural therapy formulation in first episode psychosis: a reflexive thematic analysis</article-title><source>Psychol Psychother</source><year>2023</year><month>06</month><volume>96</volume><issue>2</issue><fpage>328</fpage><lpage>346</lpage><pub-id pub-id-type="doi">10.1111/papt.12442</pub-id><pub-id pub-id-type="medline">36480353</pub-id></nlm-citation></ref><ref id="ref23"><label>23</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Flinn</surname><given-names>L</given-names> </name><name name-style="western"><surname>Braham</surname><given-names>L</given-names> </name><name name-style="western"><surname>das Nair</surname><given-names>R</given-names> </name></person-group><article-title>How reliable are case formulations? A systematic literature review</article-title><source>Br J Clin Psychol</source><year>2015</year><month>09</month><volume>54</volume><issue>3</issue><fpage>266</fpage><lpage>290</lpage><pub-id pub-id-type="doi">10.1111/bjc.12073</pub-id><pub-id pub-id-type="medline">25515566</pub-id></nlm-citation></ref><ref id="ref24"><label>24</label><nlm-citation citation-type="book"><person-group person-group-type="author"><name name-style="western"><surname>Yokotani</surname><given-names>K</given-names> </name></person-group><source>Illustrated Case-Based Family Therapy: Systems and Narrativist Case Formulation and Intervention [Book in Japanese]</source><year>2022</year><publisher-name>Tomishobo</publisher-name><pub-id pub-id-type="other">978-4-86616-155-6</pub-id></nlm-citation></ref><ref id="ref25"><label>25</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Takano</surname><given-names>M</given-names> </name><name name-style="western"><surname>Taka</surname><given-names>F</given-names> </name><name name-style="western"><surname>Ogiue</surname><given-names>C</given-names> </name><name name-style="western"><surname>Nagata</surname><given-names>N</given-names> </name></person-group><article-title>Online harassment of Japanese celebrities and influencers</article-title><source>Front Psychol</source><year>2024</year><volume>15</volume><fpage>1386146</fpage><pub-id pub-id-type="doi">10.3389/fpsyg.2024.1386146</pub-id><pub-id pub-id-type="medline">38686089</pub-id></nlm-citation></ref><ref id="ref26"><label>26</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Fricke</surname><given-names>S</given-names> </name></person-group><article-title>Semantic Scholar</article-title><source>J Med Libr Assoc</source><year>2018</year><month>01</month><volume>106</volume><issue>1</issue><fpage>145</fpage><lpage>147</lpage><pub-id pub-id-type="doi">10.5195/jmla.2018.280</pub-id></nlm-citation></ref><ref id="ref27"><label>27</label><nlm-citation citation-type="web"><article-title>Models overview</article-title><source>Claude APIDocs</source><year>2021</year><access-date>2025-04-17</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://docs.anthropic.com/en/docs/about-claude/models/all-models">https://docs.anthropic.com/en/docs/about-claude/models/all-models</ext-link></comment></nlm-citation></ref><ref id="ref28"><label>28</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kurokawa</surname><given-names>R</given-names> </name><name name-style="western"><surname>Ohizumi</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Kanzawa</surname><given-names>J</given-names> </name><etal/></person-group><article-title>Diagnostic performances of Claude 3 Opus and Claude 3.5 Sonnet from patient history and key images in Radiology&#x2019;s &#x201C;Diagnosis Please&#x201D; cases</article-title><source>Jpn J Radiol</source><year>2024</year><month>12</month><volume>42</volume><issue>12</issue><fpage>1399</fpage><lpage>1402</lpage><pub-id pub-id-type="doi">10.1007/s11604-024-01634-z</pub-id><pub-id pub-id-type="medline">39096483</pub-id></nlm-citation></ref><ref id="ref29"><label>29</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>Feng</surname><given-names>J</given-names> </name><name name-style="western"><surname>Zheng</surname><given-names>Q</given-names> </name><name name-style="western"><surname>Wu</surname><given-names>C</given-names> </name><etal/></person-group><article-title>M^3Builder: a multi-agent system for automated machine learning in medical imaging</article-title><access-date>2026-03-17</access-date><conf-name>AI for Clinical Applications Agentic AI CMLLMs CREATE 2025 2025 2025</conf-name><conf-date>Sep 23-27, 2025</conf-date><comment><ext-link ext-link-type="uri" xlink:href="https://link.springer.com/chapter/10.1007/978-3-032-06004-4_12#citeas">https://link.springer.com/chapter/10.1007/978-3-032-06004-4_12#citeas</ext-link></comment><pub-id pub-id-type="doi">10.1007/978-3-032-06004-4_12</pub-id></nlm-citation></ref><ref id="ref30"><label>30</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Gao</surname><given-names>S</given-names> </name><name name-style="western"><surname>Yu</surname><given-names>K</given-names> </name><name name-style="western"><surname>Yang</surname><given-names>Y</given-names> </name><etal/></person-group><article-title>Large language model powered knowledge graph construction for mental health exploration</article-title><source>Nat Commun</source><year>2025</year><month>08</month><day>13</day><volume>16</volume><issue>1</issue><fpage>7526</fpage><pub-id pub-id-type="doi">10.1038/s41467-025-62781-z</pub-id></nlm-citation></ref><ref id="ref31"><label>31</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>Lui</surname><given-names>SJ</given-names> </name><name name-style="western"><surname>Xiang</surname><given-names>C</given-names> </name><name name-style="western"><surname>Krishnaswamy</surname><given-names>S</given-names> </name></person-group><article-title>KAMEL: knowledge aware medical entity linkage to automate health insurance claims processing</article-title><conf-name>AAAI&#x2019;24/IAAI&#x2019;24/EAAI&#x2019;24: Proceedings of the Thirty-Eighth AAAI Conference on Artificial Intelligence and Thirty-Sixth Conference on Innovative Applications of Artificial Intelligence and Fourteenth Symposium on Educational Advances in Artificial Intelligence</conf-name><conf-date>Feb 20-27, 2024</conf-date><pub-id pub-id-type="doi">10.1609/aaai.v38i21.30314</pub-id></nlm-citation></ref><ref id="ref32"><label>32</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>Uchiyama</surname><given-names>A</given-names> </name><name name-style="western"><surname>Wakashima</surname><given-names>K</given-names> </name><name name-style="western"><surname>Koiwa</surname><given-names>K</given-names> </name><name name-style="western"><surname>Nagano</surname><given-names>K</given-names> </name><name name-style="western"><surname>Kakei</surname><given-names>K</given-names> </name></person-group><article-title>Learning brief therapy and family therapy&#x2014;case formulation in brief therapy and family therapy [article in Japanese]</article-title><conf-name>43rd Annual Conference of the Japanese Association of Clinical Psychology</conf-name><conf-date>Oct 6, 2024</conf-date></nlm-citation></ref><ref id="ref33"><label>33</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Jikihara</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Nozawa</surname><given-names>S</given-names> </name><name name-style="western"><surname>Ando</surname><given-names>S</given-names> </name><name name-style="western"><surname>Higginbotham</surname><given-names>BJ</given-names> </name><name name-style="western"><surname>Schramm</surname><given-names>DG</given-names> </name><name name-style="western"><surname>Adler-Baeder</surname><given-names>F</given-names> </name></person-group><article-title>Exploring the factor structure and concurrent validity of two stepfamily measures for Japanese couples</article-title><source>J Divorce Remarriage</source><year>2023</year><month>05</month><day>19</day><volume>64</volume><issue>2-4</issue><fpage>156</fpage><lpage>172</lpage><pub-id pub-id-type="doi">10.1080/10502556.2023.2242751</pub-id></nlm-citation></ref><ref id="ref34"><label>34</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Moran</surname><given-names>G</given-names> </name><name name-style="western"><surname>Diamond</surname><given-names>GM</given-names> </name><name name-style="western"><surname>Diamond</surname><given-names>GS</given-names> </name></person-group><article-title>The relational reframe and parents&#x2019; problem constructions in attachment-based family therapy</article-title><source>Psychother Res</source><year>2005</year><month>07</month><volume>15</volume><issue>3</issue><fpage>226</fpage><lpage>235</lpage><pub-id pub-id-type="doi">10.1080/10503300512331387780</pub-id><pub-id pub-id-type="medline">22011152</pub-id></nlm-citation></ref><ref id="ref35"><label>35</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Munroe</surname><given-names>M</given-names> </name><name name-style="western"><surname>Al-Refae</surname><given-names>M</given-names> </name><name name-style="western"><surname>Chan</surname><given-names>HW</given-names> </name><name name-style="western"><surname>Ferrari</surname><given-names>M</given-names> </name></person-group><article-title>Using self-compassion to grow in the face of trauma: the role of positive reframing and problem-focused coping strategies</article-title><source>Psychol Trauma</source><year>2022</year><month>04</month><volume>14</volume><issue>S1</issue><fpage>S157</fpage><lpage>S164</lpage><pub-id pub-id-type="doi">10.1037/tra0001164</pub-id><pub-id pub-id-type="medline">34735189</pub-id></nlm-citation></ref><ref id="ref36"><label>36</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lyddon</surname><given-names>WJ</given-names> </name><name name-style="western"><surname>Clay</surname><given-names>AL</given-names> </name><name name-style="western"><surname>Sparks</surname><given-names>CL</given-names> </name></person-group><article-title>Metaphor and change in counseling</article-title><source>Jour of Counseling &#x0026; Develop</source><year>2001</year><month>07</month><volume>79</volume><issue>3</issue><fpage>269</fpage><lpage>274</lpage><pub-id pub-id-type="doi">10.1002/j.1556-6676.2001.tb01971.x</pub-id></nlm-citation></ref><ref id="ref37"><label>37</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Sorin</surname><given-names>V</given-names> </name><name name-style="western"><surname>Brin</surname><given-names>D</given-names> </name><name name-style="western"><surname>Barash</surname><given-names>Y</given-names> </name><etal/></person-group><article-title>Large Language Models and empathy: systematic review</article-title><source>J Med Internet Res</source><year>2024</year><month>12</month><day>11</day><volume>26</volume><fpage>e52597</fpage><pub-id pub-id-type="doi">10.2196/52597</pub-id><pub-id pub-id-type="medline">39661968</pub-id></nlm-citation></ref><ref id="ref38"><label>38</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Yokotani</surname><given-names>K</given-names> </name><name name-style="western"><surname>Takagi</surname><given-names>G</given-names> </name><name name-style="western"><surname>Wakashima</surname><given-names>K</given-names> </name></person-group><article-title>Advantages of virtual agents over clinical psychologists during comprehensive mental health interviews using a mixed methods design</article-title><source>Comput Human Behav</source><year>2018</year><month>08</month><volume>85</volume><fpage>135</fpage><lpage>145</lpage><pub-id pub-id-type="doi">10.1016/j.chb.2018.03.045</pub-id></nlm-citation></ref><ref id="ref39"><label>39</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Liese</surname><given-names>BS</given-names> </name><name name-style="western"><surname>Esterline</surname><given-names>KM</given-names> </name></person-group><article-title>Concept mapping: a supervision strategy for introducing case conceptualization skills to novice therapists</article-title><source>Psychotherapy (Chic)</source><year>2015</year><month>06</month><volume>52</volume><issue>2</issue><fpage>190</fpage><lpage>194</lpage><pub-id pub-id-type="doi">10.1037/a0038618</pub-id><pub-id pub-id-type="medline">25730627</pub-id></nlm-citation></ref><ref id="ref40"><label>40</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Thuillard</surname><given-names>S</given-names> </name><name name-style="western"><surname>Adams</surname><given-names>M</given-names> </name><name name-style="western"><surname>Jelmini</surname><given-names>G</given-names> </name><name name-style="western"><surname>Schmutz</surname><given-names>S</given-names> </name><name name-style="western"><surname>Sonderegger</surname><given-names>A</given-names> </name><name name-style="western"><surname>Sauer</surname><given-names>J</given-names> </name></person-group><article-title>When humans and computers induce social stress through negative feedback: effects on performance and subjective state</article-title><source>Comput Human Behav</source><year>2022</year><month>08</month><volume>133</volume><fpage>107270</fpage><pub-id pub-id-type="doi">10.1016/j.chb.2022.107270</pub-id></nlm-citation></ref><ref id="ref41"><label>41</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Payton</surname><given-names>EM</given-names> </name><name name-style="western"><surname>Graber</surname><given-names>ML</given-names> </name><name name-style="western"><surname>Bachiashvili</surname><given-names>V</given-names> </name><name name-style="western"><surname>Mehta</surname><given-names>T</given-names> </name><name name-style="western"><surname>Dissanayake</surname><given-names>PI</given-names> </name><name name-style="western"><surname>Berner</surname><given-names>ES</given-names> </name></person-group><article-title>Impact of clinical note format on diagnostic accuracy and efficiency</article-title><source>Health Inf Manag J</source><year>2024</year><month>09</month><volume>53</volume><issue>3</issue><fpage>183</fpage><lpage>188</lpage><pub-id pub-id-type="doi">10.1177/18333583231151979</pub-id></nlm-citation></ref><ref id="ref42"><label>42</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Sarma</surname><given-names>KV</given-names> </name><name name-style="western"><surname>Hanss</surname><given-names>KE</given-names> </name><name name-style="western"><surname>Halls</surname><given-names>AJM</given-names> </name><etal/></person-group><article-title>Integrating expert knowledge into large language models improves performance for psychiatric reasoning and diagnosis</article-title><source>Psychiatry Res</source><year>2026</year><month>01</month><volume>355</volume><fpage>116844</fpage><pub-id pub-id-type="doi">10.1016/j.psychres.2025.116844</pub-id><pub-id pub-id-type="medline">41270691</pub-id></nlm-citation></ref><ref id="ref43"><label>43</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Braun</surname><given-names>V</given-names> </name><name name-style="western"><surname>Clarke</surname><given-names>V</given-names> </name></person-group><article-title>Using thematic analysis in psychology</article-title><source>Qual Res Psychol</source><year>2006</year><month>01</month><volume>3</volume><issue>2</issue><fpage>77</fpage><lpage>101</lpage><pub-id pub-id-type="doi">10.1191/1478088706qp063oa</pub-id></nlm-citation></ref><ref id="ref44"><label>44</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Suchikova</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Tsybuliak</surname><given-names>N</given-names> </name><name name-style="western"><surname>Teixeira da Silva</surname><given-names>JA</given-names> </name><name name-style="western"><surname>Nazarovets</surname><given-names>S</given-names> </name></person-group><article-title>GAIDeT (Generative AI Delegation Taxonomy): a taxonomy for humans to delegate tasks to generative artificial intelligence in scientific research and publishing</article-title><source>Account Res</source><year>2026</year><month>04</month><volume>33</volume><issue>3</issue><fpage>2544331</fpage><pub-id pub-id-type="doi">10.1080/08989621.2025.2544331</pub-id><pub-id pub-id-type="medline">40781729</pub-id></nlm-citation></ref></ref-list><app-group><supplementary-material id="app1"><label>Multimedia Appendix 1</label><p>Knowledge graphs.</p><media xlink:href="formative_v10i1e76808_app1.docx" xlink:title="DOCX File, 30 KB"/></supplementary-material></app-group></back></article>