<?xml version="1.0" encoding="UTF-8"?><!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "journalpublishing.dtd"><article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" dtd-version="2.0" xml:lang="en" article-type="research-article"><front><journal-meta><journal-id journal-id-type="nlm-ta">JMIR Ment Health</journal-id><journal-id journal-id-type="publisher-id">mental</journal-id><journal-id journal-id-type="index">16</journal-id><journal-title>JMIR Mental Health</journal-title><abbrev-journal-title>JMIR Ment Health</abbrev-journal-title><issn pub-type="epub">2368-7959</issn><publisher><publisher-name>JMIR Publications</publisher-name><publisher-loc>Toronto, Canada</publisher-loc></publisher></journal-meta><article-meta><article-id pub-id-type="publisher-id">v13i1e82642</article-id><article-id pub-id-type="doi">10.2196/82642</article-id><article-categories><subj-group subj-group-type="heading"><subject>Original Paper</subject></subj-group></article-categories><title-group><article-title>Effectiveness of a Fully Automated Mobile Therapeutic Versus a General Chatbot in Reducing Depression and Anxiety and Improving Well-Being: Feasibility Randomized Controlled Trial</article-title></title-group><contrib-group><contrib contrib-type="author" corresp="yes"><name name-style="western"><surname>Kuta</surname><given-names>Barbora</given-names></name><degrees>MA</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Novak</surname><given-names>Lukas</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Zidkova</surname><given-names>Radka</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name 
name-style="western"><surname>Furstova</surname><given-names>Jana</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Malinakova</surname><given-names>Klara</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>De Winter</surname><given-names>Andrea</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff2">2</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Husek</surname><given-names>V&#x00ED;t</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib></contrib-group><aff id="aff1"><institution>Palack&#x00FD; University Olomouc</institution><addr-line>K&#x0159;&#x00ED;&#x017E;kovsk&#x00E9;ho 511/8</addr-line><addr-line>Olomouc</addr-line><country>Czech Republic</country></aff><aff id="aff2"><institution>Faculty of Medical Sciences, University Medical Center Groningen</institution><addr-line>Groningen</addr-line><country>The Netherlands</country></aff><contrib-group><contrib contrib-type="editor"><name name-style="western"><surname>Torous</surname><given-names>John</given-names></name></contrib></contrib-group><contrib-group><contrib contrib-type="reviewer"><name name-style="western"><surname>Jabir</surname><given-names>Ahmad</given-names></name></contrib><contrib contrib-type="reviewer"><name name-style="western"><surname>Suda</surname><given-names>Akira</given-names></name></contrib><contrib contrib-type="reviewer"><name name-style="western"><surname>Fylaktou</surname><given-names>Fylaktis</given-names></name></contrib><contrib contrib-type="reviewer"><name name-style="western"><surname>Leever</surname><given-names>William</given-names></name></contrib></contrib-group><author-notes><corresp>Correspondence to Barbora Kuta, MA, Palack&#x00FD; University Olomouc, 
K&#x0159;&#x00ED;&#x017E;kovsk&#x00E9;ho 511/8, Olomouc, 779 00, Czech Republic, 420 773981876; <email>barbora.kuta@oushi.upol.cz</email></corresp></author-notes><pub-date pub-type="collection"><year>2026</year></pub-date><pub-date pub-type="epub"><day>22</day><month>4</month><year>2026</year></pub-date><volume>13</volume><elocation-id>e82642</elocation-id><history><date date-type="received"><day>27</day><month>08</month><year>2025</year></date><date date-type="rev-recd"><day>16</day><month>12</month><year>2025</year></date><date date-type="accepted"><day>25</day><month>12</month><year>2025</year></date></history><copyright-statement>&#x00A9; Barbora Kuta, Lukas Novak, Radka Zidkova, Jana Furstova, Klara Malinakova, Andrea De Winter, V&#x00ED;t Husek. Originally published in JMIR Mental Health (<ext-link ext-link-type="uri" xlink:href="https://mental.jmir.org">https://mental.jmir.org</ext-link>), 22.4.2026. </copyright-statement><copyright-year>2026</copyright-year><license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (<ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">https://creativecommons.org/licenses/by/4.0/</ext-link>), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Mental Health, is properly cited. 
The complete bibliographic information, a link to the original publication on <ext-link ext-link-type="uri" xlink:href="https://mental.jmir.org/">https://mental.jmir.org/</ext-link>, as well as this copyright and license information must be included.</p></license><self-uri xlink:type="simple" xlink:href="https://mental.jmir.org/2026/1/e82642"/><abstract><sec><title>Background</title><p>Given the increasing prevalence of depression and anxiety disorders and enduring barriers to care, there is a critical need for alternative treatment options. Generative artificial intelligence (AI) chatbots show promise for increasing access to mental health care, though more direct research is needed to establish their efficacy.</p></sec><sec><title>Objective</title><p>This pilot study aimed to test the efficacy of a generative mental health chatbot rooted in solution-focused therapy compared to the general-purpose ChatGPT and an assessment-only control (AOC) group on depression, anxiety, and well-being.</p></sec><sec sec-type="methods"><title>Methods</title><p>A total of 185 English-speaking adults were recruited online and randomly assigned to one of three groups: AI therapy, ChatGPT, or AOC. Of these, 147 eligible participants filled out a pretreatment assessment. Over a 3-week period, the AI therapy group (n=44) was instructed to complete 3 structured, fully automated app-based sessions per week (9 total), while the ChatGPT group (n=60) was instructed to engage in 9 unstructured conversations with ChatGPT (GPT-4o&#x2013;based models). The control group (n=43) received no intervention. In the AI therapy group, 39% (n=17) completed all sessions, as did 62% (n=38) of those in the ChatGPT group. 
Primary outcome measures, self-assessed online at baseline and postintervention, included the Patient Health Questionnaire-9 (PHQ-9), Overall Depression Severity and Impairment Scale (ODSIS) (depression), 7-item Generalized Anxiety Disorder Scale (anxiety), and World Health Organization Well-Being Index (5-item version) (well-being). Linear mixed effects models were used for data analysis.</p></sec><sec sec-type="results"><title>Results</title><p>Compared to AOC, both the AI therapy group (<italic>d</italic>=&#x2212;0.47; <italic>P</italic>=.01) and the ChatGPT group (<italic>d</italic>=&#x2212;0.44; <italic>P</italic>=.02) demonstrated significant reductions in depression scores measured by PHQ-9. The AI therapy group showed nonsignificant reductions in anxiety (<italic>d</italic>=&#x2212;0.37; <italic>P</italic>=.11) and ODSIS depression scores (<italic>d</italic>=&#x2212;0.25; <italic>P</italic>=.22) and an increase in well-being (<italic>d</italic>=0.12; <italic>P</italic>=.53) compared to AOC. Similarly, a nonsignificant reduction in anxiety (<italic>d</italic>=&#x2212;0.27; <italic>P</italic>=.22) and ODSIS depression scores (<italic>d</italic>=&#x2212;0.12; <italic>P</italic>=.53) and an increase in well-being (<italic>d</italic>=0.20; <italic>P</italic>=.29) were observed in the ChatGPT group compared to AOC. 
The AI therapy group did not significantly outperform the ChatGPT group on any outcomes (PHQ-9: <italic>b</italic>=&#x2212;0.19; <italic>d</italic>=0.03; <italic>P</italic>=.87; 7-item Generalized Anxiety Disorder Scale: <italic>b</italic>=&#x2212;0.57; <italic>d</italic>=&#x2212;0.11; <italic>P</italic>=.62; ODSIS: <italic>b</italic>=&#x2212;0.59; <italic>d</italic>=&#x2212;0.13; <italic>P</italic>=.50; and World Health Organization Well-Being Index (5-item version): <italic>b</italic>=&#x2212;0.38; <italic>d</italic>=&#x2212;0.07; <italic>P</italic>=.69).</p></sec><sec sec-type="conclusions"><title>Conclusions</title><p>Both the structured generative AI chatbot and ChatGPT showed a significant reduction in depression scores compared to the control group. No significant effects were observed across other outcomes, although descriptive trends indicated improvements in anxiety. While the AI therapy group showed descriptively better outcomes for depression and anxiety, differences between groups were not significant. A larger sample and longer intervention may be needed for the emerging trends to yield clinically meaningful effect sizes.</p></sec><sec><title>Trial Registration</title><p>OSF Registries osf.io/r76ef; <ext-link ext-link-type="uri" xlink:href="https://osf.io/r76ef">https://osf.io/r76ef</ext-link></p></sec></abstract><kwd-group><kwd>depression</kwd><kwd>anxiety</kwd><kwd>well-being</kwd><kwd>conversational agents</kwd><kwd>digital intervention</kwd><kwd>randomized controlled trial</kwd><kwd>chatbot</kwd><kwd>solution-focused therapy</kwd></kwd-group></article-meta></front><body><sec id="s1" sec-type="intro"><title>Introduction</title><p>One in every 7 people met the criteria for a mental health disorder in 2021, with approximately 229 million people globally dealing with depression and 359 million with anxiety disorders [<xref ref-type="bibr" rid="ref1">1</xref>]. 
Mental health illnesses have moved from the 9th to the 6th leading cause of disability-adjusted life years from 1990 to 2021 [<xref ref-type="bibr" rid="ref2">2</xref>]. This shift highlights the growing societal burden of mental illness. Alongside the escalating prevalence of mental illness, the treatment gap is widening, with estimates indicating that fewer than 50% of adults with mental illness receive any form of mental health treatment, even in high-income countries [<xref ref-type="bibr" rid="ref3">3</xref>].</p><p>It is estimated that 58% of people with clinical-level mental health issues do not seek any professional help [<xref ref-type="bibr" rid="ref4">4</xref>], as access to care remains a salient barrier. Due to the lack of treatment services, only 23% of people affected by depression receive minimally adequate treatment according to current research standards in high-income countries, and even fewer (8%) receive such treatment in low and lower-middle-income countries [<xref ref-type="bibr" rid="ref5">5</xref>]. Additionally, the waiting times for mental health services are prohibitive, averaging longer than 3 months [<xref ref-type="bibr" rid="ref6">6</xref>,<xref ref-type="bibr" rid="ref7">7</xref>]. Another barrier is financial affordability, though its impact has slightly decreased in recent years [<xref ref-type="bibr" rid="ref8">8</xref>]. Moreover, in addition to these systemic factors, individual factors may also explain reticence to seek care. People affected by mental illness report a low perceived need for treatment, a desire to handle problems independently [<xref ref-type="bibr" rid="ref9">9</xref>,<xref ref-type="bibr" rid="ref10">10</xref>], or feeling too busy to pursue treatment [<xref ref-type="bibr" rid="ref8">8</xref>]. 
In light of these findings, it is critical to establish treatment options that are affordable, easily accessible, and, if possible, short-term and effective.</p><p>Digital mental health interventions (DMHIs) are promising supplements and/or alternatives to traditional treatment that can enhance mental health care accessibility [<xref ref-type="bibr" rid="ref11">11</xref>]. Digital modalities are gaining traction, including online psychotherapy and programs powered by virtual reality [<xref ref-type="bibr" rid="ref12">12</xref>]. Anonymity is a key advantage of DMHIs; people who believe they are talking to a computer, rather than a human operator, are more willing to disclose or express sadness and have less fear of being evaluated [<xref ref-type="bibr" rid="ref13">13</xref>]. Accordingly, DMHIs have growing support for treating mental health challenges, including depression [<xref ref-type="bibr" rid="ref14">14</xref>] and anxiety [<xref ref-type="bibr" rid="ref15">15</xref>]. Moreover, when combined with traditional therapy, mental health apps that support patients between sessions can improve the effectiveness of usual treatment for both depressive and anxiety disorders [<xref ref-type="bibr" rid="ref16">16</xref>].</p><p>With the rise of artificial intelligence (AI), particularly through the development of large language models, new possibilities have emerged to mediate the primary psychotherapeutic tool, conversation. Conversational agents (CAs), or chatbots, represent a promising, accessible, and affordable mental health tool that could automate some therapeutic procedures when the demand for professionals exceeds available capacity [<xref ref-type="bibr" rid="ref17">17</xref>]. 
This leverages one of the primary benefits of DMHIs, which is the personalization of treatment, especially using machine learning [<xref ref-type="bibr" rid="ref18">18</xref>], potentially leading to greater positive outcomes and lower dropout rates [<xref ref-type="bibr" rid="ref11">11</xref>,<xref ref-type="bibr" rid="ref19">19</xref>]. AI has reached a point where it is challenging to differentiate real conversations from those with CAs. When therapists were asked to distinguish between transcripts of interactions with human therapists and those with AI chatbots, they were correct only 53.9% of the time, performing no better than random guessing [<xref ref-type="bibr" rid="ref20">20</xref>].</p><p>As early as 2019, at least 41 mental health chatbots were on the market, most of them claiming to provide therapy [<xref ref-type="bibr" rid="ref21">21</xref>]. Yet, many of them had not been reviewed by professionals, placing them in a regulatory &#x2018;gray area&#x2019; and raising questions of safety that have been discussed only by a few studies so far [<xref ref-type="bibr" rid="ref22">22</xref>]. It is important to keep in mind that chatbots do carry potential risks; for example, they can &#x201C;hallucinate,&#x201D; have biases in judgment, or lack safety and quality control [<xref ref-type="bibr" rid="ref23">23</xref>]. For professionals to accept and build trust in the new technology, it is crucial to have evidence-based tools [<xref ref-type="bibr" rid="ref17">17</xref>,<xref ref-type="bibr" rid="ref24">24</xref>], but rigorous research in this area has lagged behind AI&#x2019;s rapid development. The advancement of generative artificial intelligence (GenAI) in the 2020s has significantly bolstered the capabilities of mental health CAs [<xref ref-type="bibr" rid="ref25">25</xref>]. 
Although meta-analyses comparing randomized controlled trials (RCTs) on the effectiveness of CAs already exist, they include studies of different types of chatbots in terms of function (retrieval-based, rule-based, and generative) [<xref ref-type="bibr" rid="ref26">26</xref>-<xref ref-type="bibr" rid="ref29">29</xref>]. A systematic review and meta-analysis from 2024 showed a significant effect of CAs on depression but did not discuss the type of chatbot or AI model [<xref ref-type="bibr" rid="ref26">26</xref>]. Another review and meta-analysis from 2023 showed similar positive results, but the majority of included studies examined retrieval-based CAs [<xref ref-type="bibr" rid="ref27">27</xref>]. Even the most recent meta-analysis from 2025 on young people included only 3 studies examining GenAI CAs [<xref ref-type="bibr" rid="ref29">29</xref>]. Therefore, as there are still only a few studies exploring the effect of GenAI chatbots on mental health, more evidence is needed to examine their effectiveness.</p><p>GenAI chatbots could help fill the treatment gap by supporting individuals who are waiting for therapy, who cannot afford therapy, and those at low or medium acuity levels who do not need intensive treatment or would not otherwise engage in therapy. The present study entails an early-stage pilot trial testing the merits of a GenAI therapy chatbot. As described below, the AI therapy chatbot tested in this pilot was trained to deliver solution-focused brief therapy (SFBT), a therapeutic approach selected for its strong fit with chatbot delivery. Specifically, SFBT offers a structured conversational format and emphasizes brief, goal-oriented interactions. In this pilot RCT, the AI therapy chatbot was compared to both an untrained ChatGPT-4o-based chatbot and an assessment-only control (AOC) group. 
In line with preregistered hypotheses, we aimed to obtain preliminary estimates of potential changes, assuming that AI therapy would improve well-being, anxiety symptoms, depression symptoms, and functional impairment due to depressive symptoms compared to these 2 groups. Given the nonclinical and nontreatment-seeking sample, the study focused on short-term outcomes, including symptoms of depression and anxiety, as well as well-being indices.</p></sec><sec id="s2" sec-type="methods"><title>Methods</title><sec id="s2-1"><title>Study Design and Participants</title><p>The preregistered study involved a pilot RCT in which participants were randomly assigned to 1 of 3 groups in a 1:1:1 ratio: (1) the AI therapy group, who engaged in AI-assisted therapy sessions via the ChatMind app with a requirement of 3 sessions per week for 3 weeks; (2) the ChatGPT group, who completed equivalent sessions with a general chatbot in the ChatGPT mobile app; and (3) the AOC group, who received no intervention. Participants were aware of their assigned groups so that they could perform the relevant tasks and were emailed twice a week to remind them about the experiment. Mental health indices were measured before and after the 3-week intervention protocols using an online self-assessment questionnaire hosted on the OQS platform.</p><p>The sample size was estimated based on a previous RCT [<xref ref-type="bibr" rid="ref30">30</xref>] evaluating a 3-week, human-delivered solution-focused brief therapy intervention, as the AI therapy shares similar characteristics. Using the effect sizes from this study, a range of anticipated mean changes was estimated, and a simulation-based power analysis was conducted. Across different sample sizes, specifying a mixed-effects model accounting for repeated measures design and group differences, power simulations indicated that 16 participants per group would achieve &#x2265;80% power to detect a very large effect size (<italic>d</italic>=1.24). 
Since we were preparing for a high dropout rate, which is common in mobile app research [<xref ref-type="bibr" rid="ref31">31</xref>], we set the minimum number of participants in each group to 26. However, given the aims of this pilot-stage study, statistical power to detect a smaller effect was not the priority. More details on this analysis, including a power analysis report, are described in the project preregistration.</p><p>Participants were recruited using a convenience sampling method through online advertisements (eg, Instagram), emails, and push notifications in a partnered mental health app VOS. The VOS app shares the same parent company as ChatMind but is not an AI-based therapy chatbot. It targets a general, nonclinical population interested in mental well-being and provides general mental-well-being tools such as a mood tracker, guided journaling, breathing exercises, and meditations. Inclusion criteria were minimal; participants were eligible if they were native English-speaking, aged 18 years or older, were not being treated for any psychiatric condition, and had never used the ChatMind AI chatbot.</p><p>Participants were recruited in 2 waves. Enrollment for the first wave took place during November and December 2024 (prospective study registration took place on November 29, 2024); 83 participants were enrolled, but only 76 (92%) completed the baseline survey, of which 9 (12%) records were deleted for completing the questionnaire outside the time schedule or not finishing the questionnaire, resulting in 67 randomized participants in the first wave. To ensure a sufficient sample size for pilot-stage effect size estimates, an additional recruitment wave took place in February 2025. With the same randomization strategy, participants were allocated into groups. 
Of the 102 participants enrolled in this wave, 88 (86%) completed the baseline survey, of which 8 records were excluded as incomplete or off-schedule, resulting in 80 participants in the second wave and 147 participants in total. No safety incidents or adverse events were reported during the study. Consistent with the aims of a pilot RCT, statistical power was not prioritized; instead, the sample size was selected to enable estimation of preliminary effect sizes to provide early-stage evidence and foundational support for forthcoming large-scale trials.</p><p>The final analytic sample comprised 85 (58%) participants from the United States, 21 (14%) from Canada, and 41 (28%) from other predominantly English-speaking countries, including the United Kingdom, Ireland, and Australia. Participants ranged in age from 20 to 74 years (mean 38.4, SD 10.8), and 73% were women.</p></sec><sec id="s2-2"><title>Ethical Considerations</title><p>Participation was voluntary, with the only incentive being trial access to the ChatMind AI chatbot (ie, participants in all conditions received access after the 3-week study period). Informed consent (<xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>) was obtained from all individuals before the baseline assessment. To ensure privacy and confidentiality, all data were pseudonymized at the point of collection and stored on secure, password-protected servers. No personally identifiable information is reported in this study, and only aggregated data are presented to prevent the identification of individual participants. Individuals currently receiving psychiatric treatment were excluded to minimize the risk of distress or adverse reactions. 
The study design was approved by the Ethics Committee at Olomouc University Social Health Institute (OUSHI) (approval September 2, 2024).</p></sec><sec id="s2-3"><title>Measures</title><sec id="s2-3-1"><title>Anxiety Symptoms</title><p>Anxiety was measured using the 7-item Generalized Anxiety Disorder Scale (GAD-7), a 7-item scale assessing anxiety symptoms over the past 2 weeks, rated on a 4-point scale (0=<italic>&#x201C;Not at all&#x201D;</italic> to 3=<italic>&#x201C;Nearly every day&#x201D;</italic>). Total scores range from 0 to 21, with higher scores indicating greater anxiety severity [<xref ref-type="bibr" rid="ref32">32</xref>]. Cronbach &#x03B1; was 0.89 using both baseline and postintervention data.</p></sec><sec id="s2-3-2"><title>Depressive Symptoms</title><p>Depressive symptoms were evaluated using two scales: the Patient Health Questionnaire (PHQ-9) [<xref ref-type="bibr" rid="ref33">33</xref>] and the Overall Depression Severity and Impairment Scale (ODSIS) [<xref ref-type="bibr" rid="ref34">34</xref>]. The PHQ-9 assesses the severity of depressive symptoms over the past 2 weeks through 9 items based on the <italic>Diagnostic and Statistical Manual of Mental Disorders, Fourth Edition</italic> criteria for depression. Responses indicate the frequency of symptoms and are rated on a 4-point scale (0=<italic>&#x201C;Not at all&#x201D;</italic> to 3=<italic>&#x201C;Nearly every day&#x201D;</italic>). Total scores range from 0 to 27, with higher scores indicating more severe symptoms [<xref ref-type="bibr" rid="ref33">33</xref>]. Cronbach &#x03B1; was 0.87 using both pre- and postintervention data. The ODSIS measures the severity and functional impairment of depression. Participants responded to items indicating symptom frequency on a 5-point scale (0=<italic>&#x201C;Not at all&#x201D;</italic> to 4=<italic>&#x201C;All the time&#x201D;</italic>). 
Total scores range from 0 to 20, whereby higher scores indicate greater impairment [<xref ref-type="bibr" rid="ref34">34</xref>]. Based on both baseline and postintervention data, Cronbach &#x03B1; was 0.94.</p></sec><sec id="s2-3-3"><title>Well-Being</title><p>The World Health Organization Well-Being Index (5-item version) (WHO-5) was used to assess subjective well-being. Participants indicated how often they had experienced any of the manifestations of well-being in the past 2 weeks on a 6-point scale (0=<italic>&#x201C;At no time&#x201D;</italic> to 5=<italic>&#x201C;All of the time&#x201D;</italic>), with total scores ranging from 0 to 25 and higher scores indicating greater well-being [<xref ref-type="bibr" rid="ref35">35</xref>,<xref ref-type="bibr" rid="ref36">36</xref>]. The Cronbach &#x03B1; of this tool was 0.90 using the baseline and postintervention data.</p></sec><sec id="s2-3-4"><title>Attitude Toward AI</title><p>To obtain an indicative overview of participants&#x2019; perception of AI, we asked them which of the following attitudes they most related to: enthusiastic, open, neutral, skeptical, or negative.</p><p>For each scale, we used sum scores treated as continuous variables.</p></sec></sec><sec id="s2-4"><title>Intervention</title><sec id="s2-4-1"><title>AI Therapy</title><p>Participants in the AI therapy group were given access to the ChatMind app, which provided AI therapy rooted in SFBT principles via voice and text messaging. A preview of the application is available in <xref ref-type="supplementary-material" rid="app2">Multimedia Appendix 2</xref>. The app consists of 2 types of session lengths, roughly 10 and 30 minutes, although the final length depended on the flow of the conversation. Participants were instructed to complete 1 short session and 1 long session and a third session of their choice per week. Instructions for participants are available in <xref ref-type="supplementary-material" rid="app3">Multimedia Appendix 3</xref>. 
The app incorporated an automated detection system for crisis-related language (eg, references to self-harm or suicidality) that redirected users to national helplines.</p><p>During each session, the AI therapy chatbot first identified the participant&#x2019;s problem and expectations. Then it guided the participant to find a solution or a small step they could take to improve their situation. Conversations operated on GenAI, modified through prompt engineering and specialized architecture. Participants could choose to engage in oral or text communication. Participants were tracked using a unique promo code for using the app, which allowed us to determine whether users started at least 3 sessions per week (if more, it was considered valid, as starting a session did not mean that the respondent had completed it).</p></sec><sec id="s2-4-2"><title>ChatGPT Group</title><p>Participants in this group were asked to download the ChatGPT mobile app, which allows both text and oral communication. From November 2024 to February 2025, free-tier ChatGPT users initially used the GPT-4o model, and after reaching their message limit, the system automatically switched them to the lighter GPT-4o-mini model. Therefore, for most conversations, the 4o model was used, and 4o-mini for the remainder. Participants were instructed to interact with ChatGPT 3 times a week for at least 10 minutes, as if they were talking to an AI therapy chatbot about whatever was bothering them. In terms of safety, we relied on ChatGPT&#x2019;s in-built systems. To check that participants were completing their tasks, they had to provide confirmation each week.</p></sec><sec id="s2-4-3"><title>Assessment-Only Control Group</title><p>Participants in the AOC group completed baseline and follow-up assessments 3 weeks later but did not receive any intervention components. 
AOC participants were instructed not to use any chatbot for psychological intervention during the 3-week study period.</p></sec></sec><sec id="s2-5"><title>Statistical Analysis</title><p>Group differences in demographic variables and baseline differences in outcome measures were estimated using <italic>&#x03C7;</italic>&#x00B2; tests for categorical variables and nonparametric analysis of variance (the Kruskal-Wallis test) for age. A <italic>&#x03C7;</italic>&#x00B2; test was also performed to assess for differential attrition across the study groups. This test revealed a strong trend suggesting that dropout rates were dependent on group assignment (<italic>&#x03C7;</italic>&#x00B2;=5.14; <italic>P</italic>=.08). This signal of differential attrition, driven by a substantially higher dropout rate in the AI therapy group, raises concerns about the validity of a per-protocol analysis (PPA), as this approach becomes susceptible to selection bias that can compromise the initial randomization. Thus, our primary analysis followed the intention-to-treat (ITT) principle to provide an unbiased estimate of the intervention&#x2019;s effectiveness. A secondary PPA, consistent with one of the options outlined in our preregistration, was also conducted to explore the efficacy of the intervention specifically among participants who completed the study. The results of the PPA are presented in supplementary analysis in <xref ref-type="supplementary-material" rid="app4">Multimedia Appendix 4</xref>.</p><p>To evaluate intervention effects, linear mixed-effects models were used. Separate models were fitted for each outcome variable: anxiety (GAD-7), depressive symptoms (PHQ-9), depression severity and impairment (ODSIS), and mental well-being (WHO-5). For the GAD-7, ODSIS, and WHO-5 outcomes, models were fitted with parameters estimated using restricted maximum likelihood. For the PHQ-9 outcome, initial diagnostic checks revealed significant heteroscedasticity. 
To address this, a mixed-effects model was refitted with the nonconstant variance explicitly modeled. All models were adjusted for participants&#x2019; education level to account for baseline differences across groups.</p><p>Each model included fixed effects for time, with measurements taken at baseline and after the 3-week study period (ie, preintervention vs postintervention), experimental group (AI therapy, ChatGPT, and AOC), and the time &#x00D7; group interaction representing the differential change over time by group. Random intercepts for participants accounted for individual differences in baseline scores and changes over time. Initially, AOC was coded as the reference group to derive contrasts between AOC and the 2 active treatment conditions; we then releveled the condition variable coding to directly contrast AI therapy and ChatGPT conditions via planned comparisons. Although the constructs measured together are often statistically related (eg, [<xref ref-type="bibr" rid="ref37">37</xref>]), they are conceptually different. Therefore, we treated the scales as separate, independent outcomes (depression symptoms, anxiety symptoms, depression-related functional impairment, and positive well-being). Following strict adherence to our preregistration, we applied Holm-Bonferroni correction to the 8 preregistered directional hypotheses: 4 tests comparing AI therapy to control (across 4 outcomes) and 4 tests directly comparing AI therapy to ChatGPT (across 4 outcomes). For these 8 preregistered tests, 1-tailed <italic>P</italic>-values were computed based on the directional hypotheses (expecting AI therapy to show greater improvements). 
Comparisons between ChatGPT and control were not preregistered with directional hypotheses and are therefore reported as exploratory analyses with 2-tailed <italic>P</italic>-values and no correction for multiple testing.</p><p>To formally assess the mechanism of missing data, we performed an omnibus test for data being missing completely at random (MCAR). In the MCAR test, the assumptions of multivariate normality and homoscedasticity required for the standard parametric Little&#x2019;s test were violated (Hawkins test, <italic>P</italic>&#x003C;.001). Therefore, we relied on the robust nonparametric alternative. The result of this test was not statistically significant (<italic>P</italic>=.06), providing insufficient evidence from this omnibus test to reject the MCAR null hypothesis. To examine predictors of intervention completion (fidelity) and retention (completing the follow-up survey), we performed a series of logistic regression analyses. In these analyses, independent variables were outcome measures (ie, PHQ-9, ODSIS, WHO-5), age, gender, and attitude toward AI.</p><p>Effect sizes were reported as unstandardized regression coefficients (<italic>b</italic>) and Cohen <italic>d</italic>. Because all outcomes were self-reported by participants, blinding of outcome assessors was not feasible. The researchers conducting the data analysis were not blinded to group assignment; however, all code and analytic decisions were independently reviewed by multiple members of the research team to minimize potential bias. 
All statistical analyses were conducted using R software, version 4.3.0 (R Core Team, 2023) within the RStudio environment, version 2024.04.2.</p></sec></sec><sec id="s3" sec-type="results"><title>Results</title><sec id="s3-1"><title>Participant Characteristics</title><p>The Consolidated Standards of Reporting Trials (CONSORT) flow diagram in <xref ref-type="fig" rid="figure1">Figure 1</xref> illustrates the process of respondent enrollment, allocation into groups, assessment, and intervention. Sample demographics and baseline characteristics for the ITT sample are provided in <xref ref-type="table" rid="table1">Table 1</xref>. Baseline comparisons showed no significant differences across the 3 groups for age or any of the clinical outcome measures (GAD-7, ODSIS, PHQ-9, or WHO-5), with all <italic>P</italic> values &#x003E;.05. However, a Pearson <italic>&#x03C7;</italic>&#x00B2; test with a Monte Carlo simulated <italic>P</italic> value revealed a significant difference in the distribution of education levels across the groups (<italic>&#x03C7;</italic>&#x00B2;=16.07; <italic>P</italic>=.01). The demographic characteristics of the sample are summarized in <xref ref-type="table" rid="table1">Table 1</xref>.</p><fig position="float" id="figure1"><label>Figure 1.</label><caption><p>Consolidated Standards of Reporting Trials flow diagram. 
AI: artificial intelligence.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="mental_v13i1e82642_fig01.png"/></fig><table-wrap id="t1" position="float"><label>Table 1.</label><caption><p>Sample characteristics by assigned group.</p></caption><table id="table1" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Variable</td><td align="left" valign="bottom">AI therapy (n=44)</td><td align="left" valign="bottom">ChatGPT (n=60)</td><td align="left" valign="bottom">Control (n=43)</td><td align="left" valign="bottom">Overall (n=147)</td></tr></thead><tbody><tr><td align="left" valign="top" colspan="5">Age (years)</td></tr><tr><td align="left" valign="top">&#x2003;Mean (SD)</td><td align="left" valign="top">37 (9)</td><td align="left" valign="top">39 (10)</td><td align="left" valign="top">39 (13)</td><td align="left" valign="top">38 (11)</td></tr><tr><td align="left" valign="top">&#x2003;Median (range)</td><td align="left" valign="top">36 (23-71)</td><td align="left" valign="top">37 (20-74)</td><td align="left" valign="top">38 (22-73)</td><td align="left" valign="top">37 (20-74)</td></tr><tr><td align="left" valign="top" colspan="5">Gender, n (%)</td></tr><tr><td align="left" valign="top">&#x2003;Female</td><td align="left" valign="top">28 (64)</td><td align="left" valign="top">42 (70)</td><td align="left" valign="top">37 (86)</td><td align="left" valign="top">107 (73)</td></tr><tr><td align="left" valign="top">&#x2003;Male</td><td align="left" valign="top">16 (36)</td><td align="left" valign="top">18 (30)</td><td align="left" valign="top">6 (14)</td><td align="left" valign="top">40 (27)</td></tr><tr><td align="left" valign="top" colspan="5">Country, n (%)</td></tr><tr><td align="left" valign="top">&#x2003;United States</td><td align="left" valign="top">25 (57)</td><td align="left" valign="top">34 (57)</td><td align="left" valign="top">26 (60)</td><td align="left" valign="top">85 (58)</td></tr><tr><td
align="left" valign="top">&#x2003;Canada</td><td align="left" valign="top">5 (11)</td><td align="left" valign="top">10 (17)</td><td align="left" valign="top">6 (14)</td><td align="left" valign="top">21 (14)</td></tr><tr><td align="left" valign="top">&#x2003;Other</td><td align="left" valign="top">14 (32)</td><td align="left" valign="top">16 (27)</td><td align="left" valign="top">11 (26)</td><td align="left" valign="top">41 (28)</td></tr><tr><td align="left" valign="top" colspan="5">Education, n (%)</td></tr><tr><td align="left" valign="top">&#x2003;High school or less</td><td align="left" valign="top">6 (14)</td><td align="left" valign="top">5 (8.3)</td><td align="left" valign="top">13 (30)</td><td align="left" valign="top">24 (16)</td></tr><tr><td align="left" valign="top">&#x2003;Higher vocational</td><td align="left" valign="top">11 (25)</td><td align="left" valign="top">12 (20)</td><td align="left" valign="top">3 (7.0)</td><td align="left" valign="top">26 (18)</td></tr><tr><td align="left" valign="top">&#x2003;Bachelor&#x2019;s degree</td><td align="left" valign="top">13 (30)</td><td align="left" valign="top">21 (35)</td><td align="left" valign="top">19 (44)</td><td align="left" valign="top">53 (36)</td></tr><tr><td align="left" valign="top">&#x2003;Master&#x2019;s or PhD</td><td align="left" valign="top">14 (32)</td><td align="left" valign="top">22 (37)</td><td align="left" valign="top">8 (19)</td><td align="left" valign="top">44 (30)</td></tr><tr><td align="left" valign="top" colspan="5">Economic status, n (%)</td></tr><tr><td align="left" valign="top">&#x2003;Not currently working</td><td align="left" valign="top">15 (34)</td><td align="left" valign="top">17 (28)</td><td align="left" valign="top">13 (30)</td><td align="left" valign="top">45 (31)</td></tr><tr><td align="left" valign="top">&#x2003;Employed</td><td align="left" valign="top">25 (57)</td><td align="left" valign="top">31 (52)</td><td align="left" valign="top">24 (56)</td><td align="left" 
valign="top">80 (54)</td></tr><tr><td align="left" valign="top">&#x2003;Self-employed</td><td align="left" valign="top">4 (9.1)</td><td align="left" valign="top">12 (20)</td><td align="left" valign="top">6 (14)</td><td align="left" valign="top">22 (15)</td></tr><tr><td align="left" valign="top" colspan="5">Recruitment phase, n (%)</td></tr><tr><td align="left" valign="top">&#x2003;First</td><td align="left" valign="top">22 (50)</td><td align="left" valign="top">26 (43)</td><td align="left" valign="top">19 (44)</td><td align="left" valign="top">67 (46)</td></tr><tr><td align="left" valign="top">&#x2003;Second</td><td align="left" valign="top">22 (50)</td><td align="left" valign="top">34 (57)</td><td align="left" valign="top">24 (56)</td><td align="left" valign="top">80 (54)</td></tr><tr><td align="left" valign="top" colspan="5">Dropout participants, n (%)</td></tr><tr><td align="left" valign="top">&#x2003;No</td><td align="left" valign="top">15 (34)</td><td align="left" valign="top">32 (53)</td><td align="left" valign="top">24 (56)</td><td align="left" valign="top">71 (48)</td></tr><tr><td align="left" valign="top">&#x2003;Yes</td><td align="left" valign="top">29 (66)</td><td align="left" valign="top">28 (47)</td><td align="left" valign="top">19 (44)</td><td align="left" valign="top">76 (52)</td></tr></tbody></table></table-wrap></sec><sec id="s3-2"><title>Feasibility and Engagement</title><p>Full fidelity to the intervention protocol was relatively low in both treatment conditions; 17 (39%) of those in the AI therapy condition completed all intervention sessions, and 38 (62%) of those in the ChatGPT condition completed all sessions. Logistic regression revealed that none of the baseline clinical measures were significant predictors (GAD-7: odds ratio [OR]=0.97, <italic>P</italic>=.456; ODSIS: OR=0.95, <italic>P</italic>=0.23; PHQ-9: OR=0.98, <italic>P</italic>=.64). 
However, older age was significantly associated with a lower likelihood of completing the intervention (OR=0.95; <italic>P</italic>=.03).</p><p>Study retention, in terms of completing the follow-up survey, was 28 (64%) in the AI therapy condition, 36 (60%) in the ChatGPT condition, and 28 (65%) in the AOC condition. Logistic regression revealed that baseline symptom severity was not a significant predictor, although higher baseline ODSIS scores showed a trend toward predicting a lower likelihood of retention (OR=0.92; <italic>P</italic>=.05). In these models, older age again emerged as a significant predictor of lower retention (OR=0.95; <italic>P</italic>=.003). Furthermore, a more positive baseline attitude toward AI significantly predicted a higher likelihood of retention (OR=1.48; <italic>P</italic>=.048).</p></sec><sec id="s3-3"><title>Outcome Analysis</title><p>Descriptive statistics for anxiety, depression, and mental well-being scores at baseline and after the 3-week intervention period, stratified by the experimental groups, are presented in <xref ref-type="supplementary-material" rid="app5">Multimedia Appendix 5</xref>. Kruskal-Wallis tests showed no significant group differences in mental health indices at baseline (<italic>P</italic> value range: .43&#x2010;.94). Although not a major feature of the trial, baseline assessment of attitudes toward AI-based therapy was very favorable (mean 3.05, SD 0.92 on a 4-point scale, where 1=skeptical or negative and 4=enthusiastic).</p><p><xref ref-type="table" rid="table2">Table 2</xref> presents the ITT intervention effect estimates, with unstandardized regression coefficients (<italic>b</italic>) for the interaction terms representing the estimated difference in change between groups from preintervention to postintervention. 
<xref ref-type="table" rid="table3">Table 3</xref> presents the corresponding effect sizes (Cohen <italic>d</italic>) for these interaction effects, along with their 95% CIs.</p><table-wrap id="t2" position="float"><label>Table 2.</label><caption><p>Results of mixed-effects models of temporal changes in anxiety (GAD-7<sup><xref ref-type="table-fn" rid="table2fn1">a</xref></sup>), depression (ODSIS<sup><xref ref-type="table-fn" rid="table2fn2">b</xref></sup> and PHQ-9<sup><xref ref-type="table-fn" rid="table2fn3">c</xref></sup>), and mental well-being (WHO-5<sup><xref ref-type="table-fn" rid="table2fn4">d</xref></sup>) scores across study groups.<sup><xref ref-type="table-fn" rid="table2fn5">e</xref></sup></p></caption><table id="table2" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom"/><td align="left" valign="bottom" colspan="2">Anxiety (GAD-7)</td><td align="left" valign="bottom" colspan="2">Depression (ODSIS)</td><td align="left" valign="bottom" colspan="2">Depression (PHQ-9)</td><td align="left" valign="bottom" colspan="2">Mental well-being (WHO-5)</td></tr></thead><tbody><tr><td align="left" valign="top">Effect</td><td align="left" valign="top"><italic>b</italic><sup><xref ref-type="table-fn" rid="table2fn6">f</xref></sup> (95% CI)</td><td align="left" valign="top"><italic>P</italic> value</td><td align="left" valign="top"><italic>b</italic> (95% CI)</td><td align="left" valign="top"><italic>P</italic> value</td><td align="left" valign="top"><italic>b</italic> (95% CI)</td><td align="left" valign="top"><italic>P</italic> value</td><td align="left" valign="top"><italic>b</italic> (95% CI)</td><td align="left" valign="top"><italic>P</italic> value</td></tr><tr><td align="left" valign="top" colspan="9">Fixed effects</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Intercept</td><td align="left" valign="top">14.37 (10.53 to 18.21)</td><td align="left"
valign="top">&#x003C;.001</td><td align="left" valign="top">11.55 (7.99 to 15.11)</td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">24 (19.69 to 28.30)</td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">9.99 (5.75 to 14.23)</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Time</td><td align="left" valign="top">0.38 (&#x2013;1.32 to 2.08)</td><td align="left" valign="top">.66</td><td align="left" valign="top">0.35 (&#x2013;0.93 to 1.64)</td><td align="left" valign="top">.58</td><td align="left" valign="top">0.64 (&#x2013;0.60 to 1.89)</td><td align="left" valign="top">.31</td><td align="left" valign="top">&#x2013;0.25 (&#x2013;1.66 to 1.16)</td><td align="left" valign="top">.72</td></tr><tr><td align="left" valign="top" colspan="9">Experimental group (reference: control)</td></tr><tr><td align="left" valign="top">&#x2003;AI<sup><xref ref-type="table-fn" rid="table2fn7">g</xref></sup> therapy</td><td align="left" valign="top">&#x2013;0.90 (&#x2013;3.17 to 1.37)</td><td align="left" valign="top">.43</td><td align="left" valign="top">&#x2013;0.22 (&#x2013;2.27 to 1.84)</td><td align="left" valign="top">.83</td><td align="left" valign="top">&#x2013;0.98 (&#x2013;3.23 to 1.26)</td><td align="left" valign="top">.39</td><td align="left" valign="top">0.84 (&#x2013;1.60 to 3.27)</td><td align="left" valign="top">.50</td></tr><tr><td align="left" valign="top">&#x2003;ChatGPT</td><td align="left" valign="top">0.23 (&#x2013;1.89 to 2.36)</td><td align="left" valign="top">.83</td><td align="left" valign="top">0.13 (&#x2013;1.79 to 2.06)</td><td align="left" valign="top">.89</td><td align="left" valign="top">0.28 (&#x2013;2.01 to 2.56)</td><td align="left" valign="top">.81</td><td align="left" valign="top">&#x2013;0.49 (&#x2013;2.77 to 1.79)</td><td align="left" valign="top">.67</td></tr><tr><td 
align="left" valign="top" colspan="9">Interaction effects (reference: control group &#x00D7; time)</td></tr><tr><td align="left" valign="top">&#x2003;AI therapy group &#x00D7; time</td><td align="left" valign="top">&#x2013;1.98 (&#x2013;4.39 to 0.43)</td><td align="left" valign="top">.05 (.37)</td><td align="left" valign="top">&#x2013;1.13 (&#x2013;2.94 to 0.68)</td><td align="left" valign="top">.11 (.66)</td><td align="left" valign="top">&#x2013;2.67 (&#x2013;4.74 to &#x2013;0.60)</td><td align="left" valign="top">.006 (.046)</td><td align="left" valign="top">0.64 (&#x2013;1.35 to 2.64)</td><td align="left" valign="top">.26 (&#x003E;.99)</td></tr><tr><td align="left" valign="top">&#x2003;ChatGPT group &#x00D7; time</td><td align="left" valign="top">&#x2013;1.41 (&#x2013;3.68 to 0.85)</td><td align="left" valign="top">.22</td><td align="left" valign="top">&#x2013;0.54 (&#x2013;2.25 to 1.17)</td><td align="left" valign="top">.53</td><td align="left" valign="top">&#x2013;2.47 (&#x2013;4.61 to &#x2013;0.34)</td><td align="left" valign="top">.02</td><td align="left" valign="top">1.02 (&#x2013;0.86 to 2.90)</td><td align="left" valign="top">.28</td></tr><tr><td align="left" valign="top" colspan="9">Planned comparisons (reference: ChatGPT group &#x00D7; time)</td></tr><tr><td align="left" valign="top">&#x2003;AI therapy group &#x00D7; time</td><td align="left" valign="top">&#x2013;0.57 (&#x2013;2.83 to 1.70)</td><td align="left" valign="top">.31 (&#x003E;.99)</td><td align="left" valign="top">&#x2013;0.59 (&#x2013;2.29 to 1.12)</td><td align="left" valign="top">.25 (&#x003E;.99)</td><td align="left" valign="top">&#x2013;0.19 (&#x2013;2.59 to 2.20)</td><td align="left" valign="top">.44 (&#x003E;.99)</td><td align="left" valign="top">&#x2013;0.38 (&#x2013;2.26 to 1.50)</td><td align="left" valign="top">.66 (&#x003E;.99)</td></tr></tbody></table><table-wrap-foot><fn id="table2fn1"><p><sup>a</sup>GAD-7: 7-item Generalized Anxiety Disorder Scale.</p></fn><fn
id="table2fn2"><p><sup>b</sup>ODSIS: Overall Depression Severity and Impairment Scale.</p></fn><fn id="table2fn3"><p><sup>c</sup>PHQ-9: Patient Health Questionnaire-9.</p></fn><fn id="table2fn4"><p><sup>d</sup>WHO-5: World Health Organization Well-Being Index (5-item version).</p></fn><fn id="table2fn5"><p><sup>e</sup>Models also controlled for age, gender, country, education, employment status, and recruitment wave. <italic>P</italic> values for AI therapy group &#x00D7; time and AI therapy group &#x00D7; time (vs ChatGPT) are 1-tailed based on preregistered directional hypotheses; ChatGPT group &#x00D7; time comparisons are exploratory (not preregistered) and reported with 2-tailed <italic>P</italic> values. For preregistered tests, the main value represents the unadjusted 1-tailed <italic>P</italic> value, with the Holm-Bonferroni adjusted <italic>P</italic> value (corrected across 8 preregistered hypotheses) provided in bold parentheses. Exploratory tests show 2-tailed <italic>P</italic> values without adjustment.</p></fn><fn id="table2fn6"><p><sup>f</sup>b: unstandardized regression coefficient. 
</p></fn><fn id="table2fn7"><p><sup>g</sup>AI: artificial intelligence.</p></fn></table-wrap-foot></table-wrap><table-wrap id="t3" position="float"><label>Table 3.</label><caption><p>Effect sizes (Cohen <italic>d</italic>, 95% CI) for intention-to-treat intervention effects.<sup><xref ref-type="table-fn" rid="table3fn1">a</xref></sup></p></caption><table id="table3" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Effect</td><td align="left" valign="bottom">Anxiety (GAD-7<sup><xref ref-type="table-fn" rid="table3fn2">b</xref></sup>), Cohen <italic>d</italic><sup><xref ref-type="table-fn" rid="table3fn6">f</xref></sup> (95% CI)</td><td align="left" valign="bottom">Depression (ODSIS<sup><xref ref-type="table-fn" rid="table3fn3">c</xref></sup>), Cohen <italic>d</italic> (95% CI)</td><td align="left" valign="bottom">Depression (PHQ-9<sup><xref ref-type="table-fn" rid="table3fn4">d</xref></sup>), Cohen <italic>d</italic> (95% CI)</td><td align="left" valign="bottom">Mental well-being (WHO-5<sup><xref ref-type="table-fn" rid="table3fn5">e</xref></sup>), Cohen <italic>d</italic> (95% CI)</td></tr></thead><tbody><tr><td align="left" valign="top" colspan="5">Interaction effects (reference: control group &#x00D7; time)</td></tr><tr><td align="left" valign="top">&#x2003;AI<sup><xref ref-type="table-fn" rid="table3fn7">g</xref></sup> therapy group &#x00D7; time</td><td align="left" valign="top">&#x2212;0.37 (&#x2212;0.83 to 0.08)</td><td align="left" valign="top">&#x2212;0.25 (&#x2212;0.66 to 0.15)</td><td align="left" valign="top">&#x2212;0.47 (&#x2212;0.84 to &#x2212;0.11)</td><td align="left" valign="top">0.12 (&#x2212;0.26 to 0.51)</td></tr><tr><td align="left" valign="top">&#x2003;ChatGPT group &#x00D7; time</td><td align="left" valign="top">&#x2212;0.27 (&#x2212;0.70 to 0.16)</td><td align="left" valign="top">&#x2212;0.12 (&#x2212;0.50 to 0.26)</td><td align="left" valign="top">&#x2212;0.44 (&#x2212;0.82 to &#x2212;0.06)</td><td align="left" 
valign="top">0.20 (&#x2212;0.17 to 0.56)</td></tr><tr><td align="left" valign="top" colspan="5">Planned comparisons (reference: ChatGPT group &#x00D7; time)</td></tr><tr><td align="left" valign="top">&#x2003;AI therapy group &#x00D7; time</td><td align="left" valign="top">&#x2212;0.11 (&#x2212;0.54 to 0.32)</td><td align="left" valign="top">&#x2212;0.13 (&#x2212;0.51 to 0.25)</td><td align="left" valign="top">&#x2212;0.03 (&#x2212;0.46 to 0.39)</td><td align="left" valign="top">&#x2212;0.07 (&#x2212;0.44 to 0.29)</td></tr></tbody></table><table-wrap-foot><fn id="table3fn1"><p><sup>a</sup>Cohen <italic>d</italic> was calculated by dividing the unstandardized regression coefficient (<italic>b</italic>) and its CI by the pooled baseline SD. A negative <italic>d</italic> indicates a greater reduction in symptoms for the nonreference group.</p></fn><fn id="table3fn2"><p><sup>b</sup>GAD-7: 7-item Generalized Anxiety Disorder Scale.</p></fn><fn id="table3fn3"><p><sup>c</sup>ODSIS: Overall Depression Severity and Impairment Scale.</p></fn><fn id="table3fn4"><p><sup>d</sup>PHQ-9: Patient Health Questionnaire-9.</p></fn><fn id="table3fn5"><p><sup>e</sup>WHO-5: World Health Organization Well-Being Index (5-item version).</p></fn><fn id="table3fn6"><p><sup>f</sup>b: unstandardized regression coefficient. </p></fn><fn id="table3fn7"><p><sup>g</sup>AI: artificial intelligence.</p></fn></table-wrap-foot></table-wrap><p>During preregistered hypothesis testing, it was found that the AI therapy group exhibited a statistically significant reduction in PHQ-9 depressive symptoms compared to the control group with a 2.67 point greater reduction (<italic>d</italic>=&#x2212;0.47, 1-tailed and noncorrected <italic>P</italic>=.006, corrected <italic>P</italic>=.046), which remained significant after Holm-Bonferroni correction for the 8 preregistered hypotheses. 
The AI therapy group also showed trends toward greater improvement in anxiety symptoms (GAD-7: 1.98-point reduction, <italic>d</italic>=&#x2212;0.37) and ODSIS depression functional impairment scores (1.13-point reduction, <italic>d</italic>=&#x2212;0.25), although these did not reach statistical significance. No significant change in well-being (as measured by the WHO-5) was observed compared to the control group.</p><p>During nonpreregistered exploratory analyses, we examined differences between the ChatGPT group and the control group in the outcome measures. The ChatGPT group showed a significant 2.47-point greater reduction in PHQ-9 depressive symptoms (<italic>d</italic>=&#x2212;0.44, 2-tailed <italic>P</italic>=.02), as well as nonsignificant improvements in anxiety symptoms (<italic>d</italic>=&#x2212;0.27) and ODSIS scores (<italic>d</italic>=&#x2212;0.12). These exploratory results were not subject to multiple comparison correction. As shown in the supplemental analyses in <xref ref-type="supplementary-material" rid="app4">Multimedia Appendix 4</xref>, these results were largely consistent with the per-protocol results.</p><p>The next set of models comprised the planned comparisons between the AI therapy and ChatGPT (reference group) conditions, as shown in the lower half of <xref ref-type="table" rid="table2">Tables 2</xref> and <xref ref-type="table" rid="table3">3</xref>. Although none of the estimates reached statistical significance, the AI therapy group showed small, favorable effect size trends compared to the ChatGPT group for anxiety (<italic>d</italic>=&#x2212;0.11), ODSIS depression severity and impairment scores (<italic>d</italic>=&#x2212;0.13), and PHQ-9 depressive symptoms (<italic>d</italic>=&#x2212;0.03), but not for well-being (<italic>d</italic>=&#x2212;0.07). 
In the PPA, the ChatGPT group showed numerically larger reductions in depression scores (ODSIS and PHQ-9) compared to AI therapy, but these differences were very small and not statistically significant (<xref ref-type="supplementary-material" rid="app4">Multimedia Appendix 4</xref>).</p></sec></sec><sec id="s4" sec-type="discussion"><title>Discussion</title><sec id="s4-1"><title>Principal Findings</title><p>As digital therapy alternatives rapidly evolve, including GenAI-based therapy chatbots, there is a need for careful, iterative testing of these novel therapeutic modalities. This pilot study provides early-stage proof of concept for a brief 3-week (9 sessions) AI therapy chatbot intervention based on solution-focused principles (ie, ChatMind), relative to a standard untrained chatbot (GPT-4o-based models) condition and an AOC condition. As described below, findings provide foundational support for the overall promise/merits of GenAI chatbot therapy while also elucidating key areas of improvement regarding feasibility.</p></sec><sec id="s4-2"><title>Clinical Outcomes</title><sec id="s4-2-1"><title>Overview of Findings</title><p>Overall, both the AI therapy group and the ChatGPT group showed significant reductions in depressive symptoms and nonsignificant improvements in anxiety symptoms compared to the AOC. Changes in well-being scores were not significant in any group. Neither AI group significantly outperformed the other, although the AI therapy group exhibited greater descriptive changes. These findings should be interpreted as preliminary trends rather than definitive evidence of efficacy, given the small sample size and limited statistical power of the study.</p></sec><sec id="s4-2-2"><title>Depression</title><p>Both the AI therapy and ChatGPT groups demonstrated a statistically significant reduction in depressive symptoms (PHQ-9), while functional impairment, as measured by ODSIS, remained unchanged. 
This suggests that AI interventions may influence symptom severity more than daily life functioning. Overall, the reduction in depressive symptoms aligns with previous meta-analyses highlighting the short-term effectiveness of CAs on depression [<xref ref-type="bibr" rid="ref27">27</xref>]. The effect sizes achieved by the AI interventions on the PHQ-9 (AI therapy: <italic>d</italic>=&#x2212;0.47; ChatGPT: <italic>d</italic>=&#x2212;0.44) are comparable to those reported for psychotherapies for depression, which typically yield standardized mean differences ranging from 0.11 to 0.61 [<xref ref-type="bibr" rid="ref38">38</xref>]. Although these reductions reached statistical significance, the mean changes in PHQ-9 scores (&#x2212;2.7 points for AI therapy; &#x2212;2.5 for ChatGPT) did not meet the commonly accepted minimal clinically important difference of approximately 3.3 points [<xref ref-type="bibr" rid="ref39">39</xref>]. On both measures, the AI therapy group showed greater reductions, although these differences were not statistically significant compared to the ChatGPT group. The AI therapy intervention in this study, though based on GenAI, followed structured prompts emphasizing ventilation and goal setting inspired by SFBT, which has demonstrated effectiveness for depression [<xref ref-type="bibr" rid="ref40">40</xref>]. This structured approach may have contributed to the greater descriptive improvements compared to the unstructured ChatGPT intervention.</p></sec><sec id="s4-2-3"><title>Anxiety</title><p>Both the AI therapy group and the ChatGPT group demonstrated nonsignificant reductions in anxiety symptoms. The descriptive change fell below the minimal clinically important difference threshold of about 3.7 points [<xref ref-type="bibr" rid="ref39">39</xref>]. 
A longer intervention may be required for these effects to reach statistical significance, although previous meta-analytic evidence suggests that CAs can have short-term effects on both generalized and specific anxiety [<xref ref-type="bibr" rid="ref26">26</xref>,<xref ref-type="bibr" rid="ref27">27</xref>]. Given the nature of anxiety, the real-time availability of CAs may be one factor making them effective in the short term. Furthermore, AI&#x2019;s ability to detect and reframe cognitive distortions [<xref ref-type="bibr" rid="ref41">41</xref>], which often contribute to anxiety, may help reduce its symptoms. Given AI&#x2019;s current restriction to verbal communication, its potential may be strongest in text-based cognitive interventions. Importantly, this remains only a potential, and it is unclear whether AI can deliver such interventions without specific prompting. Recent research even suggests that GenAI models may themselves exhibit metaphorical &#x201C;state anxiety&#x201D; when exposed to trauma-related narratives [<xref ref-type="bibr" rid="ref42">42</xref>], indicating that specific prompting or other adjustments may be necessary to optimize AI responses to anxious input.</p></sec><sec id="s4-2-4"><title>Well-Being</title><p>In our study, both intervention groups showed slight, nonsignificant improvements in well-being, while the control group declined. The effect of CAs on well-being has been inconsistent across previous studies. Although a meta-analysis by Zhong et al shows short-term gains in well-being after a CA intervention [<xref ref-type="bibr" rid="ref26">26</xref>], another by He et al does not [<xref ref-type="bibr" rid="ref27">27</xref>]. Even though the WHO-5 questionnaire is sensitive to intervention-related changes [<xref ref-type="bibr" rid="ref36">36</xref>], well-being is considered a relatively stable construct across the lifespan [<xref ref-type="bibr" rid="ref43">43</xref>], which may limit the short-term impact of CAs. 
The therapeutic approach that is most commonly integrated into CAs, cognitive behavioral therapy [<xref ref-type="bibr" rid="ref44">44</xref>], appears to be more effective in reducing negative affect than in enhancing positive affect [<xref ref-type="bibr" rid="ref45">45</xref>]. This difference could explain the more consistent effects on depression and anxiety compared to well-being. In contrast, SFBT, which underpinned the AI therapy intervention, has demonstrated effectiveness for both positive and negative affect [<xref ref-type="bibr" rid="ref46">46</xref>]. Because cognitive behavioral therapy is often symptom-focused, its integration into CAs may be effective for reducing targeted issues like depression or anxiety, but less so for promoting overall well-being, highlighting the potential benefit of including elements from broader therapeutic frameworks.</p></sec><sec id="s4-2-5"><title>Comparison of Two Chatbots</title><p>A key strength of our study is the direct comparison of a structured AI therapy chatbot with an unstructured general-purpose one. Neither chatbot was found to significantly outperform the other in any outcome. In the ITT analysis, the AI therapy group showed slightly larger reductions than the ChatGPT group, with small effect sizes favoring AI therapy for anxiety (AI therapy: <italic>d</italic>=&#x2212;0.37 vs ChatGPT: <italic>d</italic>=&#x2212;0.27), ODSIS depression (AI therapy: <italic>d</italic>=&#x2212;0.25 vs ChatGPT: <italic>d</italic>=&#x2212;0.12), and PHQ-9 depression (AI therapy: <italic>d</italic>=&#x2212;0.47 vs ChatGPT: <italic>d</italic>=&#x2212;0.44). However, in the per-protocol analysis, this pattern reversed for depression: the ChatGPT group achieved slightly greater reductions in PHQ-9 and ODSIS scores. This discrepancy may reflect differences in adherence or user engagement, as per-protocol analysis includes only participants who completed the intervention as intended. 
While the results of the ITT analysis may be closer to a real-life scenario, the per-protocol analysis is closer to the ideal situation. These differences should be interpreted with caution. However, they also highlight the need to examine which features, such as the AI model used, conversation flow, or therapeutic framing, drive effectiveness. We do not yet know what the determinants of the effectiveness of CAs are; however, recent studies suggest that prompt engineering influences their relevance, empathy, and contextual responses [<xref ref-type="bibr" rid="ref33">33</xref>].</p></sec><sec id="s4-2-6"><title>Factors Influencing Effectiveness</title><p>The emergence of GenAI represents a fundamental shift: unlike older retrieval-based or rule-based systems, generative models can produce original and coherent text [<xref ref-type="bibr" rid="ref47">47</xref>]. Our findings revealed descriptive trends indicating that structured AI interactions led to greater results in depression and anxiety changes than in the ChatGPT group, raising questions about which features, such as the AI model used, conversation flow, or therapeutic framing, drive effectiveness. In line with our results, previous research suggests that prompt engineering influences the CA&#x2019;s relevance, empathy, and contextual responses [<xref ref-type="bibr" rid="ref33">33</xref>].</p><p>When we compared our results thoroughly with previous studies, we encountered several obstacles. While our study compared 2 generative chatbots with a control group, most earlier studies examined rule-based or retrieval-based CAs, limiting the generalizability of their findings to current models used in our trial. Moreover, many studies fail to report these crucial technical details, and even meta-analyses do not account for these differences [<xref ref-type="bibr" rid="ref26">26</xref>,<xref ref-type="bibr" rid="ref48">48</xref>]. 
Recent evidence indicates that GenAI chatbots may achieve larger effects on mental health outcomes compared to rule-based agents [<xref ref-type="bibr" rid="ref28">28</xref>], and perform better in giving empathetic responses and establishing the alliance between the CA and the user [<xref ref-type="bibr" rid="ref27">27</xref>]. Systematic comparisons between different types of CAs are therefore essential to identify which specific features drive the effectiveness of CAs.</p></sec></sec><sec id="s4-3"><title>Feasibility</title><p>The multinational sample of nontreatment-seeking adults generally reported favorable attitudes toward AI-based therapy assessed at baseline; however, the suboptimal adherence to intervention protocols may suggest waning interest once involved. Indeed, only 39% of those in the AI therapy condition fully adhered to the 9-session protocol. This pattern may reflect limited engagement among participants without acute treatment needs and is an important consideration in our study of healthy, nontreatment-seeking samples. Fidelity was higher in the ChatGPT group (62%), likely due to several factors. Accessing ChatMind required extra steps, such as obtaining a promo code, which may have discouraged some participants. The structured, solution-focused session format may also have reduced engagement compared with the more flexible ChatGPT experience. Another possible contributing factor could have been differences in overall user-friendliness. Notably, participants with higher baseline depression severity and impairment on the ODSIS scale were more likely to adhere to the full protocol, although this trend did not reach statistical significance. However, this was not the case for higher depression symptom scores measured by the PHQ-9, suggesting greater adherence in those whose symptoms of depression had already begun to interfere with their lives. 
The relatively rigid structure of the current protocol (3 sessions per week for 3 weeks) may have also contributed to lower protocol adherence. In contrast, real-world applications of AI therapy are likely to be more flexible, allowing individuals to engage when most needed and at a preferred pace. Furthermore, this pilot tested a single therapeutic approach (SFBT), which may not resonate with all users or meet a wide range of needs and preferences. The fixed protocol may have felt repetitive for some participants, further limiting sustained engagement. Looking ahead, AI therapy tools will likely need to emulate the flexibility and adaptability of human therapists by tailoring interactions to patient preferences, symptom severity, and evolving goals to maximize engagement and therapeutic impact. Future feasibility research should focus on clinical, treatment-seeking samples, explore adaptive or flexible treatment models, and further evaluate the optimal number and pacing of AI therapy sessions.</p></sec><sec id="s4-4"><title>Strengths and Limitations</title><p>Our study is one of the few RCTs to investigate the effectiveness of a generative mental health chatbot. The field of AI is rapidly advancing, and our study focuses on instruments that use the most recent AI models, underscoring its urgency and relevance. To the best of our knowledge, we are the first to compare 2 generative chatbots against a control group, which is the strongest aspect of our study. Furthermore, the study code and data are freely available online so that findings from this study can be easily replicated.</p><p>The study also has several limitations. The first one is a high attrition rate, which is a common challenge in short-term CA intervention studies [<xref ref-type="bibr" rid="ref49">49</xref>]. 
We addressed this limitation with a second round of participant recruitment, but although the targeted sample size estimated by power analysis was achieved, a larger sample would still likely be needed to detect smaller effects. The second limitation is the intervention length. The third limitation relates to the nature of the GenAI on which both interventions were based, as it inherently limits control over the conversation flow and content compared to the previously studied rule-based or retrieval-based chatbots. However, this also allowed for more naturalistic data and greater ecological validity. The fourth limitation is a lack of data on the exact length of interventions. We were not able to track the total time participants spent conversing within the AI therapy and ChatGPT groups. Nonetheless, this reflects a common limitation in studies of unsupervised digital interventions. The fifth limitation is that we did not specify in the guidelines that participants should not start any psychological treatment, only that they should not use another chatbot for therapeutic purposes. A final limitation of the present study is the absence of detailed engagement data, such as session duration or use of voice versus text input. Future studies should incorporate more precise tracking of user interaction patterns to better evaluate engagement and adherence.</p></sec><sec id="s4-5"><title>Implications</title><p>Future research should investigate the long-term effects of AI-based psychological interventions, as most studies, including ours, assess only short-term outcomes. Extended intervention periods and follow-up assessments are needed to evaluate sustainability and rule out novelty effects. 
Comparative studies should also explore different AI types, delivery formats (eg, text vs voice), and therapeutic approaches embedded in chatbots.</p><p>Regarding implications for practice, our results underscore that not all AI-based mental health tools are equal: therapeutic outcomes may critically depend on how AI is deployed in a particular chatbot, including the use of prompt engineering, conversation design, and alignment with established therapeutic frameworks. For chatbot developers, it will be important to build on development practices as well as psychological foundations that are supported by research, evaluate the effectiveness of specific chatbots through new research, and identify new factors contributing to their effectiveness.</p></sec><sec id="s4-6"><title>Conclusion</title><p>This study evaluated the effectiveness of a structured, generative chatbot rooted in solution-focused brief therapy compared to a general-purpose GenAI chatbot (ChatGPT) and a no-intervention control group over 3 weeks. Both the AI therapy and ChatGPT groups demonstrated a significant reduction in depressive symptoms compared to the control group. These findings support the potential of GenAI interventions for mental health. 
Further comparative studies are essential to identify the specific design features and therapeutic mechanisms that contribute to the effectiveness of AI-based mental health tools.</p></sec></sec></body><back><ack><p>The authors would like to thank the ChatMind app for providing access to the app for respondents.</p></ack><notes><sec><title>Funding</title><p>The work was supported by ERDF/ESF project DigiWELL (number CZ.02.01.01/00/22_008/0004583) and IGA_CMTF_2025_008.</p></sec><sec><title>Data Availability</title><p>The data, analytical scripts, and further supplementary analyses used to produce the results of this study are freely available on the Open Science Framework [<xref ref-type="bibr" rid="ref50">50</xref>].</p></sec></notes><fn-group><fn fn-type="con"><p>BK, LN, and RZ contributed to the conception of the study. BK drafted the manuscript, designed the intervention process and content, recruited participants, and distributed the assessment tools. LN set up the assessment on the online platform. JF and LN performed the statistical analysis and interpreted the results. VH served as the research supervisor. All authors critically revised the manuscript and approved the final version.</p></fn><fn fn-type="conflict"><p>BK was employed at the company that owns the ChatMind app and was involved in its development. The company provided access to the app for research purposes but had no influence on the study design, data collection, statistical analysis, interpretation, or manuscript preparation. Data analyses were conducted independently by researchers unaffiliated with the company.</p></fn><fn fn-type="other"><p><bold>Editorial Notice</bold></p><p>This randomized study was registered in OSF prospectively (prior to data observation) because the platform allows for comprehensive sharing of study materials, and OSF is traditionally used at the authors' institution as a credible platform for psychological research. 
The editor granted an exception from ICMJE rules mandating prospective registration of randomized trials in a primary registry in the WHO registry network because the risk of bias appears low and the study was considered formative, guiding the development of the chatbot application. However, readers are advised to carefully assess the validity of any potential explicit or implicit claims related to primary outcomes or effectiveness, as retrospective registration does not prevent authors from changing their outcome measures retrospectively.</p></fn></fn-group><glossary><title>Abbreviations</title><def-list><def-item><term id="abb1">AI</term><def><p>artificial intelligence</p></def></def-item><def-item><term id="abb2">AOC</term><def><p>assessment-only control</p></def></def-item><def-item><term id="abb3">CA</term><def><p>conversational agent</p></def></def-item><def-item><term id="abb4">CBT</term><def><p>cognitive behavioral therapy</p></def></def-item><def-item><term id="abb5">CONSORT</term><def><p>Consolidated Standards of Reporting Trials</p></def></def-item><def-item><term id="abb6">DMHI</term><def><p>digital mental health intervention</p></def></def-item><def-item><term id="abb7">GAD-7</term><def><p>7-item Generalized Anxiety Disorder Scale</p></def></def-item><def-item><term id="abb8">GenAI</term><def><p>generative artificial intelligence</p></def></def-item><def-item><term id="abb9">ITT</term><def><p>intention-to-treat</p></def></def-item><def-item><term id="abb10">MCAR</term><def><p>missing completely at random</p></def></def-item><def-item><term id="abb11">ODSIS</term><def><p>Overall Depression Severity and Impairment Scale</p></def></def-item><def-item><term id="abb12">OR</term><def><p>odds ratio</p></def></def-item><def-item><term id="abb13">PHQ-9</term><def><p>Patient Health Questionnaire-9</p></def></def-item><def-item><term id="abb14">PPA</term><def><p>per-protocol analysis</p></def></def-item><def-item><term id="abb15">RCT</term><def><p>randomized 
controlled trial</p></def></def-item><def-item><term id="abb16">SFBT</term><def><p>solution-focused brief therapy</p></def></def-item><def-item><term id="abb17">WHO-5</term><def><p>World Health Organization Well-Being Index (5-item version)</p></def></def-item></def-list></glossary><ref-list><title>References</title><ref id="ref1"><label>1</label><nlm-citation citation-type="web"><article-title>GBD results</article-title><source>Institute for Health Metrics and Evaluation (IHME)</source><access-date>2025-06-06</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://vizhub.healthdata.org/gbd-results">https://vizhub.healthdata.org/gbd-results</ext-link></comment></nlm-citation></ref><ref id="ref2"><label>2</label><nlm-citation citation-type="web"><article-title>GBD compare</article-title><source>Institute for Health Metrics and Evaluation</source><access-date>2025-03-18</access-date><comment><ext-link ext-link-type="uri" xlink:href="http://vizhub.healthdata.org/gbd-compare">http://vizhub.healthdata.org/gbd-compare</ext-link></comment></nlm-citation></ref><ref id="ref3"><label>3</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>McGinty</surname><given-names>EE</given-names> </name><name name-style="western"><surname>Eisenberg</surname><given-names>MD</given-names> </name></person-group><article-title>Mental health treatment gap-the implementation problem as a research problem</article-title><source>JAMA Psychiatry</source><year>2022</year><month>08</month><day>1</day><volume>79</volume><issue>8</issue><fpage>746</fpage><lpage>747</lpage><pub-id pub-id-type="doi">10.1001/jamapsychiatry.2022.1468</pub-id><pub-id pub-id-type="medline">35704300</pub-id></nlm-citation></ref><ref id="ref4"><label>4</label><nlm-citation citation-type="report"><article-title>Mental health has bigger challenges than stigma &#x2013; rapid 
report</article-title><year>2021</year><access-date>2026-03-10</access-date><publisher-name>Sapien Labs</publisher-name><comment><ext-link ext-link-type="uri" xlink:href="https://mentalstateoftheworld.report/wp-content/uploads/2021/05/Rapid-Report-2021-Help-Seeking.pdf">https://mentalstateoftheworld.report/wp-content/uploads/2021/05/Rapid-Report-2021-Help-Seeking.pdf</ext-link></comment></nlm-citation></ref><ref id="ref5"><label>5</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Moitra</surname><given-names>M</given-names> </name><name name-style="western"><surname>Santomauro</surname><given-names>D</given-names> </name><name name-style="western"><surname>Collins</surname><given-names>PY</given-names> </name><etal/></person-group><article-title>The global gap in treatment coverage for major depressive disorder in 84 countries from 2000-2019: a systematic review and Bayesian meta-regression analysis</article-title><source>PLoS Med</source><year>2022</year><month>02</month><volume>19</volume><issue>2</issue><fpage>e1003901</fpage><pub-id pub-id-type="doi">10.1371/journal.pmed.1003901</pub-id><pub-id pub-id-type="medline">35167593</pub-id></nlm-citation></ref><ref id="ref6"><label>6</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Peipert</surname><given-names>A</given-names> </name><name name-style="western"><surname>Krendl</surname><given-names>AC</given-names> </name><name name-style="western"><surname>Lorenzo-Luaces</surname><given-names>L</given-names> </name></person-group><article-title>Waiting lists for psychotherapy and provider attitudes toward low-intensity treatments as potential interventions: survey study</article-title><source>JMIR Form Res</source><year>2022</year><month>09</month><day>16</day><volume>6</volume><issue>9</issue><fpage>e39787</fpage><pub-id pub-id-type="doi">10.2196/39787</pub-id><pub-id 
pub-id-type="medline">36112400</pub-id></nlm-citation></ref><ref id="ref7"><label>7</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Rastpour</surname><given-names>A</given-names> </name><name name-style="western"><surname>McGregor</surname><given-names>C</given-names> </name></person-group><article-title>Predicting patient wait times by using highly deidentified data in mental health care: enhanced machine learning approach</article-title><source>JMIR Ment Health</source><year>2022</year><month>08</month><day>9</day><volume>9</volume><issue>8</issue><fpage>e38428</fpage><pub-id pub-id-type="doi">10.2196/38428</pub-id><pub-id pub-id-type="medline">35943774</pub-id></nlm-citation></ref><ref id="ref8"><label>8</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Conroy</surname><given-names>J</given-names> </name><name name-style="western"><surname>Lin</surname><given-names>L</given-names> </name><name name-style="western"><surname>Ghaness</surname><given-names>A</given-names> </name></person-group><article-title>Why people aren&#x2019;t getting the care they need</article-title><source>Monit Psychol</source><year>2020</year><access-date>2026-03-10</access-date><volume>51</volume><issue>5</issue><comment><ext-link ext-link-type="uri" xlink:href="https://www.apa.org/monitor/2020/07/datapoint-care">https://www.apa.org/monitor/2020/07/datapoint-care</ext-link></comment></nlm-citation></ref><ref id="ref9"><label>9</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Andrade</surname><given-names>LH</given-names> </name><name name-style="western"><surname>Alonso</surname><given-names>J</given-names> </name><name name-style="western"><surname>Mneimneh</surname><given-names>Z</given-names> </name><etal/></person-group><article-title>Barriers to mental health 
treatment: results from the WHO World Mental Health surveys</article-title><source>Psychol Med</source><year>2014</year><month>04</month><volume>44</volume><issue>6</issue><fpage>1303</fpage><lpage>1317</lpage><pub-id pub-id-type="doi">10.1017/S0033291713001943</pub-id><pub-id pub-id-type="medline">23931656</pub-id></nlm-citation></ref><ref id="ref10"><label>10</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Co&#x00EA;lho</surname><given-names>BM</given-names> </name><name name-style="western"><surname>Santana</surname><given-names>GL</given-names> </name><name name-style="western"><surname>Viana</surname><given-names>MC</given-names> </name><name name-style="western"><surname>Wang</surname><given-names>YP</given-names> </name><name name-style="western"><surname>Andrade</surname><given-names>LH</given-names> </name></person-group><article-title>&#x201C;I don&#x2019;t need any treatment&#x201D; - barriers to mental health treatment in the general population of a megacity</article-title><source>Braz J Psychiatry</source><year>2021</year><volume>43</volume><issue>6</issue><fpage>590</fpage><lpage>598</lpage><pub-id pub-id-type="doi">10.1590/1516-4446-2020-1448</pub-id><pub-id pub-id-type="medline">33950152</pub-id></nlm-citation></ref><ref id="ref11"><label>11</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Torous</surname><given-names>J</given-names> </name><name name-style="western"><surname>J&#x00E4;n Myrick</surname><given-names>K</given-names> </name><name name-style="western"><surname>Rauseo-Ricupero</surname><given-names>N</given-names> </name><name name-style="western"><surname>Firth</surname><given-names>J</given-names> </name></person-group><article-title>Digital mental health and COVID-19: using technology today to accelerate the curve on access and quality tomorrow</article-title><source>JMIR Ment 
Health</source><year>2020</year><month>03</month><day>26</day><volume>7</volume><issue>3</issue><fpage>e18848</fpage><pub-id pub-id-type="doi">10.2196/18848</pub-id><pub-id pub-id-type="medline">32213476</pub-id></nlm-citation></ref><ref id="ref12"><label>12</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Aboujaoude</surname><given-names>E</given-names> </name><name name-style="western"><surname>Gega</surname><given-names>L</given-names> </name><name name-style="western"><surname>Parish</surname><given-names>MB</given-names> </name><name name-style="western"><surname>Hilty</surname><given-names>DM</given-names> </name></person-group><article-title>Editorial: digital interventions in mental health: current status and future directions</article-title><source>Front Psychiatry</source><year>2020</year><volume>11</volume><fpage>111</fpage><pub-id pub-id-type="doi">10.3389/fpsyt.2020.00111</pub-id><pub-id pub-id-type="medline">32174858</pub-id></nlm-citation></ref><ref id="ref13"><label>13</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lucas</surname><given-names>GM</given-names> </name><name name-style="western"><surname>Gratch</surname><given-names>J</given-names> </name><name name-style="western"><surname>King</surname><given-names>A</given-names> </name><name name-style="western"><surname>Morency</surname><given-names>LP</given-names> </name></person-group><article-title>It&#x2019;s only a computer: virtual humans increase willingness to disclose</article-title><source>Comput Human Behav</source><year>2014</year><month>08</month><volume>37</volume><fpage>94</fpage><lpage>100</lpage><pub-id pub-id-type="doi">10.1016/j.chb.2014.04.043</pub-id></nlm-citation></ref><ref id="ref14"><label>14</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name 
name-style="western"><surname>Omylinska-Thurston</surname><given-names>J</given-names> </name><name name-style="western"><surname>Aithal</surname><given-names>S</given-names> </name><name name-style="western"><surname>Liverpool</surname><given-names>S</given-names> </name><etal/></person-group><article-title>Digital psychotherapies for adults experiencing depressive symptoms: systematic review and meta-analysis</article-title><source>JMIR Ment Health</source><year>2024</year><month>09</month><day>30</day><volume>11</volume><fpage>e55500</fpage><pub-id pub-id-type="doi">10.2196/55500</pub-id><pub-id pub-id-type="medline">39348177</pub-id></nlm-citation></ref><ref id="ref15"><label>15</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Pauley</surname><given-names>D</given-names> </name><name name-style="western"><surname>Cuijpers</surname><given-names>P</given-names> </name><name name-style="western"><surname>Papola</surname><given-names>D</given-names> </name><name name-style="western"><surname>Miguel</surname><given-names>C</given-names> </name><name name-style="western"><surname>Karyotaki</surname><given-names>E</given-names> </name></person-group><article-title>Two decades of digital interventions for anxiety disorders: a systematic review and meta-analysis of treatment effectiveness</article-title><source>Psychol Med</source><year>2023</year><month>01</month><volume>53</volume><issue>2</issue><fpage>567</fpage><lpage>579</lpage><pub-id pub-id-type="doi">10.1017/S0033291721001999</pub-id><pub-id pub-id-type="medline">34047264</pub-id></nlm-citation></ref><ref id="ref16"><label>16</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Willemsen</surname><given-names>RF</given-names> </name><name name-style="western"><surname>Versluis</surname><given-names>A</given-names> </name><name 
name-style="western"><surname>Aardoom</surname><given-names>JJ</given-names> </name><etal/></person-group><article-title>Evaluation of completely online psychotherapy with app-support versus therapy as usual for clients with depression or anxiety disorder: a retrospective matched cohort study investigating the effectiveness, efficiency, client satisfaction, and costs</article-title><source>Int J Med Inform</source><year>2024</year><month>09</month><volume>189</volume><fpage>105485</fpage><pub-id pub-id-type="doi">10.1016/j.ijmedinf.2024.105485</pub-id><pub-id pub-id-type="medline">38815315</pub-id></nlm-citation></ref><ref id="ref17"><label>17</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Koulouri</surname><given-names>T</given-names> </name><name name-style="western"><surname>Macredie</surname><given-names>RD</given-names> </name><name name-style="western"><surname>Olakitan</surname><given-names>D</given-names> </name></person-group><article-title>Chatbots to support young adults&#x2019; mental health: an exploratory study of acceptability</article-title><source>ACM Trans Interact Intell Syst</source><year>2022</year><month>06</month><day>30</day><volume>12</volume><issue>2</issue><fpage>1</fpage><lpage>39</lpage><pub-id pub-id-type="doi">10.1145/3485874</pub-id></nlm-citation></ref><ref id="ref18"><label>18</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Hornstein</surname><given-names>S</given-names> </name><name name-style="western"><surname>Zantvoort</surname><given-names>K</given-names> </name><name name-style="western"><surname>Lueken</surname><given-names>U</given-names> </name><name name-style="western"><surname>Funk</surname><given-names>B</given-names> </name><name name-style="western"><surname>Hilbert</surname><given-names>K</given-names> </name></person-group><article-title>Personalization strategies in 
digital mental health interventions: a systematic review and conceptual framework for depressive symptoms</article-title><source>Front Digit Health</source><year>2023</year><volume>5</volume><fpage>1170002</fpage><pub-id pub-id-type="doi">10.3389/fdgth.2023.1170002</pub-id><pub-id pub-id-type="medline">37283721</pub-id></nlm-citation></ref><ref id="ref19"><label>19</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Swift</surname><given-names>JK</given-names> </name><name name-style="western"><surname>Callahan</surname><given-names>JL</given-names> </name><name name-style="western"><surname>Cooper</surname><given-names>M</given-names> </name><name name-style="western"><surname>Parkin</surname><given-names>SR</given-names> </name></person-group><article-title>The impact of accommodating client preference in psychotherapy: a meta-analysis</article-title><source>J Clin Psychol</source><year>2018</year><month>11</month><volume>74</volume><issue>11</issue><fpage>1924</fpage><lpage>1937</lpage><pub-id pub-id-type="doi">10.1002/jclp.22680</pub-id><pub-id pub-id-type="medline">30091140</pub-id></nlm-citation></ref><ref id="ref20"><label>20</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kuhail</surname><given-names>MA</given-names> </name><name name-style="western"><surname>Alturki</surname><given-names>N</given-names> </name><name name-style="western"><surname>Thomas</surname><given-names>J</given-names> </name><name name-style="western"><surname>Alkhalifa</surname><given-names>AK</given-names> </name><name name-style="western"><surname>Alshardan</surname><given-names>A</given-names> </name></person-group><article-title>Human-human vs human-AI therapy: an empirical study</article-title><source>Int J Hum Comput 
Interact</source><year>2025</year><month>06</month><day>3</day><volume>41</volume><issue>11</issue><fpage>6841</fpage><lpage>6852</lpage><pub-id pub-id-type="doi">10.1080/10447318.2024.2385001</pub-id></nlm-citation></ref><ref id="ref21"><label>21</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Abd-Alrazaq</surname><given-names>AA</given-names> </name><name name-style="western"><surname>Alajlani</surname><given-names>M</given-names> </name><name name-style="western"><surname>Alalwan</surname><given-names>AA</given-names> </name><name name-style="western"><surname>Bewick</surname><given-names>BM</given-names> </name><name name-style="western"><surname>Gardner</surname><given-names>P</given-names> </name><name name-style="western"><surname>Househ</surname><given-names>M</given-names> </name></person-group><article-title>An overview of the features of chatbots in mental health: a scoping review</article-title><source>Int J Med Inform</source><year>2019</year><month>12</month><volume>132</volume><fpage>103978</fpage><pub-id pub-id-type="doi">10.1016/j.ijmedinf.2019.103978</pub-id><pub-id pub-id-type="medline">31622850</pub-id></nlm-citation></ref><ref id="ref22"><label>22</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>De Freitas</surname><given-names>J</given-names> </name><name name-style="western"><surname>Cohen</surname><given-names>IG</given-names> </name></person-group><article-title>The health risks of generative AI-based wellness apps</article-title><source>Nat Med</source><year>2024</year><month>05</month><volume>30</volume><issue>5</issue><fpage>1269</fpage><lpage>1275</lpage><pub-id pub-id-type="doi">10.1038/s41591-024-02943-6</pub-id><pub-id pub-id-type="medline">38684859</pub-id></nlm-citation></ref><ref id="ref23"><label>23</label><nlm-citation citation-type="journal"><person-group 
person-group-type="author"><name name-style="western"><surname>Frances</surname><given-names>A</given-names> </name></person-group><article-title>Warning: AI chatbots will soon dominate psychotherapy</article-title><source>Br J Psychiatry</source><year>2025</year><month>08</month><day>20</day><fpage>1</fpage><lpage>5</lpage><pub-id pub-id-type="doi">10.1192/bjp.2025.10380</pub-id><pub-id pub-id-type="medline">40831348</pub-id></nlm-citation></ref><ref id="ref24"><label>24</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Miner</surname><given-names>AS</given-names> </name><name name-style="western"><surname>Shah</surname><given-names>N</given-names> </name><name name-style="western"><surname>Bullock</surname><given-names>KD</given-names> </name><name name-style="western"><surname>Arnow</surname><given-names>BA</given-names> </name><name name-style="western"><surname>Bailenson</surname><given-names>J</given-names> </name><name name-style="western"><surname>Hancock</surname><given-names>J</given-names> </name></person-group><article-title>Key considerations for incorporating conversational AI in psychotherapy</article-title><source>Front Psychiatry</source><year>2019</year><volume>10</volume><fpage>746</fpage><pub-id pub-id-type="doi">10.3389/fpsyt.2019.00746</pub-id><pub-id pub-id-type="medline">31681047</pub-id></nlm-citation></ref><ref id="ref25"><label>25</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Salah</surname><given-names>M</given-names> </name><name name-style="western"><surname>Abdelfattah</surname><given-names>F</given-names> </name><name name-style="western"><surname>Al Halbusi</surname><given-names>H</given-names> </name></person-group><article-title>The good, the bad, and the GPT: reviewing the impact of generative artificial intelligence on psychology</article-title><source>Curr Opin 
Psychol</source><year>2024</year><month>10</month><volume>59</volume><fpage>101872</fpage><pub-id pub-id-type="doi">10.1016/j.copsyc.2024.101872</pub-id><pub-id pub-id-type="medline">39197407</pub-id></nlm-citation></ref><ref id="ref26"><label>26</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Zhong</surname><given-names>W</given-names> </name><name name-style="western"><surname>Luo</surname><given-names>J</given-names> </name><name name-style="western"><surname>Zhang</surname><given-names>H</given-names> </name></person-group><article-title>The therapeutic effectiveness of artificial intelligence-based chatbots in alleviation of depressive and anxiety symptoms in short-course treatments: a systematic review and meta-analysis</article-title><source>J Affect Disord</source><year>2024</year><month>07</month><day>1</day><volume>356</volume><fpage>459</fpage><lpage>469</lpage><pub-id pub-id-type="doi">10.1016/j.jad.2024.04.057</pub-id><pub-id pub-id-type="medline">38631422</pub-id></nlm-citation></ref><ref id="ref27"><label>27</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>He</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Yang</surname><given-names>L</given-names> </name><name name-style="western"><surname>Qian</surname><given-names>C</given-names> </name><etal/></person-group><article-title>Conversational agent interventions for mental health problems: systematic review and meta-analysis of randomized controlled trials</article-title><source>J Med Internet Res</source><year>2023</year><month>04</month><day>28</day><volume>25</volume><issue>1</issue><fpage>e43862</fpage><pub-id pub-id-type="doi">10.2196/43862</pub-id><pub-id pub-id-type="medline">37115595</pub-id></nlm-citation></ref><ref id="ref28"><label>28</label><nlm-citation citation-type="journal"><person-group 
person-group-type="author"><name name-style="western"><surname>Li</surname><given-names>H</given-names> </name><name name-style="western"><surname>Zhang</surname><given-names>R</given-names> </name><name name-style="western"><surname>Lee</surname><given-names>YC</given-names> </name><name name-style="western"><surname>Kraut</surname><given-names>RE</given-names> </name><name name-style="western"><surname>Mohr</surname><given-names>DC</given-names> </name></person-group><article-title>Systematic review and meta-analysis of AI-based conversational agents for promoting mental health and well-being</article-title><source>NPJ Digit Med</source><year>2023</year><month>12</month><day>19</day><volume>6</volume><issue>1</issue><fpage>236</fpage><pub-id pub-id-type="doi">10.1038/s41746-023-00979-5</pub-id><pub-id pub-id-type="medline">38114588</pub-id></nlm-citation></ref><ref id="ref29"><label>29</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Feng</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Hang</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Wu</surname><given-names>W</given-names> </name><etal/></person-group><article-title>Effectiveness of AI-driven conversational agents in improving mental health among young people: systematic review and meta-analysis</article-title><source>J Med Internet Res</source><year>2025</year><month>05</month><day>14</day><volume>27</volume><issue>1</issue><fpage>e69639</fpage><pub-id pub-id-type="doi">10.2196/69639</pub-id><pub-id pub-id-type="medline">40367506</pub-id></nlm-citation></ref><ref id="ref30"><label>30</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Cooper</surname><given-names>ZW</given-names> </name><name name-style="western"><surname>Mowbray</surname><given-names>O</given-names> </name><name 
name-style="western"><surname>Ali</surname><given-names>MK</given-names> </name><name name-style="western"><surname>Johnson</surname><given-names>LCM</given-names> </name></person-group><article-title>Addressing depression and comorbid health conditions through solution-focused brief therapy in an integrated care setting: a randomized clinical trial</article-title><source>BMC Prim Care</source><year>2024</year><month>08</month><day>23</day><volume>25</volume><issue>1</issue><fpage>313</fpage><pub-id pub-id-type="doi">10.1186/s12875-024-02561-8</pub-id><pub-id pub-id-type="medline">39179982</pub-id></nlm-citation></ref><ref id="ref31"><label>31</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Torous</surname><given-names>J</given-names> </name><name name-style="western"><surname>Lipschitz</surname><given-names>J</given-names> </name><name name-style="western"><surname>Ng</surname><given-names>M</given-names> </name><name name-style="western"><surname>Firth</surname><given-names>J</given-names> </name></person-group><article-title>Dropout rates in clinical trials of smartphone apps for depressive symptoms: a systematic review and meta-analysis</article-title><source>J Affect Disord</source><year>2020</year><month>02</month><day>15</day><volume>263</volume><fpage>413</fpage><lpage>419</lpage><pub-id pub-id-type="doi">10.1016/j.jad.2019.11.167</pub-id><pub-id pub-id-type="medline">31969272</pub-id></nlm-citation></ref><ref id="ref32"><label>32</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Spitzer</surname><given-names>RL</given-names> </name><name name-style="western"><surname>Kroenke</surname><given-names>K</given-names> </name><name name-style="western"><surname>Williams</surname><given-names>JBW</given-names> </name><name name-style="western"><surname>L&#x00F6;we</surname><given-names>B</given-names> 
</name></person-group><article-title>A brief measure for assessing generalized anxiety disorder: the GAD-7</article-title><source>Arch Intern Med</source><year>2006</year><month>05</month><day>22</day><volume>166</volume><issue>10</issue><fpage>1092</fpage><lpage>1097</lpage><pub-id pub-id-type="doi">10.1001/archinte.166.10.1092</pub-id><pub-id pub-id-type="medline">16717171</pub-id></nlm-citation></ref><ref id="ref33"><label>33</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kroenke</surname><given-names>K</given-names> </name><name name-style="western"><surname>Spitzer</surname><given-names>RL</given-names> </name><name name-style="western"><surname>Williams</surname><given-names>JBW</given-names> </name></person-group><article-title>The PHQ-9: validity of a brief depression severity measure</article-title><source>J Gen Intern Med</source><year>2001</year><month>09</month><volume>16</volume><issue>9</issue><fpage>606</fpage><lpage>613</lpage><pub-id pub-id-type="doi">10.1046/j.1525-1497.2001.016009606.x</pub-id><pub-id pub-id-type="medline">11556941</pub-id></nlm-citation></ref><ref id="ref34"><label>34</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Bentley</surname><given-names>KH</given-names> </name><name name-style="western"><surname>Gallagher</surname><given-names>MW</given-names> </name><name name-style="western"><surname>Carl</surname><given-names>JR</given-names> </name><name name-style="western"><surname>Barlow</surname><given-names>DH</given-names> </name></person-group><article-title>Development and validation of the Overall Depression Severity and Impairment Scale</article-title><source>Psychol Assess</source><year>2014</year><month>09</month><volume>26</volume><issue>3</issue><fpage>815</fpage><lpage>830</lpage><pub-id pub-id-type="doi">10.1037/a0036216</pub-id><pub-id 
pub-id-type="medline">24708078</pub-id></nlm-citation></ref><ref id="ref35"><label>35</label><nlm-citation citation-type="report"><article-title>Wellbeing measures in primary health care/the DEPCARE project</article-title><year>1998</year><access-date>2026-03-10</access-date><publisher-name>World Health Organization, Regional Office for Europe</publisher-name><comment><ext-link ext-link-type="uri" xlink:href="https://iris.who.int/server/api/core/bitstreams/8af98105-30ec-4da4-9fe9-097f7459e6da/content">https://iris.who.int/server/api/core/bitstreams/8af98105-30ec-4da4-9fe9-097f7459e6da/content</ext-link></comment></nlm-citation></ref><ref id="ref36"><label>36</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Topp</surname><given-names>CW</given-names> </name><name name-style="western"><surname>&#x00D8;stergaard</surname><given-names>SD</given-names> </name><name name-style="western"><surname>S&#x00F8;ndergaard</surname><given-names>S</given-names> </name><name name-style="western"><surname>Bech</surname><given-names>P</given-names> </name></person-group><article-title>The WHO-5 Well-Being Index: a systematic review of the literature</article-title><source>Psychother Psychosom</source><year>2015</year><volume>84</volume><issue>3</issue><fpage>167</fpage><lpage>176</lpage><pub-id pub-id-type="doi">10.1159/000376585</pub-id><pub-id pub-id-type="medline">25831962</pub-id></nlm-citation></ref><ref id="ref37"><label>37</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Newman</surname><given-names>MW</given-names> </name></person-group><article-title>Value added? 
A pragmatic analysis of the routine use of PHQ-9 and GAD-7 scales in primary care</article-title><source>Gen Hosp Psychiatry</source><year>2022</year><volume>79</volume><fpage>15</fpage><lpage>18</lpage><pub-id pub-id-type="doi">10.1016/j.genhosppsych.2022.09.005</pub-id><pub-id pub-id-type="medline">36209615</pub-id></nlm-citation></ref><ref id="ref38"><label>38</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Leichsenring</surname><given-names>F</given-names> </name><name name-style="western"><surname>Steinert</surname><given-names>C</given-names> </name><name name-style="western"><surname>Rabung</surname><given-names>S</given-names> </name><name name-style="western"><surname>Ioannidis</surname><given-names>JPA</given-names> </name></person-group><article-title>The efficacy of psychotherapies and pharmacotherapies for mental disorders in adults: an umbrella review and meta-analytic evaluation of recent meta-analyses</article-title><source>World Psychiatry</source><year>2022</year><month>02</month><volume>21</volume><issue>1</issue><fpage>133</fpage><lpage>145</lpage><pub-id pub-id-type="doi">10.1002/wps.20941</pub-id><pub-id pub-id-type="medline">35015359</pub-id></nlm-citation></ref><ref id="ref39"><label>39</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Bauer-Staeb</surname><given-names>C</given-names> </name><name name-style="western"><surname>Kounali</surname><given-names>DZ</given-names> </name><name name-style="western"><surname>Welton</surname><given-names>NJ</given-names> </name><etal/></person-group><article-title>Effective dose 50 method as the minimal clinically important difference: evidence from depression trials</article-title><source>J Clin Epidemiol</source><year>2021</year><month>09</month><volume>137</volume><fpage>200</fpage><lpage>208</lpage><pub-id 
pub-id-type="doi">10.1016/j.jclinepi.2021.04.002</pub-id><pub-id pub-id-type="medline">33892086</pub-id></nlm-citation></ref><ref id="ref40"><label>40</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>&#x017B;ak</surname><given-names>AM</given-names> </name><name name-style="western"><surname>P&#x0119;kala</surname><given-names>K</given-names> </name></person-group><article-title>Effectiveness of solution-focused brief therapy: an umbrella review of systematic reviews and meta-analyses</article-title><source>Psychother Res</source><year>2025</year><month>09</month><volume>35</volume><issue>7</issue><fpage>1043</fpage><lpage>1055</lpage><pub-id pub-id-type="doi">10.1080/10503307.2024.2406540</pub-id><pub-id pub-id-type="medline">39324877</pub-id></nlm-citation></ref><ref id="ref41"><label>41</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>Lin</surname><given-names>S</given-names> </name><name name-style="western"><surname>Wang</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Dong</surname><given-names>J</given-names> </name><name name-style="western"><surname>Ni</surname><given-names>S</given-names> </name></person-group><article-title>Detection and positive reconstruction of cognitive distortion sentences: Mandarin dataset and evaluation</article-title><access-date>2026-03-10</access-date><conf-name>Findings of the Association for Computational Linguistics: ACL 2024</conf-name><conf-date>Aug 11-16, 2024</conf-date><comment><ext-link ext-link-type="uri" xlink:href="https://aclanthology.org/2024.findings-acl.399/">https://aclanthology.org/2024.findings-acl.399/</ext-link></comment><pub-id pub-id-type="doi">10.18653/v1/2024.findings-acl.399</pub-id></nlm-citation></ref><ref id="ref42"><label>42</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name 
name-style="western"><surname>Ben-Zion</surname><given-names>Z</given-names> </name><name name-style="western"><surname>Witte</surname><given-names>K</given-names> </name><name name-style="western"><surname>Jagadish</surname><given-names>AK</given-names> </name><etal/></person-group><article-title>Assessing and alleviating state anxiety in large language models</article-title><source>NPJ Digit Med</source><year>2025</year><month>03</month><day>3</day><volume>8</volume><issue>1</issue><fpage>132</fpage><pub-id pub-id-type="doi">10.1038/s41746-025-01512-6</pub-id><pub-id pub-id-type="medline">40033130</pub-id></nlm-citation></ref><ref id="ref43"><label>43</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>de Vries</surname><given-names>LP</given-names> </name><name name-style="western"><surname>Pelt</surname><given-names>DHM</given-names> </name><name name-style="western"><surname>Bartels</surname><given-names>M</given-names> </name></person-group><article-title>The stability and change of wellbeing across the lifespan: a longitudinal twin-sibling study</article-title><source>Psychol Med</source><year>2024</year><month>07</month><volume>54</volume><issue>10</issue><fpage>2572</fpage><lpage>2584</lpage><pub-id pub-id-type="doi">10.1017/S0033291724000692</pub-id><pub-id pub-id-type="medline">38533784</pub-id></nlm-citation></ref><ref id="ref44"><label>44</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Balan</surname><given-names>R</given-names> </name><name name-style="western"><surname>Dobrean</surname><given-names>A</given-names> </name><name name-style="western"><surname>Poetar</surname><given-names>CR</given-names> </name></person-group><article-title>Use of automated conversational agents in improving young population mental health: a scoping review</article-title><source>NPJ Digit 
Med</source><year>2024</year><month>03</month><day>19</day><volume>7</volume><issue>1</issue><fpage>75</fpage><pub-id pub-id-type="doi">10.1038/s41746-024-01072-1</pub-id><pub-id pub-id-type="medline">38503909</pub-id></nlm-citation></ref><ref id="ref45"><label>45</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Whelen</surname><given-names>ML</given-names> </name><name name-style="western"><surname>Strunk</surname><given-names>DR</given-names> </name></person-group><article-title>Does cognitive behavioral therapy for depression target positive affect? Examining affect and cognitive change session-to-session</article-title><source>J Consult Clin Psychol</source><year>2021</year><month>09</month><volume>89</volume><issue>9</issue><fpage>742</fpage><lpage>750</lpage><pub-id pub-id-type="doi">10.1037/ccp0000679</pub-id><pub-id pub-id-type="medline">34591547</pub-id></nlm-citation></ref><ref id="ref46"><label>46</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Grant</surname><given-names>AM</given-names> </name></person-group><article-title>Making positive change: a randomized study comparing solution-focused vs. 
problem-focused coaching questions</article-title><source>J Syst Ther</source><year>2012</year><month>06</month><volume>31</volume><issue>2</issue><fpage>21</fpage><lpage>35</lpage><pub-id pub-id-type="doi">10.1521/jsyt.2012.31.2.21</pub-id></nlm-citation></ref><ref id="ref47"><label>47</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Pandey</surname><given-names>S</given-names> </name><name name-style="western"><surname>Sharma</surname><given-names>S</given-names> </name></person-group><article-title>A comparative study of retrieval-based and generative-based chatbots using deep learning and machine learning</article-title><source>Healthc Anal</source><year>2023</year><month>11</month><volume>3</volume><fpage>100198</fpage><pub-id pub-id-type="doi">10.1016/j.health.2023.100198</pub-id></nlm-citation></ref><ref id="ref48"><label>48</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lau</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Ang</surname><given-names>WHD</given-names> </name><name name-style="western"><surname>Ang</surname><given-names>WW</given-names> </name><name name-style="western"><surname>Pang</surname><given-names>PCI</given-names> </name><name name-style="western"><surname>Wong</surname><given-names>SH</given-names> </name><name name-style="western"><surname>Chan</surname><given-names>KS</given-names> </name></person-group><article-title>Artificial intelligence&#x2013;based psychotherapeutic intervention on psychological outcomes: a meta&#x2010;analysis and meta&#x2010;regression</article-title><source>Depress Anxiety</source><year>2025</year><month>01</month><volume>2025</volume><issue>1</issue><fpage>8930012</fpage><pub-id pub-id-type="doi">10.1155/da/8930012</pub-id></nlm-citation></ref><ref id="ref49"><label>49</label><nlm-citation citation-type="journal"><person-group 
person-group-type="author"><name name-style="western"><surname>Jabir</surname><given-names>AI</given-names> </name><name name-style="western"><surname>Lin</surname><given-names>X</given-names> </name><name name-style="western"><surname>Martinengo</surname><given-names>L</given-names> </name><name name-style="western"><surname>Sharp</surname><given-names>G</given-names> </name><name name-style="western"><surname>Theng</surname><given-names>YL</given-names> </name><name name-style="western"><surname>Tudor Car</surname><given-names>L</given-names> </name></person-group><article-title>Attrition in conversational agent-delivered mental health interventions: systematic review and meta-analysis</article-title><source>J Med Internet Res</source><year>2024</year><month>02</month><day>27</day><volume>26</volume><fpage>e48168</fpage><pub-id pub-id-type="doi">10.2196/48168</pub-id><pub-id pub-id-type="medline">38412023</pub-id></nlm-citation></ref><ref id="ref50"><label>50</label><nlm-citation citation-type="web"><article-title>The efficacy of AI assisted psychological intervention on well-being, anxiety and depressive symptoms: experimental study</article-title><source>OSF</source><access-date>2026-03-13</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://doi.org/10.17605/OSF.IO/BPS58">https://doi.org/10.17605/OSF.IO/BPS58</ext-link></comment></nlm-citation></ref></ref-list><app-group><supplementary-material id="app1"><label>Multimedia Appendix 1</label><p>Informed consent.</p><media xlink:href="mental_v13i1e82642_app1.docx" xlink:title="DOCX File, 291 KB"/></supplementary-material><supplementary-material id="app2"><label>Multimedia Appendix 2</label><p>ChatMind app screenshot.</p><media xlink:href="mental_v13i1e82642_app2.png" xlink:title="PNG File, 943 KB"/></supplementary-material><supplementary-material id="app3"><label>Multimedia Appendix 3</label><p>Instructions.</p><media xlink:href="mental_v13i1e82642_app3.docx" xlink:title="DOCX File, 7 
KB"/></supplementary-material><supplementary-material id="app4"><label>Multimedia Appendix 4</label><p>Supplementary per-protocol analysis.</p><media xlink:href="mental_v13i1e82642_app4.zip" xlink:title="ZIP File, 1378 KB"/></supplementary-material><supplementary-material id="app5"><label>Multimedia Appendix 5</label><p>Descriptive characteristics.</p><media xlink:href="mental_v13i1e82642_app5.docx" xlink:title="DOCX File, 19 KB"/></supplementary-material><supplementary-material id="app6"><label>Checklist 1</label><p>CONSORT-EHEALTH (V 1.6.1) checklist.</p><media xlink:href="mental_v13i1e82642_app6.pdf" xlink:title="PDF File, 1142 KB"/></supplementary-material></app-group></back></article>