<?xml version="1.0" encoding="UTF-8"?><!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "journalpublishing.dtd"><article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" dtd-version="2.0" xml:lang="en" article-type="research-article"><front><journal-meta><journal-id journal-id-type="nlm-ta">JMIR Ment Health</journal-id><journal-id journal-id-type="publisher-id">mental</journal-id><journal-id journal-id-type="index">16</journal-id><journal-title>JMIR Mental Health</journal-title><abbrev-journal-title>JMIR Ment Health</abbrev-journal-title><issn pub-type="epub">2368-7959</issn><publisher><publisher-name>JMIR Publications</publisher-name><publisher-loc>Toronto, Canada</publisher-loc></publisher></journal-meta><article-meta><article-id pub-id-type="publisher-id">v12i1e57986</article-id><article-id pub-id-type="doi">10.2196/57986</article-id><article-categories><subj-group subj-group-type="heading"><subject>Original Paper</subject></subj-group></article-categories><title-group><article-title>Exploring Biases of Large Language Models in the Field of Mental Health: Comparative Questionnaire Study of the Effect of Gender and Sexual Orientation in Anorexia Nervosa and Bulimia Nervosa Case Vignettes</article-title></title-group><contrib-group><contrib contrib-type="author" corresp="yes"><name name-style="western"><surname>Schnepper</surname><given-names>Rebekka</given-names></name><degrees>Dr rer nat</degrees><xref ref-type="aff" rid="aff1">1</xref><xref ref-type="aff" rid="aff2">2</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Roemmel</surname><given-names>Noa</given-names></name><degrees>MSc</degrees><xref ref-type="aff" rid="aff1">1</xref><xref ref-type="aff" rid="aff2">2</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Schaefert</surname><given-names>Rainer</given-names></name><degrees>Prof Dr Med</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Lambrecht-Walzinger</surname><given-names>Lena</given-names></name><degrees>Dr med</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Meinlschmidt</surname><given-names>Gunther</given-names></name><degrees>Prof Dr</degrees><xref ref-type="aff" rid="aff1">1</xref><xref ref-type="aff" rid="aff2">2</xref><xref ref-type="aff" rid="aff3">3</xref><xref ref-type="aff" rid="aff4">4</xref></contrib></contrib-group><aff id="aff1"><institution>Department of Psychosomatic Medicine, University Hospital and University of Basel</institution><addr-line>Hebelstr. 2</addr-line><addr-line>Basel</addr-line><country>Switzerland</country></aff><aff id="aff2"><institution>Department of Digital and Blended Psychosomatics and Psychotherapy, Psychosomatic Medicine, University Hospital and University of Basel</institution><addr-line>Basel</addr-line><country>Switzerland</country></aff><aff id="aff3"><institution>Department of Clinical Psychology and Psychotherapy, University of Trier</institution><addr-line>Trier</addr-line><addr-line>Rheinland-Pfalz</addr-line><country>Germany</country></aff><aff id="aff4"><institution>Department of Psychology, Division of Clinical Psychology and Epidemiology, University of Basel</institution><addr-line>Basel</addr-line><country>Switzerland</country></aff><contrib-group><contrib contrib-type="editor"><name name-style="western"><surname>Asman</surname><given-names>Oren</given-names></name></contrib></contrib-group><contrib-group><contrib contrib-type="reviewer"><name name-style="western"><surname>Hassan</surname><given-names>Ahmed</given-names></name></contrib><contrib contrib-type="reviewer"><name name-style="western"><surname>Zhang</surname><given-names>Tianlin</given-names></name></contrib></contrib-group><author-notes><corresp>Correspondence to Rebekka Schnepper, Dr rer nat, Department of Psychosomatic Medicine, University Hospital and University of Basel, Hebelstr. 2, Basel, 4031, Switzerland, 41 613284633; <email>rebekka.schnepper@usb.ch</email></corresp></author-notes><pub-date pub-type="collection"><year>2025</year></pub-date><pub-date pub-type="epub"><day>20</day><month>3</month><year>2025</year></pub-date><volume>12</volume><elocation-id>e57986</elocation-id><history><date date-type="received"><day>01</day><month>03</month><year>2024</year></date><date date-type="rev-recd"><day>30</day><month>10</month><year>2024</year></date><date date-type="accepted"><day>24</day><month>11</month><year>2024</year></date></history><copyright-statement>&#x00A9; Rebekka Schnepper, Noa Roemmel, Rainer Schaefert, Lena Lambrecht-Walzinger, Gunther Meinlschmidt. Originally published in JMIR Mental Health (<ext-link ext-link-type="uri" xlink:href="https://mental.jmir.org">https://mental.jmir.org</ext-link>), 20.3.2025. </copyright-statement><copyright-year>2025</copyright-year><license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (<ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">https://creativecommons.org/licenses/by/4.0/</ext-link>), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Mental Health, is properly cited. The complete bibliographic information, a link to the original publication on <ext-link ext-link-type="uri" xlink:href="https://mental.jmir.org/">https://mental.jmir.org/</ext-link>, as well as this copyright and license information must be included.</p></license><self-uri xlink:type="simple" xlink:href="https://mental.jmir.org/2025/1/e57986"/><abstract><sec><title>Background</title><p>Large language models (LLMs) are increasingly used in mental health, showing promise in assessing disorders. However, concerns exist regarding their accuracy, reliability, and fairness. Societal biases and underrepresentation of certain populations may impact LLMs. Because LLMs are already used for clinical practice, including decision support, it is important to investigate potential biases to ensure a responsible use of LLMs. Anorexia nervosa (AN) and bulimia nervosa (BN) show a lifetime prevalence of 1%&#x2010;2%, affecting more women than men. Among men, homosexual men face a higher risk of eating disorders (EDs) than heterosexual men. However, men are underrepresented in ED research, and studies on gender, sexual orientation, and their impact on AN and BN prevalence, symptoms, and treatment outcomes remain limited.</p></sec><sec><title>Objectives</title><p>We aimed to estimate the presence and size of bias related to gender and sexual orientation produced by a common LLM as well as a smaller LLM specifically trained for mental health analyses, exemplified in the context of ED symptomatology and health-related quality of life (HRQoL) of patients with AN or BN.</p></sec><sec sec-type="methods"><title>Methods</title><p>We extracted 30 case vignettes (22 AN and 8 BN) from scientific papers. We adapted each vignette to create 4 versions, describing a female versus male patient living with their female versus male partner (2 &#x00D7; 2 design), yielding 120 vignettes. We then fed each vignette into ChatGPT-4 and to &#x201C;MentaLLaMA&#x201D; based on the Large Language Model Meta AI (LLaMA) architecture thrice with the instruction to evaluate them by providing responses to 2 psychometric instruments, the RAND-36 questionnaire assessing HRQoL and the eating disorder examination questionnaire. With the resulting LLM-generated scores, we calculated multilevel models with a random intercept for gender and sexual orientation (accounting for within-vignette variance), nested in vignettes (accounting for between-vignette variance).</p></sec><sec sec-type="results"><title>Results</title><p>In ChatGPT-4, the multilevel model with 360 observations indicated a significant association with gender for the RAND-36 mental composite summary (conditional means: 12.8 for male and 15.1 for female cases; 95% CI of the effect &#x2013;6.15 to &#x2212;0.35; <italic>P</italic>=.04) but neither with sexual orientation (<italic>P</italic>=.71) nor with an interaction effect (<italic>P</italic>=.37). We found no indications for main effects of gender (conditional means: 5.65 for male and 5.61 for female cases; 95% CI &#x2013;0.10 to 0.14; <italic>P</italic>=.88), sexual orientation (conditional means: 5.63 for heterosexual and 5.62 for homosexual cases; 95% CI &#x2013;0.14 to 0.09; <italic>P</italic>=.67), or for an interaction effect (<italic>P</italic>=.61, 95% CI &#x2013;0.11 to 0.19) for the eating disorder examination questionnaire overall score (conditional means 5.59&#x2010;5.65 95% CIs 5.45 to 5.7). MentaLLaMA did not yield reliable results.</p></sec><sec sec-type="conclusions"><title>Conclusions</title><p>LLM-generated mental HRQoL estimates for AN and BN case vignettes may be biased by gender, with male cases scoring lower despite no real-world evidence supporting this pattern. This highlights the risk of bias in generative artificial intelligence in the field of mental health. Understanding and mitigating biases related to gender and other factors, such as ethnicity, and socioeconomic status are crucial for responsible use in diagnostics and treatment recommendations.</p></sec></abstract><kwd-group><kwd>anorexia nervosa</kwd><kwd>artificial intelligence</kwd><kwd>bulimia nervosa</kwd><kwd>ChatGPT</kwd><kwd>eating disorders</kwd><kwd>LLM</kwd><kwd>responsible AI</kwd><kwd>transformer</kwd><kwd>bias</kwd><kwd>large language model</kwd><kwd>gender</kwd><kwd>vignette</kwd><kwd>quality of life</kwd><kwd>symptomatology</kwd><kwd>questionnaire</kwd><kwd>generative AI</kwd><kwd>mental health</kwd><kwd>AI</kwd></kwd-group></article-meta></front><body><sec id="s1" sec-type="intro"><title>Introduction</title><sec id="s1-1"><title>Large Language Models in the Context of Mental Health</title><p>In recent years, there has been significant progress in the field of artificial intelligence (AI) [<xref ref-type="bibr" rid="ref1">1</xref>]. In particular, the development of large language models (LLMs), such as OpenAI&#x2019;s GPT models [<xref ref-type="bibr" rid="ref2">2</xref>], Google&#x2019;s LaMDA [<xref ref-type="bibr" rid="ref3">3</xref>], or Meta&#x2019;s Large Language Model Meta AI (LLaMA) [<xref ref-type="bibr" rid="ref4">4</xref>], has made the deployment of such algorithms accessible to researchers, clinicians, and the public alike [<xref ref-type="bibr" rid="ref5">5</xref>]. With advancements in computational power and access to larger datasets, these models can now go beyond simple word counting [<xref ref-type="bibr" rid="ref6">6</xref>] and actually account for the relationships between words [<xref ref-type="bibr" rid="ref5">5</xref>,<xref ref-type="bibr" rid="ref7">7</xref>]. The technique of modeling words in a large context has been referred to as transformer-based large language modeling [<xref ref-type="bibr" rid="ref8">8</xref>]. This may not only facilitate the automatic analysis of large amounts of text data [<xref ref-type="bibr" rid="ref9">9</xref>,<xref ref-type="bibr" rid="ref10">10</xref>] but, by modeling words in a large context, also allow the generation of meaningful text and the interactive use of this technology [<xref ref-type="bibr" rid="ref5">5</xref>,<xref ref-type="bibr" rid="ref10">10</xref>]. Thus, the application of LLMs may improve efficiency and effectiveness of data processing in various fields&#x2014;including health care [<xref ref-type="bibr" rid="ref5">5</xref>].</p><p>Since psychology and psychotherapy research are primarily shaped by language, the potential of LLMs in this field is significant [<xref ref-type="bibr" rid="ref1">1</xref>,<xref ref-type="bibr" rid="ref11">11</xref>]. This becomes even more meaningful when considering the contribution of mental disorders to the global disease burden [<xref ref-type="bibr" rid="ref12">12</xref>] and acknowledging the persistent treatment gap in mental health care [<xref ref-type="bibr" rid="ref13">13</xref>]. Especially in the field of psychological assessment, research on the use of LLMs is advanced [<xref ref-type="bibr" rid="ref14">14</xref>]. For example, the use of transformer language models on language patterns has resulted in remarkably high predictive accuracy on standardized well-being rating scales [<xref ref-type="bibr" rid="ref15">15</xref>]. This procedure of using LLMs to automatically generate psychological construct scores based on free text has been formally referred to as &#x201C;language-based assessment&#x201D; [<xref ref-type="bibr" rid="ref14">14</xref>,<xref ref-type="bibr" rid="ref16">16</xref>]. Findings indicate comparable levels of validity and reliability of language-based assessments compared with standardized rating scales [<xref ref-type="bibr" rid="ref15">15</xref>,<xref ref-type="bibr" rid="ref17">17</xref>]. Moreover, language-based assessments have the capacity to incorporate additional information beyond free text entries [<xref ref-type="bibr" rid="ref14">14</xref>], such as user age [<xref ref-type="bibr" rid="ref18">18</xref>].</p><p>LLMs have also been applied in the evaluation of clinical case vignettes, and ChatGPT-4 has been shown to assess suicidality as reliable as mental health professionals [<xref ref-type="bibr" rid="ref19">19</xref>]. Furthermore, Chat-GPT 3.5&#x2019;s performance in the diagnostic assessment and advice on disease management in a study using 100 clinical vignettes has been rated as excellent by mental health professionals [<xref ref-type="bibr" rid="ref20">20</xref>].</p></sec><sec id="s1-2"><title>Biases and Responsible AI</title><p>Despite the promising findings of using LLMs in the context of (mental) health, the issue of potential biases in information generated by LLMs has been raised. Because LLMs are being increasingly introduced in clinical practice, it is important to investigate potential biases to ensure a responsible use of AI [<xref ref-type="bibr" rid="ref21">21</xref>] and LLMs [<xref ref-type="bibr" rid="ref22">22</xref>]. Since LLMs rely on training data, which is directly or indirectly generated by humans, these models are likely to contain the same biases as the society in which they are created in [<xref ref-type="bibr" rid="ref21">21</xref>-<xref ref-type="bibr" rid="ref24">24</xref>]. This is especially critical in (mental) health care [<xref ref-type="bibr" rid="ref25">25</xref>], where biases in LLMs may lead to discrimination of different social groups [<xref ref-type="bibr" rid="ref22">22</xref>]. For example, ChatGPT 3.5 performed poorly in diagnosing an infectious disease known to be widely underdiagnosed [<xref ref-type="bibr" rid="ref26">26</xref>]. Furthermore, ChatGPT 3.5 made different treatment recommendations based on insurance status, which might introduce health disparities [<xref ref-type="bibr" rid="ref27">27</xref>]. When generating clinical cases, ChatGPT-4 failed to create cases that depicted demographic diversity and relied on stereotypes when choosing gender or ethnicity [<xref ref-type="bibr" rid="ref28">28</xref>]. Thus, the need for &#x201C;fair AI&#x201D; has been pointed out with the goal to develop prediction models that provide equivalent outputs for identical individuals who differ only in one sensitive attribute [<xref ref-type="bibr" rid="ref29">29</xref>]. To avoid or at least reduce potential bias and move toward fair AI, this bias first needs to be conceptualized, measured, and understood [<xref ref-type="bibr" rid="ref22">22</xref>]. The aim of this paper was to explore a potential bias in the evaluation of eating disorders (EDs), which have been subjected to stigma [<xref ref-type="bibr" rid="ref30">30</xref>] and gender-biased assessment [<xref ref-type="bibr" rid="ref31">31</xref>].</p></sec><sec id="s1-3"><title>EDs (Anorexia Nervosa or Bulimia Nervosa)</title><p>Anorexia nervosa (AN) and bulimia nervosa (BN) are severe EDs with many medical complications, high mortality rates [<xref ref-type="bibr" rid="ref32">32</xref>], slow treatment progress, and frequent relapses [<xref ref-type="bibr" rid="ref33">33</xref>]. The lifetime prevalence to develop AN or BN is estimated to be 1%&#x2010;2% each [<xref ref-type="bibr" rid="ref34">34</xref>]. Historically, AN and BN have been described only in women, and it was not until the 21st century that research started to systematically investigate EDs in men [<xref ref-type="bibr" rid="ref35">35</xref>]. Today, men are estimated to account for approximately 10%&#x2010;25% of AN or BN cases [<xref ref-type="bibr" rid="ref36">36</xref>,<xref ref-type="bibr" rid="ref37">37</xref>]. Research on gender difference in AN and BN is scarce and inconclusive, with no clear findings with regard to genetic and environmental factors that might explain differences in etiology or maintenance of these EDs [<xref ref-type="bibr" rid="ref38">38</xref>]. Likewise, findings on severity and treatment outcomes are ambiguous. While one study suggests that men diagnosed with AN might have faster and more frequent remission rates [<xref ref-type="bibr" rid="ref39">39</xref>], another study found no difference [<xref ref-type="bibr" rid="ref40">40</xref>]. Men might produce lower costs in outpatient treatment; however, this might be due to higher barriers to receive treatment [<xref ref-type="bibr" rid="ref41">41</xref>]. Men have been found to be more stigmatizing than women toward people with EDs [<xref ref-type="bibr" rid="ref42">42</xref>], and this internalized stigma might be one reason for the hesitancy to seek outpatient treatment.</p><p>In men, sexual orientation might increase the risk of developing an ED, with more men with an ED or ED-related behavior identifying as homosexual compared with the general population [<xref ref-type="bibr" rid="ref43">43</xref>,<xref ref-type="bibr" rid="ref44">44</xref>]. Furthermore, independent of being diagnosed with an ED, homosexual men report more psychological distress than heterosexual men, and in men with an ED, being homosexual was related to higher ED symptomatology [<xref ref-type="bibr" rid="ref45">45</xref>]. In women, a review found no significant difference in overall disordered eating due to sexual orientation, but distinct symptom patterns, with homosexual women reporting less restrictive eating behavior and more binge eating [<xref ref-type="bibr" rid="ref46">46</xref>].</p><p>To conclude, only in the last 2 decades men were included in ED research and there are still many open questions related to the effect of gender on prevalence, symptoms, and treatment outcomes of AN and BN. With regard to sexual orientation, there is evidence for an association between identifying as homosexual and a higher risk of EDs in men but not in women.</p></sec><sec id="s1-4"><title>Objectives</title><p>We aimed to estimate the presence and size of bias related to gender and sexual orientation produced by ChatGPT-4, a common LLM, as well as MentaLLaMA, an LLM fine-tuned for the mental health domain, exemplified by their application in the context of ED symptomatology and health-related quality of life (HRQoL) of patients with AN or BN. By providing clinical case vignettes to the LLMs and instructing them to take up the role of a clinical psychologist rating the vignettes, we sought to mimic the diagnostic process of an LLM-based ED assessment.</p></sec></sec><sec id="s2" sec-type="methods"><title>Methods</title><sec id="s2-1"><title>Vignette Selection and Modification</title><p>We searched PubMed and Google Scholar up until October 2023 for vignettes in scientific papers published since 2000 that describe patients with either AN or BN. A total of 30 case vignettes were extracted from 12 different papers (published between 2001 and 2022). Of these vignettes, 22 described patients with AN and 8 described patients with BN. Most vignettes originally describe a female patient (n=28). We then adapted gender and sexual orientation in each vignette to create 4 versions (2 &#x00D7; 2 design), describing a female versus male patient living with their female versus male partner (if either a marriage or age &#x2265;30 years was mentioned, the term husband or wife was chosen, otherwise boyfriend or girlfriend). This resulted in 120 adopted vignettes. Some information was removed due to content policy violations, that is, drug abuse, self-mutilation, suicidal ideation or suicide attempts, sexual abuse, and traumatizing experiences. Furthermore, details on the menstrual cycle were removed since they do not apply to male patients, as well as indications of height, since they were unrealistically short for male patients. Finally, some specific details not needed in this context were removed, for example, study enrollment procedures and study-specific measures, medication plan, and the name of the hospital.</p><p>See <xref ref-type="table" rid="table1">Table 1</xref> for further details about the vignettes.</p><table-wrap id="t1" position="float"><label>Table 1.</label><caption><p>Vignettes included in the study, search term, and information on parts that were removed, added, or changed.</p></caption><table id="table1" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Vignette</td><td align="left" valign="bottom">Search term</td><td align="left" valign="bottom">Removed</td><td align="left" valign="bottom">Changed</td><td align="left" valign="bottom">Added</td></tr></thead><tbody><tr><td align="char" char="." valign="top">1 [<xref ref-type="bibr" rid="ref47">47</xref>]</td><td align="left" valign="top">Google Scholar; October 13, 2023: (&#x201C;case report&#x201D; OR &#x201C;case series&#x201D;) AND (anorexia OR bulimia) AND &#x201C;psychotherapy,&#x201D; since 2000</td><td align="left" valign="top">GAF<sup><xref ref-type="table-fn" rid="table1fn1">a</xref></sup> score</td><td align="left" valign="top">&#x2014;<sup><xref ref-type="table-fn" rid="table1fn2">b</xref></sup></td><td align="left" valign="top">Patient with AN<sup><xref ref-type="table-fn" rid="table1fn3">c</xref></sup> (implied in title of paper), sex, sexual orientation, and living with boyfriend or girlfriend</td></tr><tr><td align="char" char="." valign="top">2 [<xref ref-type="bibr" rid="ref47">47</xref>]</td><td align="left" valign="top">Google Scholar; October 13, 2023: (&#x201C;case report&#x201D; OR &#x201C;case series&#x201D;) AND (anorexia OR bulimia) AND &#x201C;psychotherapy,&#x201D; since 2000</td><td align="left" valign="top">GAF score self-mutilation, suicide attempt</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Patient with AN (implied in title of paper), sex, sexual orientation, and living with boyfriend or girlfriend</td></tr><tr><td align="char" char="." valign="top">3 [<xref ref-type="bibr" rid="ref47">47</xref>]</td><td align="left" valign="top">Google Scholar; October 13, 2023: (&#x201C;case report&#x201D; OR &#x201C;case series&#x201D;) AND (anorexia OR bulimia) AND &#x201C;psychotherapy,&#x201D; since 2000</td><td align="left" valign="top">GAF score, amenorrhea</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Patient with AN (implied in title of paper), sex, sexual orientation, and living with boyfriend or girlfriend</td></tr><tr><td align="char" char="." valign="top">4 [<xref ref-type="bibr" rid="ref47">47</xref>]</td><td align="left" valign="top">Google Scholar; October 13, 2023: (&#x201C;case report&#x201D; OR &#x201C;case series&#x201D;) AND (anorexia OR bulimia) AND &#x201C;psychotherapy,&#x201D; since 2000</td><td align="left" valign="top">GAF score</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Patient with AN (implied in title of paper), sex, sexual orientation, and living with boyfriend or girlfriend</td></tr><tr><td align="char" char="." valign="top">5 [<xref ref-type="bibr" rid="ref47">47</xref>]</td><td align="left" valign="top">Google Scholar; October 13, 2023: (&#x201C;case report&#x201D; OR &#x201C;case series&#x201D;) AND (anorexia OR bulimia) AND &#x201C;psychotherapy,&#x201D; since 2000</td><td align="left" valign="top">GAF score</td><td align="left" valign="top">&#x201C;School&#x201D; changed to &#x201C;university&#x201D;</td><td align="left" valign="top">Patient with AN (implied in title of paper), sex, sexual orientation, and living with boyfriend or girlfriend</td></tr><tr><td align="char" char="." valign="top">6 [<xref ref-type="bibr" rid="ref47">47</xref>]</td><td align="left" valign="top">Google Scholar; October 13, 2023: (&#x201C;case report&#x201D; OR &#x201C;case series&#x201D;) AND (anorexia OR bulimia) AND &#x201C;psychotherapy,&#x201D; since 2000</td><td align="left" valign="top">GAF score</td><td align="left" valign="top">&#x201C;School&#x201D; changed to &#x201C;university&#x201D;</td><td align="left" valign="top">Patient with AN (implied in title of paper), sex, sexual orientation, and living with boyfriend or girlfriend</td></tr><tr><td align="char" char="." valign="top">7 [<xref ref-type="bibr" rid="ref47">47</xref>]</td><td align="left" valign="top">Google Scholar; October 13, 2023: (&#x201C;case report&#x201D; OR &#x201C;case series&#x201D;) AND (anorexia OR bulimia) AND &#x201C;psychotherapy,&#x201D; since 2000</td><td align="left" valign="top">GAF score</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Patient with AN (implied in title of paper), sex, sexual orientation, and living with boyfriend or girlfriend</td></tr><tr><td align="char" char="." valign="top">8 [<xref ref-type="bibr" rid="ref47">47</xref>]</td><td align="left" valign="top">Google Scholar; October 13, 2023: (&#x201C;case report&#x201D; OR &#x201C;case series&#x201D;) AND (anorexia OR bulimia) AND &#x201C;psychotherapy,&#x201D; since 2000</td><td align="left" valign="top">GAF score</td><td align="left" valign="top">&#x201C;School&#x201D; changed to &#x201C;university&#x201D;</td><td align="left" valign="top">Patient with AN (implied in title of paper), sex, sexual orientation, and living with boyfriend or girlfriend</td></tr><tr><td align="char" char="." valign="top">9 [<xref ref-type="bibr" rid="ref47">47</xref>]</td><td align="left" valign="top">Google Scholar; October 13, 2023: (&#x201C;case report&#x201D; OR &#x201C;case series&#x201D;) AND (anorexia OR bulimia) AND &#x201C;psychotherapy,&#x201D; since 2000</td><td align="left" valign="top">GAF score</td><td align="left" valign="top">&#x201C;Living with parents&#x201D; changed to &#x201C;living with boyfriend or girlfriend&#x201D;</td><td align="left" valign="top">Patient with AN (implied in title of paper), sex, and sexual orientation</td></tr><tr><td align="char" char="." valign="top">10 [<xref ref-type="bibr" rid="ref47">47</xref>]</td><td align="left" valign="top">Google Scholar; October 13, 2023: (&#x201C;case report&#x201D; OR &#x201C;case series&#x201D;) AND (anorexia OR bulimia) AND &#x201C;psychotherapy,&#x201D; since 2000</td><td align="left" valign="top">GAF score, amenorrhea</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Patient with AN (implied in title of paper), sex, sexual orientation, and living with boyfriend or girlfriend</td></tr><tr><td align="char" char="." valign="top">11 [<xref ref-type="bibr" rid="ref47">47</xref>]</td><td align="left" valign="top">Google Scholar; October 13, 2023: (&#x201C;case report&#x201D; OR &#x201C;case series&#x201D;) AND (anorexia OR bulimia) AND &#x201C;psychotherapy,&#x201D; since 2000</td><td align="left" valign="top">GAF score, amenorrhea</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Patient with AN (implied in title of paper), sex, sexual orientation, and living with boyfriend or girlfriend</td></tr><tr><td align="char" char="." valign="top">12 [<xref ref-type="bibr" rid="ref47">47</xref>]</td><td align="left" valign="top">Google Scholar; October 13, 2023: (&#x201C;case report&#x201D; OR &#x201C;case series&#x201D;) AND (anorexia OR bulimia) AND &#x201C;psychotherapy,&#x201D; since 2000</td><td align="left" valign="top">GAF score, amenorrhea, and suicide attempts</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Patient with AN (implied in title of paper), sex, sexual orientation, and living with boyfriend or girlfriend</td></tr><tr><td align="char" char="." valign="top">13 [<xref ref-type="bibr" rid="ref47">47</xref>]</td><td align="left" valign="top">Google Scholar; October 13, 2023: (&#x201C;case report&#x201D; OR &#x201C;case series&#x201D;) AND (anorexia OR bulimia) AND &#x201C;psychotherapy,&#x201D; since 2000</td><td align="left" valign="top">GAF score, amenorrhea, and suicide attempts</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Patient with AN (implied in title of paper), sex, sexual orientation, and living with boyfriend or girlfriend</td></tr><tr><td align="char" char="." valign="top">14 [<xref ref-type="bibr" rid="ref47">47</xref>]</td><td align="left" valign="top">Google Scholar; October 13, 2023: (&#x201C;case report&#x201D; OR &#x201C;case series&#x201D;) AND (anorexia OR bulimia) AND &#x201C;psychotherapy,&#x201D; since 2000</td><td align="left" valign="top">GAF score, amenorrhea, suicide ideation, and self-mutilation</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Patient with AN (implied in title of paper), sex, sexual orientation, and living with boyfriend or girlfriend</td></tr><tr><td align="char" char="." valign="top">15 [<xref ref-type="bibr" rid="ref48">48</xref>]</td><td align="left" valign="top">PubMed, August 11, 2023: eating disorder filter for &#x201C;case report,&#x201D; since 2000</td><td align="left" valign="top">Menses, not sexually active</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Living with boyfriend or girlfriend</td></tr><tr><td align="char" char="." valign="top">16 [<xref ref-type="bibr" rid="ref48">48</xref>]</td><td align="left" valign="top">PubMed, August 11, 2023: eating disorder filter for &#x201C;case report,&#x201D; since 2000</td><td align="left" valign="top">Medication details, menstrual cycle</td><td align="left" valign="top"/><td align="left" valign="top">Living with boyfriend or girlfriend</td></tr><tr><td align="char" char="." valign="top">17 [<xref ref-type="bibr" rid="ref48">48</xref>]</td><td align="left" valign="top">PubMed, August 11, 2023: eating disorder filter for &#x201C;case report,&#x201D; since 2000</td><td align="left" valign="top">Menstrual cycle</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Living with husband or wife (&#x003E;30 years)</td></tr><tr><td align="char" char="." valign="top">18 [<xref ref-type="bibr" rid="ref49">49</xref>]</td><td align="left" valign="top">PubMed, August 11, 2023: eating disorder filter for &#x201C;case report,&#x201D; since 2000</td><td align="left" valign="top">Sexual abuse, drugs or alcohol, suicide</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Living with husband or wife</td></tr><tr><td align="char" char="." valign="top">19 [<xref ref-type="bibr" rid="ref49">49</xref>]</td><td align="left" valign="top">PubMed, August 11, 2023: eating disorder filter for &#x201C;case report,&#x201D; since 2000</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Living with boyfriend or girlfriend</td></tr><tr><td align="char" char="." valign="top">20 [<xref ref-type="bibr" rid="ref50">50</xref>]</td><td align="left" valign="top">PubMed, August 11, 2023: eating disorder filter for &#x201C;case report,&#x201D; since 2000</td><td align="left" valign="top">Suicidal ideation</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Living with husband or wife (&#x003E;30 years)</td></tr><tr><td align="char" char="." valign="top">21 [<xref ref-type="bibr" rid="ref51">51</xref>]</td><td align="left" valign="top">Google Scholar; October 13, 2023: (&#x201C;case report&#x201D; OR &#x201C;case series&#x201D;) AND (anorexia OR bulimia) AND &#x201C;psychotherapy,&#x201D; since 2000</td><td align="left" valign="top">Substance abuse</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Living with boyfriend or girlfriend</td></tr><tr><td align="char" char="." valign="top">22 [<xref ref-type="bibr" rid="ref52">52</xref>]</td><td align="left" valign="top">Google Scholar; October 13, 2023: (&#x201C;case report&#x201D; OR &#x201C;case series&#x201D;) AND (anorexia OR bulimia) AND &#x201C;psychotherapy,&#x201D; since 2000</td><td align="left" valign="top">Diagnostic manual and citation, name of measure, scientific consent, treated by author, and height (unrealistic if changed to male sex)</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Living with boyfriend or girlfriend</td></tr><tr><td align="char" char="." valign="top">23 [<xref ref-type="bibr" rid="ref53">53</xref>]</td><td align="left" valign="top">Google Scholar; October 13, 2023: (&#x201C;case report&#x201D; OR &#x201C;case series&#x201D;) AND (anorexia OR bulimia) AND &#x201C;psychotherapy,&#x201D; since 2000</td><td align="left" valign="top">City, education, menstrual irregularities, and weight (unrealistic if changed to male sex)</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Living with boyfriend or girlfriend</td></tr><tr><td align="char" char="." valign="top">24 [<xref ref-type="bibr" rid="ref54">54</xref>]</td><td align="left" valign="top">Google Scholar; October 13, 2023: (&#x201C;case report&#x201D; OR &#x201C;case series&#x201D;) AND (anorexia OR bulimia) AND &#x201C;psychotherapy,&#x201D; since 2000</td><td align="left" valign="top">PTSD<sup><xref ref-type="table-fn" rid="table1fn4">d</xref></sup>, sexual abuse, mens, and study</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Living with boyfriend or girlfriend</td></tr><tr><td align="char" char="." valign="top">25 [<xref ref-type="bibr" rid="ref54">54</xref>]</td><td align="left" valign="top">Google Scholar; October 13, 2023: (&#x201C;case report&#x201D; OR &#x201C;case series&#x201D;) AND (anorexia OR bulimia) AND &#x201C;psychotherapy,&#x201D; since 2000</td><td align="left" valign="top">Sexual abuse, PTSD, and mens or menopause</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Living with husband or wife (&#x003E;30 years)</td></tr><tr><td align="char" char="." valign="top">26 [<xref ref-type="bibr" rid="ref54">54</xref>]</td><td align="left" valign="top">Google Scholar; October 13, 2023: (&#x201C;case report&#x201D; OR &#x201C;case series&#x201D;) AND (anorexia OR bulimia) AND &#x201C;psychotherapy,&#x201D; since 2000</td><td align="left" valign="top">Enrollment in study</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Living with boyfriend or girlfriend</td></tr><tr><td align="char" char="." valign="top">27 [<xref ref-type="bibr" rid="ref55">55</xref>]</td><td align="left" valign="top">Google Scholar; October 13, 2023: (&#x201C;case report&#x201D; OR &#x201C;case series&#x201D;) AND (anorexia OR bulimia) AND &#x201C;psychotherapy,&#x201D; since 2000</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Living with husband or wife (&#x003E;30 years)</td></tr><tr><td align="char" char="." valign="top">28 [<xref ref-type="bibr" rid="ref56">56</xref>]</td><td align="left" valign="top">Google Scholar; October 13, 2023: (&#x201C;case report&#x201D; OR &#x201C;case series&#x201D;) AND (anorexia OR bulimia) AND &#x201C;psychotherapy,&#x201D; since 2000</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Living with boyfriend or girlfriend</td></tr><tr><td align="char" char="." valign="top">29 [<xref ref-type="bibr" rid="ref57">57</xref>]</td><td align="left" valign="top">Google Scholar; October 13, 2023: (&#x201C;case report&#x201D; OR &#x201C;case series&#x201D;) AND (anorexia OR bulimia) AND &#x201C;psychotherapy,&#x201D; since 2000</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Living with husband or wife (&#x003E;30 years)</td></tr><tr><td align="char" char="." valign="top">30 [<xref ref-type="bibr" rid="ref58">58</xref>]</td><td align="left" valign="top">Google Scholar; October 13, 2023: (&#x201C;case report&#x201D; OR &#x201C;case series&#x201D;) AND (anorexia OR bulimia) AND &#x201C;psychotherapy,&#x201D; since 2000</td><td align="left" valign="top">Height (unrealistic if changed to male sex)</td><td align="left" valign="top">&#x201C;Single&#x201D; changed to &#x201C;living with boyfriend or girlfriend&#x201D;</td><td align="left" valign="top">&#x2014;</td></tr></tbody></table><table-wrap-foot><fn id="table1fn1"><p><sup>a</sup>GAF: global assessment of functioning.</p></fn><fn id="table1fn2"><p><sup>b</sup>Not applicable.</p></fn><fn id="table1fn3"><p><sup>c</sup>AN: anorexia nervosa.</p></fn><fn id="table1fn4"><p><sup>d</sup>PTSD: posttraumatic stress disorder.</p></fn></table-wrap-foot></table-wrap></sec><sec id="s2-2"><title>Ethical Considerations</title><p>We did not collect any data from human subjects within our study but instead conducted analyses on case vignettes that were previously published in a fully anonymized way in peer-reviewed, easily accessible journals. Therefore, no ethics application was required for this study.</p></sec><sec id="s2-3"><title>Data Generation</title><p>In 3 rounds, each vignette was fed into ChatGPT-4 with the instruction to evaluate them by providing responses to 1 of the 2 psychometric instruments. This resulted in a total of 720 vignette evaluations (120 vignettes &#x00D7; 3 rounds &#x00D7; 2 measures). ChatGPT-4 was opened in an internet browser (Google Chrome) with the chat history turned off to avoid a learning effect from the repeated evaluation of case vignettes. In the &#x201C;custom instructions&#x201D; settings, the instruction &#x201C;Set the temperature of your replies to 0&#x201D; was included. This instruction minimizes randomness in the text generation process and ensures maximum replicability, high precision, and factual accuracy. Data were generated between October and December 2023. See <xref ref-type="other" rid="box1">Textbox 1</xref> for an example of a prompt. Data generation in MentaLLaMA had to be substantially adapted (<xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>).</p><boxed-text id="box1"><title> An example prompt for 1 of the 120 vignettes.</title><p>Take up the role of a clinical psychologist. Imagine that you see a patient described by the following case vignette.</p><p>&#x201C;A 21-year-old university student living with her boyfriend self-refers with concerns about her 7-year use of laxatives to control weight gain. She is eating daily without vomiting, but admits to binge-eating episodes three or four times weekly during the past 2 years. Compensatory vomiting stopped 6 months ago. She does not overexercise. Her BMI is low at 17.8, and her vital signs are normal. She admits to recent increased fatigue with occasional exertional dyspnea and daily diarrhea. She has been hospitalized twice in the past 3 years for dehydration not recognized as related to her laxative abuse.&#x201D;</p><p>Based on the information given, what would be your best estimate regarding the following questions that refer to the case vignette:</p><p>So even though originally the questions are meant as self-report, apply them as questions to be replied as observer and provide the respective best estimate regarding the following questions that refer to the case vignette:</p><p>[One of the 2 measures in their original format]</p><p>Reply to each question with the reply categories:</p><p>[Original reply categories of the measure]</p><p>If no estimate can be given for a question, code it as 999.</p><p>Provide the estimates as a simple table. In this table, provide each question as a new variable with the corresponding values in 2 columns, 1 column containing the question number in ascending order and 1 column containing ONLY the numerical values. Provide the entire table.</p></boxed-text></sec><sec id="s2-4"><title>Measures</title><sec id="s2-4-1"><title>RAND 36-Item Short Form Health Survey Version 1.0 (SF-36)</title><p>The SF-36 [<xref ref-type="bibr" rid="ref59">59</xref>] assesses HRQoL and consists of 8 subscales: physical functioning, bodily pain, role limitations due to physical health problems, role limitations due to personal or emotional problems, emotional well-being, social functioning, energy or fatigue, and general health perceptions. From these subscales, the mental composite summary (MCS; comprising role limitations due to personal or emotional problems, emotional well-being, social functioning, and energy or fatigue), as well as a physical composite score (PCS), can be calculated. Evidence suggests that in EDs, MCS is more affected than PCS [<xref ref-type="bibr" rid="ref60">60</xref>]; thus, this score was selected for this study. Furthermore, the SF-36 includes a single item assessing perceived change in health, which is not included in any of the subscales. Items are answered either with &#x201C;yes/no&#x201D; or on different Likert scales and then recoded to values ranging from 0 to 100, with higher scores indicating better HRQoL. To calculate the MCS, the authors have suggested an approach [<xref ref-type="bibr" rid="ref61">61</xref>] in which first, the subscales are <italic>z</italic>-transformed using means and SDs from the general US population; second, the subscales are aggregated by weighing them with coefficients from the general US population; and third, a <italic>t</italic>-score transformation is performed (mean 50, SD 10). This approach has been criticized for distorting the raw scores, and it was found that simply calculating the MCS by forming the mean of the 4 subscales resulted in satisfactory validity [<xref ref-type="bibr" rid="ref62">62</xref>]. In this study, the simple approach was chosen because on the one hand, only the MCS was investigated and therefore a potential correlation with the PCS would not pose a problem. On the other hand, the choice of population that the scores are <italic>z</italic>-standardized and weighed with makes assumptions on the origin of data that ChatGPT-4 were trained with, something that is not entirely known and therefore could distort our data.</p></sec><sec id="s2-4-2"><title>Eating Disorder Examination Questionnaire</title><p>The eating disorder examination questionnaire (EDE-Q) [<xref ref-type="bibr" rid="ref63">63</xref>] assesses ED symptomatology during the previous 28 days. It consists of 4 subscales: dietary restraint, weight concern, shape concern, and eating concern. By calculating the mean of these subscales, a global score can be formed. Items are answered on a scale ranging from 0 to 6, with 6 reflecting the greatest severity or frequency of ED symptoms.</p></sec></sec><sec id="s2-5"><title>Statistical Analysis</title><p>Data from ChatGPT-4 and MentaLLaMA replies were copied to an Excel sheet, indicating the vignette number, gender, sexual orientation, and round number. Female gender and heterosexual orientation were coded as &#x201C;0.&#x201D; We performed all analyses in RStudio [<xref ref-type="bibr" rid="ref64">64</xref>]. Data quality of MentaLLaMA results was low and yielded no reliable results (<xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). For the main outcome analyses of ChatGPT-4 replies, we used the package &#x201C;lme4&#x201D; [<xref ref-type="bibr" rid="ref65">65</xref>], which is suitable to calculate linear multilevel models (MLMs) with crossed random-effects structure [<xref ref-type="bibr" rid="ref66">66</xref>]. This approach was chosen to take the repeated evaluation (3 rounds) of each vignette as well as the main and interaction effects of gender and sexual orientation into account. These MLMs included a random intercept for vignettes (accounting for between-vignette variance), as well as a random intercept for the gender &#x00D7; sexual orientation interaction nested in vignettes (accounting for within-vignette variance). This resulted in the formula:</p><disp-formula id="E1"><mml:math id="eqn1"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mrow><mml:mtext mathvariant="italic">Outcome</mml:mtext><mml:mo>&#x223C;</mml:mo><mml:mtext mathvariant="italic">Gender</mml:mtext><mml:mo>&#x00D7;</mml:mo><mml:mtext mathvariant="italic">Orientation</mml:mtext><mml:mo mathvariant="italic">+</mml:mo><mml:mo mathvariant="italic" stretchy="false">(</mml:mo><mml:mtext mathvariant="italic">interaction</mml:mtext><mml:mo mathvariant="italic" stretchy="false">(</mml:mo><mml:mtext mathvariant="italic">Gender</mml:mtext><mml:mo mathvariant="italic">,</mml:mo><mml:mtext mathvariant="italic">Orientation</mml:mtext><mml:mo mathvariant="italic" stretchy="false">)</mml:mo><mml:mrow><mml:mo mathvariant="italic" stretchy="false">|</mml:mo></mml:mrow><mml:mtext mathvariant="italic">Vignette</mml:mtext><mml:mo mathvariant="italic" stretchy="false">)</mml:mo></mml:mrow></mml:mrow></mml:mstyle></mml:math></disp-formula><p>We plotted the results using <italic>ggplot2</italic> [<xref ref-type="bibr" rid="ref67">67</xref>].</p></sec></sec><sec id="s3" sec-type="results"><title>Results</title><sec id="s3-1"><title>Descriptives</title><p><xref ref-type="table" rid="table2">Table 2</xref> shows the unconditional means of the MCS and EDE-Q. For the SF-36, there were 1.19% of missing values in items included in the MCS. For the EDE-Q, there were 0.76% of missing values in items included in the overall score (coded &#x201C;999&#x201D; by ChatGPT-4 and recoded to a missing value). Interrater reliability measured by the intraclass correlation coefficient was moderate for both measures (0.71 for the MCS and 0.56 for the EDE-Q).</p><table-wrap id="t2" position="float"><label>Table 2.</label><caption><p>Means and SDs of the 2 outcome measures for each of the 4 subgroups.</p></caption><table id="table2" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Characteristics</td><td align="left" valign="bottom">MCS<sup><xref ref-type="table-fn" rid="table2fn1">a</xref></sup>, mean (SD)</td><td align="left" valign="bottom">EDE-Q<sup><xref ref-type="table-fn" rid="table2fn2">b</xref></sup>, mean (SD)</td></tr></thead><tbody><tr><td align="left" valign="top"><bold>Female gender</bold></td><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Overall (n=180)</td><td align="left" valign="top">15.1 (15.6)</td><td align="left" valign="top">5.61 (0.52)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Heterosexual (n=90)</td><td align="left" valign="top">15.3 (16.3)</td><td align="left" valign="top">5.63 (0.49)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Homosexual (n=90)</td><td align="left" valign="top">14.8 (14.9)</td><td align="left" valign="top">5.60 (0.55)</td></tr><tr><td align="left" valign="top"><bold>Male gender</bold></td><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Overall (n=180)</td><td align="left" valign="top">12.8 (14.2)</td><td align="left" valign="top">5.65 (0.47)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Heterosexual (n=90)</td><td align="left" valign="top">12.1 (12.5)</td><td align="left" valign="top">5.64 (0.51)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Homosexual (n=90)</td><td align="left" valign="top">13.6 (15.7)</td><td align="left" valign="top">5.65 (0.42)</td></tr></tbody></table><table-wrap-foot><fn id="table2fn1"><p><sup>a</sup>MCS: mental composite summary of the RAND 36-item short form survey.</p></fn><fn id="table2fn2"><p><sup>b</sup>EDE-Q: eating disorder examination questionnaire.</p></fn></table-wrap-foot></table-wrap></sec><sec id="s3-2"><title>Main Outcomes</title><p>For the MCS, the MLM with 360 observations indicated a significant effect of gender, with men having a lower MCS score (conditional means: 12.8 for male and 15.1 for female cases; 95% CI of the effect &#x2212;6.15 to &#x2212;0.35; <xref ref-type="fig" rid="figure1">Figure 1</xref>), with no indications of an effect of sexual orientation or an interaction effect. For the EDE-Q overall score, there were no indications for main effects of gender (conditional means: 5.65 for male and 5.61 for female cases); significant main effects of gender (conditional means: 5.65 for male and 5.61 for female cases; 95% CI &#x2013;0.10 to 0.14; <italic>P</italic>=.88), sexual orientation (conditional means: 5.63 for heterosexual and 5.62 for homosexual cases; 95% CI &#x2013;0.14 to 0.09; <italic>P</italic>=.67), or for an interaction effect (<italic>P</italic>=.61, 95% CI &#x2013;0.11 to 0.19). See <xref ref-type="table" rid="table3">Table 3</xref> for estimates of main and interaction effects and respective <italic>P</italic> values and 95% CIs of the estimates.</p><fig position="float" id="figure1"><label>Figure 1.</label><caption><p>Lower HRQoL in men compared with women. HRQoL: health-related quality of life.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="mental_v12i1e57986_fig01.png"/></fig><table-wrap id="t3" position="float"><label>Table 3.</label><caption><p>Estimates calculated in the multilevel model.</p></caption><table id="table3" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Characteristics</td><td align="left" valign="bottom">MCS<sup><xref ref-type="table-fn" rid="table3fn1">a</xref></sup>, estimate (<italic>P</italic> value), 95% CI</td><td align="left" valign="bottom">EDE-Q<sup><xref ref-type="table-fn" rid="table3fn2">b</xref></sup>, estimate (<italic>P</italic> value), 95% CI</td></tr></thead><tbody><tr><td align="left" valign="top">Gender</td><td align="left" valign="top">&#x2212;3.25 (.04), &#x2212;6.15 to &#x2212;0.35</td><td align="left" valign="top">&#x2212;0.02 (.88), &#x2212;0.10 to 0.14</td></tr><tr><td align="left" valign="top">Sexual orientation</td><td align="left" valign="top">&#x2212;0.50 (.71), &#x2212;3.04 to 2.05</td><td align="left" valign="top">&#x2212;0.03 (.67), &#x2212;0.14 to 0.09</td></tr><tr><td align="left" valign="top">Gender &#x00D7; Sexual orientation</td><td align="left" valign="top">1.93 (.37), &#x2212;2.18 to 6.04</td><td align="left" valign="top">0.04 (.61), &#x2212;0.11 to 0.19</td></tr></tbody></table><table-wrap-foot><fn id="table3fn1"><p><sup>a</sup>MCS: mental composite summary of the RAND 36-item short form survey.</p></fn><fn id="table3fn2"><p><sup>b</sup>EDE-Q: eating disorder examination questionnaire.</p></fn></table-wrap-foot></table-wrap></sec></sec><sec id="s4" sec-type="discussion"><title>Discussion</title><sec id="s4-1"><title>Principal Results</title><p>We investigated whether gender and sexual orientation in AN and BN case vignettes would influence mental HRQoL and ED severity estimates by ChatGPT-4, a commonly used LLM. Quadruples of 30 case vignettes from scientific papers were modified in a way that only information on gender and sexual orientation varied across vignettes of the same quadruple. Vignettes were then fed into ChatGPT-4 with the instruction to estimate scores of 2 widely used psychometric instruments for assessing HRQoL (MCS of the SF-36) and ED symptomatology (EDE-Q). Findings indicated no effect of gender or sexual orientation in ED severity. Of note, the EDE-Q scores were very high, which might have led to ceiling effects. For the MCS, there was an effect of gender but not of sexual orientation, with vignettes describing men resulting in lower MCS than vignettes describing women. Thus, ChatGPT-4 assumed a greater impairment in mental HRQoL for men compared with women with similar ED severity. Since there is no evidence from previous studies that supports this finding, this can be considered a bias.</p></sec><sec id="s4-2"><title>Interpretation</title><p>While the effect for gender was statistically significant, it is also important to consider the minimal clinically important difference (MCID), that is, to evaluate whether differences in scores would be clinically relevant [<xref ref-type="bibr" rid="ref68">68</xref>]. For the MCS, the MCID has been estimated to be between 3 and 9 points [<xref ref-type="bibr" rid="ref69">69</xref>,<xref ref-type="bibr" rid="ref70">70</xref>]. With a difference of 2.3, the gender effect found in this study was slightly below an MCID. However, a longitudinal study showed that MCS scores in patients with ED improved only 1-6 points during 2 years of treatment although ED symptoms improved markedly, which highlights the clinical relevance of below-MCID differences in MCS scores in participants with ED [<xref ref-type="bibr" rid="ref71">71</xref>].</p><p>Of note, the EDE-Q scores generated by ChatGPT-4 were around 1.6 points above the scores reported in ED samples [<xref ref-type="bibr" rid="ref72">72</xref>-<xref ref-type="bibr" rid="ref74">74</xref>]. Likewise, the MCS scores generated by ChatGPT-4 were around 20 points below mean scores in other ED cohorts [<xref ref-type="bibr" rid="ref75">75</xref>,<xref ref-type="bibr" rid="ref76">76</xref>]. This has implications on the evaluation of the MCID, as potential floor effects need to be considered.</p><p>The gender bias delivered by ChatGPT-4 could be due to social roles assuming general lower mental problems in men than in women and consequently evoking more attention if mental problems are identified. Thus, ChatGPT-4 might mirror possible prejudices, which should be taken up as a nudge to try to correct these prejudices in real life. In the field of EDs, the role of gender, sexual orientation, and the influence of stigmatization and biases in our society need to be understood better [<xref ref-type="bibr" rid="ref46">46</xref>,<xref ref-type="bibr" rid="ref77">77</xref>].</p></sec><sec id="s4-3"><title>Strengths and Limitations</title><p>Our study has several strengths: First, real vignettes from scientific publications were used and varied in a way that the distinct influence of gender and sexual orientation could be singled out. To our knowledge, this is the first study that tests a potential bias when instructing an LLM to evaluate clinical cases with the use of psychometric instruments. Second, while many studies mentioned in this paper have used ChatGPT-3.5, we used ChatGPT-4, which has been shown to perform better in the field of mental health (<xref ref-type="bibr" rid="ref18">18</xref>). Furthermore, we attempted to repeat the analyses in MentaLLaMA, which is fine-tuned for the mental health domain. Third, by applying repeated testing, we reached a much larger sample size than other vignette studies, ensuring sufficient power for our analyses.</p><p>This study also has limitations. First, the gender ratio of the original vignettes was not balanced (only 2 male vignettes), which might have had an impact on the evaluation of these vignettes. However, this ratio approximately reflects the gender ratio of AN and BN in the general population. Second, although we sought to set the temperature to zero and followed available instructions to do so when using the applied interface, we could not verify whether the setting of the temperature via &#x201C;custom instructions&#x201D; actually resulted in respective changes in the system setting of the temperature. Finally, the deviations in EDE-Q and MCS scores raise the question whether scores generated by ChatGPT-4 can be transferred to scores reported in ED research and highlight that the use of LLMs for scoring patient vignettes is still in the fledging stages.</p></sec><sec id="s4-4"><title>Implications and Future Directions</title><p>Our findings highlight the importance of examining biases in LLMs in the context of (mental) health care. Future studies should investigate the generalizability of these findings by exploring biases in other LLMs as well as in other fields of (mental) health. As ChatGPT-4 has been found to disregard conditions that are understudied [<xref ref-type="bibr" rid="ref26">26</xref>], being aware of research and knowledge gaps as well as existing biases and stigma in society when using and training LLMs is of high importance. Furthermore, potential mitigation strategies for biases introduced by LLMs should be investigated. Although AI is not widely used yet in the assessment of disorders, it is already used in assisting doctor&#x2019;s decision-making [ <xref ref-type="bibr" rid="ref66">66</xref>,<xref ref-type="bibr" rid="ref67">67</xref>]. Furthermore, ChatGPT-3.5 has been used to generate more diverse and inclusive case vignettes to be used in medical education [<xref ref-type="bibr" rid="ref78">78</xref>]. It has been proposed that in health care, specially trained LLMs are needed, as ChatGPT-4 was not intended to be used in a clinical context [<xref ref-type="bibr" rid="ref79">79</xref>] and was deemed unreliable in offering personalized medical advice [<xref ref-type="bibr" rid="ref27">27</xref>].</p><p>In an exploratory analysis, we attempted to replicate the analyses using MentaLLaMA, which is one of the very few available LLMs specialized for mental health topics with published scientific evidence [<xref ref-type="bibr" rid="ref80">80</xref>]. However, MentaLLama is based on an older LLM and therefore appears to have difficulties in conducting meaningful complex vignette assessments as needed for this study. When using MentaLLaMA, our prompting strategy had to be adapted by creating a separate prompt for every single question. Still, MentaLLaMA yielded insufficient interrater correlation coefficients. Thus, data quality was much lower compared with the more recent and advanced model, GPT-4, on which our main analyses were based, leading to findings with low reliability, thus providing very limited insight (<xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>).</p><p>More powerful LLMs in the field of mental health need to be developed and validated, given that more recent publicly available models lack published evidence of their scientific validation [<xref ref-type="bibr" rid="ref81">81</xref>]. When training specialized LLMs, policy makers should make sure that measures are taken to minimize biases in the training material and that proposed frameworks for responsible AI [<xref ref-type="bibr" rid="ref82">82</xref>] are considered. A potential next step could be to program LLMs or AI systems as &#x201C;verifiers&#x201D; to check for biases in specialized LLMs, using a similar methodology to that used in this study. This would establish an additional layer of scrutiny and validation, enhancing the reliability and fairness of LLM applications in mental health care. In a clinical context, it is important to understand the precision with which LLMs can interpret and apply information from case vignettes or patient records, compared with the accuracy achieved when affected patients complete these assessments themselves.</p></sec><sec id="s4-5"><title>Conclusions</title><p>This study showed that ChatGPT-4 might exhibit a potential gender bias when evaluating ED symptomatology and mental HRQoL. Researchers as well as clinicians should be aware of potential biases when using LLMs to support clinical decision-making. Better understanding and mitigation of risk of bias related to gender and other factors, such as ethnicity or socioeconomic status, are highly warranted to ensure responsible use of LLMs.</p></sec></sec></body><back><ack><p>R Schnepper is funded by the Swiss State Secretariat for Education, Research and Innovation (SERI, under funding number: 22.00094) in the context of a European Union (Horizon Europe) research consortium &#x201C;Long Covid&#x201D; (funding number: 101057553). The publication was funded and supported by the Open Access Fund of Universit&#x00E4;t Trier and by the German Research Foundation (DFG).</p></ack><fn-group><fn fn-type="con"><p>R Schnepper contributed to the conceptualization, methodology, and data collection; conducted the formal analysis; and wrote the original draft of the paper. NR contributed to the writing of the original draft. R Schaefert contributed to the conceptualization and manuscript review and editing. LL contributed to the conceptualization and manuscript review and editing. GM contributed to the conceptualization, methodology, data collection, formal analysis, writing the original draft, and manuscript review and editing. All authors read and approved the final submitted version of the paper.</p></fn><fn fn-type="conflict"><p>R Schaefert and GM received funding from the Stanley Thomas Johnson Stiftung and Gottfried &#x0026; Julia Bangerter-Rhyner-Stiftung under projects nos. PC 28/17 and PC 05/18, from Gesundheitsf&#x00F6;rderung Schweiz under project no. 18.191/K50001, and in the context of a Horizon Europe project from the Swiss State Secretariat for Education, Research and Innovation (SERI) under contract number 22.00094 and from Wings Health in the context of a proof-of-concept study. GM received funding from the Swiss Heart Foundation under project no. FF21101, from the Research Foundation of the International Psychoanalytic University (IPU) Berlin under projects nos. 5087 and 5217, from the German Federal Ministry of Education and Research under budget item 68606, and from the Hasler Foundation under project no. 23004. GM is a cofounder, member of the board, and shareholder of Therayou AG, and active in digital and blended mental health care. GM receives royalties from publishing companies as author, including a book published by Springer, and an honorarium from Lundbeck for speaking at a symposium. Furthermore, GM is compensated for providing psychotherapy to patients, acting as a supervisor, serving as a self-experience facilitator ("Selbsterfahrungsleiter"), and for postgraduate training of psychotherapists, psychosomatic specialists, and supervisors. NR is a coworker at Therayou AG, active in digital and blended mental health care. NR received funding from the Hasler Foundation under project no. 23004 and from Wings Health AG in the context of a proof-of-concept study.</p></fn></fn-group><glossary><title>Abbreviations</title><def-list><def-item><term id="abb1">AI</term><def><p>artificial intelligence</p></def></def-item><def-item><term id="abb2">AN</term><def><p>anorexia nervosa</p></def></def-item><def-item><term id="abb3">BN</term><def><p>bulimia nervosa</p></def></def-item><def-item><term id="abb4">ED</term><def><p>eating disorder</p></def></def-item><def-item><term id="abb5">EDE-Q</term><def><p>eating disorder examination questionnaire</p></def></def-item><def-item><term id="abb6">GAF</term><def><p>global assessment of functioning</p></def></def-item><def-item><term id="abb7">HRQoL</term><def><p>health-related quality of life</p></def></def-item><def-item><term id="abb8">ICC</term><def><p>intraclass correlation coefficient</p></def></def-item><def-item><term id="abb9">LLaMA</term><def><p>Large Language Model Meta AI</p></def></def-item><def-item><term id="abb10">LLM</term><def><p>large language model</p></def></def-item><def-item><term id="abb11">MCID</term><def><p>minimal clinically important difference</p></def></def-item><def-item><term id="abb12">MCS</term><def><p>mental composite summary</p></def></def-item><def-item><term id="abb13">MLM</term><def><p>multilevel model</p></def></def-item><def-item><term id="abb14">PCS</term><def><p>physical composite summary</p></def></def-item><def-item><term id="abb15">PTSD</term><def><p>posttraumatic stress disorder</p></def></def-item></def-list></glossary><ref-list><title>References</title><ref id="ref1"><label>1</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Demszky</surname><given-names>D</given-names> </name><name name-style="western"><surname>Yang</surname><given-names>D</given-names> </name><name name-style="western"><surname>Yeager</surname><given-names>DS</given-names> </name><etal/></person-group><article-title>Using large language models in psychology</article-title><source>Nat Rev Psychol</source><year>2023</year><volume>2</volume><fpage>688</fpage><lpage>701</lpage><pub-id pub-id-type="doi">10.1038/s44159-023-00241-5</pub-id></nlm-citation></ref><ref id="ref2"><label>2</label><nlm-citation citation-type="preprint"><person-group person-group-type="author"><collab>OpenAi</collab><name name-style="western"><surname>Achiam</surname><given-names>J</given-names> </name><name name-style="western"><surname>Adler</surname><given-names>S</given-names> </name><etal/></person-group><article-title>GPT-4 technical report</article-title><source>arXiv</source><comment>Preprint posted online on  Mar 15, 2023</comment><pub-id pub-id-type="doi">10.48550/arXiv.2303.08774</pub-id></nlm-citation></ref><ref id="ref3"><label>3</label><nlm-citation citation-type="web"><article-title>LaMDA: our breakthrough conversation technology</article-title><source>The Keyword</source><year>2021</year><access-date>2024-02-26</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://blog.google/technology/ai/lamda/">https://blog.google/technology/ai/lamda/</ext-link></comment></nlm-citation></ref><ref id="ref4"><label>4</label><nlm-citation citation-type="preprint"><person-group person-group-type="author"><name name-style="western"><surname>Touvron</surname><given-names>H</given-names> </name><name name-style="western"><surname>Lavril</surname><given-names>T</given-names> </name><name name-style="western"><surname>Izacard</surname><given-names>G</given-names> </name><etal/></person-group><article-title>Llama: open and efficient foundation language models</article-title><source>arXiv</source><comment>Preprint posted online on  Feb 27, 2023</comment><pub-id pub-id-type="doi">10.48550/arXiv.2302.13971</pub-id></nlm-citation></ref><ref id="ref5"><label>5</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Thirunavukarasu</surname><given-names>AJ</given-names> </name><name name-style="western"><surname>Ting</surname><given-names>DSJ</given-names> </name><name name-style="western"><surname>Elangovan</surname><given-names>K</given-names> </name><name name-style="western"><surname>Gutierrez</surname><given-names>L</given-names> </name><name name-style="western"><surname>Tan</surname><given-names>TF</given-names> </name><name name-style="western"><surname>Ting</surname><given-names>DSW</given-names> </name></person-group><article-title>Large language models in medicine</article-title><source>Nat Med</source><year>2023</year><month>08</month><volume>29</volume><issue>8</issue><fpage>1930</fpage><lpage>1940</lpage><pub-id pub-id-type="doi">10.1038/s41591-023-02448-8</pub-id><pub-id pub-id-type="medline">37460753</pub-id></nlm-citation></ref><ref id="ref6"><label>6</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Pennebaker</surname><given-names>JW</given-names> </name><name name-style="western"><surname>Mehl</surname><given-names>MR</given-names> </name><name name-style="western"><surname>Niederhoffer</surname><given-names>KG</given-names> </name></person-group><article-title>Psychological aspects of natural language. use: our words, our selves</article-title><source>Annu Rev Psychol</source><year>2003</year><volume>54</volume><issue>1</issue><fpage>547</fpage><lpage>577</lpage><pub-id pub-id-type="doi">10.1146/annurev.psych.54.101601.145041</pub-id><pub-id pub-id-type="medline">12185209</pub-id></nlm-citation></ref><ref id="ref7"><label>7</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>De Choudhury</surname><given-names>M</given-names> </name><name name-style="western"><surname>Gamon</surname><given-names>M</given-names> </name><name name-style="western"><surname>Counts</surname><given-names>S</given-names> </name><name name-style="western"><surname>Horvitz</surname><given-names>E</given-names> </name></person-group><article-title>Predicting depression via social media</article-title><source>ICWSM</source><year>2021</year><volume>7</volume><issue>1</issue><fpage>128</fpage><lpage>137</lpage><pub-id pub-id-type="doi">10.1609/icwsm.v7i1.14432</pub-id></nlm-citation></ref><ref id="ref8"><label>8</label><nlm-citation citation-type="preprint"><person-group person-group-type="author"><name name-style="western"><surname>Vaswani</surname><given-names>A</given-names> </name><name name-style="western"><surname>Shazeer</surname><given-names>N</given-names> </name><name name-style="western"><surname>Parmar</surname><given-names>N</given-names> </name><etal/></person-group><article-title>Attention is all you need</article-title><source>arXiv</source><comment>Preprint posted online on  Jun 12, 2017</comment><pub-id pub-id-type="doi">10.48550/arXiv.1706.03762</pub-id></nlm-citation></ref><ref id="ref9"><label>9</label><nlm-citation citation-type="book"><person-group person-group-type="author"><name name-style="western"><surname>Liddy</surname><given-names>ED</given-names> </name></person-group><article-title>Natural language processing</article-title><source>Encyclopedia of Library and Information Science</source><year>2001</year><publisher-name>Marcel Decker Inc</publisher-name></nlm-citation></ref><ref id="ref10"><label>10</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Meyer</surname><given-names>JG</given-names> </name><name name-style="western"><surname>Urbanowicz</surname><given-names>RJ</given-names> </name><name name-style="western"><surname>Martin</surname><given-names>PCN</given-names> </name><etal/></person-group><article-title>ChatGPT and large language models in academia: opportunities and challenges</article-title><source>BioData Min</source><year>2023</year><month>07</month><day>13</day><volume>16</volume><issue>1</issue><fpage>20</fpage><pub-id pub-id-type="doi">10.1186/s13040-023-00339-9</pub-id><pub-id pub-id-type="medline">37443040</pub-id></nlm-citation></ref><ref id="ref11"><label>11</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Boyd</surname><given-names>RL</given-names> </name><name name-style="western"><surname>Schwartz</surname><given-names>HA</given-names> </name></person-group><article-title>Natural language analysis and the psychology of verbal behavior: the past, present, and future states of the field</article-title><source>J Lang Soc Psychol</source><year>2021</year><month>01</month><volume>40</volume><issue>1</issue><fpage>21</fpage><lpage>41</lpage><pub-id pub-id-type="doi">10.1177/0261927x20967028</pub-id><pub-id pub-id-type="medline">34413563</pub-id></nlm-citation></ref><ref id="ref12"><label>12</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Rehm</surname><given-names>J</given-names> </name><name name-style="western"><surname>Shield</surname><given-names>KD</given-names> </name></person-group><article-title>Global burden of disease and the impact of mental and addictive disorders</article-title><source>Curr Psychiatry Rep</source><year>2019</year><month>02</month><day>7</day><volume>21</volume><issue>2</issue><fpage>10</fpage><pub-id pub-id-type="doi">10.1007/s11920-019-0997-0</pub-id><pub-id pub-id-type="medline">30729322</pub-id></nlm-citation></ref><ref id="ref13"><label>13</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Chaulagain</surname><given-names>A</given-names> </name><name name-style="western"><surname>Pacione</surname><given-names>L</given-names> </name><name name-style="western"><surname>Abdulmalik</surname><given-names>J</given-names> </name><etal/></person-group><article-title>WHO Mental Health Gap Action Programme Intervention Guide (mhGAP-IG): the first pre-service training study</article-title><source>Int J Ment Health Syst</source><year>2020</year><volume>14</volume><issue>1</issue><fpage>47</fpage><pub-id pub-id-type="doi">10.1186/s13033-020-00379-2</pub-id><pub-id pub-id-type="medline">32612675</pub-id></nlm-citation></ref><ref id="ref14"><label>14</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kjell</surname><given-names>ONE</given-names> </name><name name-style="western"><surname>Kjell</surname><given-names>K</given-names> </name><name name-style="western"><surname>Schwartz</surname><given-names>HA</given-names> </name></person-group><article-title>Beyond rating scales: with targeted evaluation, large language models are poised for psychological assessment</article-title><source>Psychiatry Res</source><year>2024</year><month>03</month><volume>333</volume><fpage>115667</fpage><pub-id pub-id-type="doi">10.1016/j.psychres.2023.115667</pub-id><pub-id pub-id-type="medline">38290286</pub-id></nlm-citation></ref><ref id="ref15"><label>15</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kjell</surname><given-names>ONE</given-names> </name><name name-style="western"><surname>Sikstr&#x00F6;m</surname><given-names>S</given-names> </name><name name-style="western"><surname>Kjell</surname><given-names>K</given-names> </name><name name-style="western"><surname>Schwartz</surname><given-names>HA</given-names> </name></person-group><article-title>Natural language analyzed with AI-based transformers predict traditional subjective well-being measures approaching the theoretical upper limits in accuracy</article-title><source>Sci Rep</source><year>2022</year><month>03</month><day>10</day><volume>12</volume><issue>1</issue><fpage>3918</fpage><pub-id pub-id-type="doi">10.1038/s41598-022-07520-w</pub-id><pub-id pub-id-type="medline">35273198</pub-id></nlm-citation></ref><ref id="ref16"><label>16</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Park</surname><given-names>G</given-names> </name><name name-style="western"><surname>Schwartz</surname><given-names>HA</given-names> </name><name name-style="western"><surname>Eichstaedt</surname><given-names>JC</given-names> </name><etal/></person-group><article-title>Automatic personality assessment through social media language</article-title><source>J Pers Soc Psychol</source><year>2015</year><month>06</month><volume>108</volume><issue>6</issue><fpage>934</fpage><lpage>952</lpage><pub-id pub-id-type="doi">10.1037/pspp0000020</pub-id><pub-id pub-id-type="medline">25365036</pub-id></nlm-citation></ref><ref id="ref17"><label>17</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kjell</surname><given-names>ONE</given-names> </name><name name-style="western"><surname>Kjell</surname><given-names>K</given-names> </name><name name-style="western"><surname>Garcia</surname><given-names>D</given-names> </name><name name-style="western"><surname>Sikstr&#x00F6;m</surname><given-names>S</given-names> </name></person-group><article-title>Semantic measures: using natural language processing to measure, differentiate, and describe psychological constructs</article-title><source>Psychol Methods</source><year>2019</year><month>02</month><volume>24</volume><issue>1</issue><fpage>92</fpage><lpage>115</lpage><pub-id pub-id-type="doi">10.1037/met0000191</pub-id><pub-id pub-id-type="medline">29963879</pub-id></nlm-citation></ref><ref id="ref18"><label>18</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Son</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Clouston</surname><given-names>SAP</given-names> </name><name name-style="western"><surname>Kotov</surname><given-names>R</given-names> </name><etal/></person-group><article-title>World Trade Center responders in their own words: predicting PTSD symptom trajectories with AI-based language analyses of interviews</article-title><source>Psychol Med</source><year>2023</year><month>02</month><volume>53</volume><issue>3</issue><fpage>918</fpage><lpage>926</lpage><pub-id pub-id-type="doi">10.1017/S0033291721002294</pub-id><pub-id pub-id-type="medline">34154682</pub-id></nlm-citation></ref><ref id="ref19"><label>19</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Levkovich</surname><given-names>I</given-names> </name><name name-style="western"><surname>Elyoseph</surname><given-names>Z</given-names> </name></person-group><article-title>Suicide risk assessments through the eyes of ChatGPT-3.5 versus ChatGPT-4: vignette study</article-title><source>JMIR Ment Health</source><year>2023</year><month>09</month><day>20</day><volume>10</volume><fpage>e51232</fpage><pub-id pub-id-type="doi">10.2196/51232</pub-id><pub-id pub-id-type="medline">37728984</pub-id></nlm-citation></ref><ref id="ref20"><label>20</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Franco D&#x2019;Souza</surname><given-names>R</given-names> </name><name name-style="western"><surname>Amanullah</surname><given-names>S</given-names> </name><name name-style="western"><surname>Mathew</surname><given-names>M</given-names> </name><name name-style="western"><surname>Surapaneni</surname><given-names>KM</given-names> </name></person-group><article-title>Appraising the performance of ChatGPT in psychiatry using 100 clinical case vignettes</article-title><source>Asian J Psychiatr</source><year>2023</year><month>11</month><volume>89</volume><fpage>103770</fpage><pub-id pub-id-type="doi">10.1016/j.ajp.2023.103770</pub-id></nlm-citation></ref><ref id="ref21"><label>21</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Ntoutsi</surname><given-names>E</given-names> </name><name name-style="western"><surname>Fafalios</surname><given-names>P</given-names> </name><name name-style="western"><surname>Gadiraju</surname><given-names>U</given-names> </name><etal/></person-group><article-title>Bias in data&#x2010;driven artificial intelligence systems&#x2014;an introductory survey</article-title><source>WIREs Data Mining Knowledge Discov</source><year>2020</year><month>05</month><volume>10</volume><issue>3</issue><pub-id pub-id-type="doi">10.1002/widm.1356</pub-id></nlm-citation></ref><ref id="ref22"><label>22</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Navigli</surname><given-names>R</given-names> </name><name name-style="western"><surname>Conia</surname><given-names>S</given-names> </name><name name-style="western"><surname>Ross</surname><given-names>B</given-names> </name></person-group><article-title>Biases in large language models: origins, inventory, and discussion</article-title><source>J Data Inf Qual</source><year>2023</year><month>06</month><day>30</day><volume>15</volume><issue>2</issue><fpage>1</fpage><lpage>21</lpage><pub-id pub-id-type="doi">10.1145/3597307</pub-id></nlm-citation></ref><ref id="ref23"><label>23</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Walsh</surname><given-names>CG</given-names> </name><name name-style="western"><surname>Chaudhry</surname><given-names>B</given-names> </name><name name-style="western"><surname>Dua</surname><given-names>P</given-names> </name><etal/></person-group><article-title>Stigma, biomarkers, and algorithmic bias: recommendations for precision behavioral health with artificial intelligence</article-title><source>JAMIA Open</source><year>2020</year><month>04</month><volume>3</volume><issue>1</issue><fpage>9</fpage><lpage>15</lpage><pub-id pub-id-type="doi">10.1093/jamiaopen/ooz054</pub-id><pub-id pub-id-type="medline">32607482</pub-id></nlm-citation></ref><ref id="ref24"><label>24</label><nlm-citation citation-type="preprint"><person-group person-group-type="author"><name name-style="western"><surname>Rahimi</surname><given-names>P</given-names> </name><name name-style="western"><surname>Ecabert</surname><given-names>C</given-names> </name><name name-style="western"><surname>Marce</surname><given-names>S</given-names> </name></person-group><article-title>Toward responsible face datasets: modeling the distribution of a disentangled latent space for sampling face images from demographic groups</article-title><source>arXiv</source><comment>Preprint posted online on  Sep 15, 2023</comment><pub-id pub-id-type="doi">10.48550/arXiv.2309.08442</pub-id></nlm-citation></ref><ref id="ref25"><label>25</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Chen</surname><given-names>IY</given-names> </name><name name-style="western"><surname>Szolovits</surname><given-names>P</given-names> </name><name name-style="western"><surname>Ghassemi</surname><given-names>M</given-names> </name></person-group><article-title>Can AI help reduce disparities in general medical and mental health care?</article-title><source>AMA J Ethics</source><year>2019</year><month>02</month><day>1</day><volume>21</volume><issue>2</issue><fpage>E167</fpage><lpage>E179</lpage><pub-id pub-id-type="doi">10.1001/amajethics.2019.167</pub-id><pub-id pub-id-type="medline">30794127</pub-id></nlm-citation></ref><ref id="ref26"><label>26</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Nacher</surname><given-names>M</given-names> </name><name name-style="western"><surname>Fran&#x00E7;oise</surname><given-names>U</given-names> </name><name name-style="western"><surname>Adenis</surname><given-names>A</given-names> </name></person-group><article-title>ChatGPT neglects a neglected disease</article-title><source>Lancet Infect Dis</source><year>2024</year><month>02</month><volume>24</volume><issue>2</issue><fpage>e76</fpage><pub-id pub-id-type="doi">10.1016/S1473-3099(23)00750-8</pub-id></nlm-citation></ref><ref id="ref27"><label>27</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Nastasi</surname><given-names>AJ</given-names> </name><name name-style="western"><surname>Courtright</surname><given-names>KR</given-names> </name><name name-style="western"><surname>Halpern</surname><given-names>SD</given-names> </name><name name-style="western"><surname>Weissman</surname><given-names>GE</given-names> </name></person-group><article-title>A vignette-based evaluation of ChatGPT&#x2019;s ability to provide appropriate and equitable medical advice across care contexts</article-title><source>Sci Rep</source><year>2023</year><month>10</month><day>19</day><volume>13</volume><issue>1</issue><fpage>17885</fpage><pub-id pub-id-type="doi">10.1038/s41598-023-45223-y</pub-id><pub-id pub-id-type="medline">37857839</pub-id></nlm-citation></ref><ref id="ref28"><label>28</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Zack</surname><given-names>T</given-names> </name><name name-style="western"><surname>Lehman</surname><given-names>E</given-names> </name><name name-style="western"><surname>Suzgun</surname><given-names>M</given-names> </name><etal/></person-group><article-title>Assessing the potential of GPT-4 to perpetuate racial and gender biases in health care: a model evaluation study</article-title><source>Lancet Digit Health</source><year>2024</year><month>01</month><volume>6</volume><issue>1</issue><fpage>e12</fpage><lpage>e22</lpage><pub-id pub-id-type="doi">10.1016/S2589-7500(23)00225-X</pub-id><pub-id pub-id-type="medline">38123252</pub-id></nlm-citation></ref><ref id="ref29"><label>29</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Mosteiro</surname><given-names>P</given-names> </name><name name-style="western"><surname>Kuiper</surname><given-names>J</given-names> </name><name name-style="western"><surname>Masthoff</surname><given-names>J</given-names> </name><name name-style="western"><surname>Scheepers</surname><given-names>F</given-names> </name><name name-style="western"><surname>Spruit</surname><given-names>M</given-names> </name></person-group><article-title>Bias discovery in machine learning models for mental health</article-title><source>Information</source><year>2022</year><volume>13</volume><issue>5</issue><fpage>237</fpage><pub-id pub-id-type="doi">10.3390/info13050237</pub-id></nlm-citation></ref><ref id="ref30"><label>30</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Roehrig</surname><given-names>JP</given-names> </name><name name-style="western"><surname>McLean</surname><given-names>CP</given-names> </name></person-group><article-title>A comparison of stigma toward eating disorders versus depression</article-title><source>Int J Eat Disord</source><year>2010</year><month>11</month><day>1</day><volume>43</volume><issue>7</issue><fpage>671</fpage><lpage>674</lpage><pub-id pub-id-type="doi">10.1002/eat.20760</pub-id><pub-id pub-id-type="medline">19816860</pub-id></nlm-citation></ref><ref id="ref31"><label>31</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Gallagher</surname><given-names>KA</given-names> </name><name name-style="western"><surname>Sonneville</surname><given-names>KR</given-names> </name><name name-style="western"><surname>Hazzard</surname><given-names>VM</given-names> </name><name name-style="western"><surname>Carson</surname><given-names>TL</given-names> </name><name name-style="western"><surname>Needham</surname><given-names>BL</given-names> </name></person-group><article-title>Evaluating gender bias in an eating disorder risk assessment questionnaire for athletes</article-title><source>Eat Disord</source><year>2021</year><volume>29</volume><issue>1</issue><fpage>29</fpage><lpage>41</lpage><pub-id pub-id-type="doi">10.1080/10640266.2019.1613846</pub-id><pub-id pub-id-type="medline">31079562</pub-id></nlm-citation></ref><ref id="ref32"><label>32</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Westmoreland</surname><given-names>P</given-names> </name><name name-style="western"><surname>Krantz</surname><given-names>MJ</given-names> </name><name name-style="western"><surname>Mehler</surname><given-names>PS</given-names> </name></person-group><article-title>Medical complications of anorexia nervosa and bulimia</article-title><source>Am J Med</source><year>2016</year><month>01</month><volume>129</volume><issue>1</issue><fpage>30</fpage><lpage>37</lpage><pub-id pub-id-type="doi">10.1016/j.amjmed.2015.06.031</pub-id><pub-id pub-id-type="medline">26169883</pub-id></nlm-citation></ref><ref id="ref33"><label>33</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Richard</surname><given-names>M</given-names> </name></person-group><article-title>Effective treatment of eating disorders in Europe: treatment outcome and its predictors</article-title><source>Eur Eat Disorders Rev</source><year>2005</year><month>05</month><volume>13</volume><issue>3</issue><fpage>169</fpage><lpage>179</lpage><pub-id pub-id-type="doi">10.1002/erv.636</pub-id></nlm-citation></ref><ref id="ref34"><label>34</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Galmiche</surname><given-names>M</given-names> </name><name name-style="western"><surname>D&#x00E9;chelotte</surname><given-names>P</given-names> </name><name name-style="western"><surname>Lambert</surname><given-names>G</given-names> </name><name name-style="western"><surname>Tavolacci</surname><given-names>MP</given-names> </name></person-group><article-title>Prevalence of eating disorders over the 2000-2018 period: a systematic literature review</article-title><source>Am J Clin Nutr</source><year>2019</year><month>05</month><day>1</day><volume>109</volume><issue>5</issue><fpage>1402</fpage><lpage>1413</lpage><pub-id pub-id-type="doi">10.1093/ajcn/nqy342</pub-id><pub-id pub-id-type="medline">31051507</pub-id></nlm-citation></ref><ref id="ref35"><label>35</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Gorrell</surname><given-names>S</given-names> </name><name name-style="western"><surname>Murray</surname><given-names>SB</given-names> </name></person-group><article-title>Eating disorders in males</article-title><source>Child Adolesc Psychiatr Clin N Am</source><year>2019</year><month>10</month><volume>28</volume><issue>4</issue><fpage>641</fpage><lpage>651</lpage><pub-id pub-id-type="doi">10.1016/j.chc.2019.05.012</pub-id><pub-id pub-id-type="medline">31443881</pub-id></nlm-citation></ref><ref id="ref36"><label>36</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Hudson</surname><given-names>JI</given-names> </name><name name-style="western"><surname>Hiripi</surname><given-names>E</given-names> </name><name name-style="western"><surname>Pope</surname><given-names>HG</given-names>  <suffix>Jr</suffix></name><name name-style="western"><surname>Kessler</surname><given-names>RC</given-names> </name></person-group><article-title>The prevalence and correlates of eating disorders in the National Comorbidity Survey Replication</article-title><source>Biol Psychiatry</source><year>2007</year><month>02</month><day>1</day><volume>61</volume><issue>3</issue><fpage>348</fpage><lpage>358</lpage><pub-id pub-id-type="doi">10.1016/j.biopsych.2006.03.040</pub-id><pub-id pub-id-type="medline">16815322</pub-id></nlm-citation></ref><ref id="ref37"><label>37</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Sweeting</surname><given-names>H</given-names> </name><name name-style="western"><surname>Walker</surname><given-names>L</given-names> </name><name name-style="western"><surname>MacLean</surname><given-names>A</given-names> </name><name name-style="western"><surname>Patterson</surname><given-names>C</given-names> </name><name name-style="western"><surname>R&#x00E4;is&#x00E4;nen</surname><given-names>U</given-names> </name><name name-style="western"><surname>Hunt</surname><given-names>K</given-names> </name></person-group><article-title>Prevalence of eating disorders in males: a review of rates reported in academic research and UK mass media</article-title><source>Int J Mens Health</source><year>2015</year><volume>14</volume><issue>2</issue><pub-id pub-id-type="doi">10.3149/jmh.1402.86</pub-id><pub-id pub-id-type="medline">26290657</pub-id></nlm-citation></ref><ref id="ref38"><label>38</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Timko</surname><given-names>CA</given-names> </name><name name-style="western"><surname>DeFilipp</surname><given-names>L</given-names> </name><name name-style="western"><surname>Dakanalis</surname><given-names>A</given-names> </name></person-group><article-title>Sex differences in adolescent anorexia and bulimia nervosa: beyond the signs and symptoms</article-title><source>Curr Psychiatry Rep</source><year>2019</year><month>01</month><day>12</day><volume>21</volume><issue>1</issue><fpage>1</fpage><pub-id pub-id-type="doi">10.1007/s11920-019-0988-1</pub-id><pub-id pub-id-type="medline">30637488</pub-id></nlm-citation></ref><ref id="ref39"><label>39</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>St&#x00F8;ving</surname><given-names>RK</given-names> </name><name name-style="western"><surname>Andries</surname><given-names>A</given-names> </name><name name-style="western"><surname>Brixen</surname><given-names>K</given-names> </name><name name-style="western"><surname>Bilenberg</surname><given-names>N</given-names> </name><name name-style="western"><surname>H&#x00F8;rder</surname><given-names>K</given-names> </name></person-group><article-title>Gender differences in outcome of eating disorders: a retrospective cohort study</article-title><source>Psychiatry Res</source><year>2011</year><month>04</month><day>30</day><volume>186</volume><issue>2-3</issue><fpage>362</fpage><lpage>366</lpage><pub-id pub-id-type="doi">10.1016/j.psychres.2010.08.005</pub-id><pub-id pub-id-type="medline">20826003</pub-id></nlm-citation></ref><ref id="ref40"><label>40</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Strobel</surname><given-names>C</given-names> </name><name name-style="western"><surname>Quadflieg</surname><given-names>N</given-names> </name><name name-style="western"><surname>Naab</surname><given-names>S</given-names> </name><name name-style="western"><surname>Voderholzer</surname><given-names>U</given-names> </name><name name-style="western"><surname>Fichter</surname><given-names>MM</given-names> </name></person-group><article-title>Long-term outcomes in treated males with anorexia nervosa and bulimia nervosa&#x2014;a prospective, gender-matched study</article-title><source>Int J Eat Disord</source><year>2019</year><month>12</month><volume>52</volume><issue>12</issue><fpage>1353</fpage><lpage>1364</lpage><pub-id pub-id-type="doi">10.1002/eat.23151</pub-id><pub-id pub-id-type="medline">31444805</pub-id></nlm-citation></ref><ref id="ref41"><label>41</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Bothe</surname><given-names>T</given-names> </name><name name-style="western"><surname>Walker</surname><given-names>J</given-names> </name><name name-style="western"><surname>Kr&#x00F6;ger</surname><given-names>C</given-names> </name></person-group><article-title>Gender-related differences in health-care and economic costs for eating disorders: a comparative cost-development analysis for anorexia and bulimia nervosa based on anonymized claims data</article-title><source>Int J Eat Disord</source><year>2022</year><month>01</month><volume>55</volume><issue>1</issue><fpage>61</fpage><lpage>75</lpage><pub-id pub-id-type="doi">10.1002/eat.23610</pub-id><pub-id pub-id-type="medline">34599621</pub-id></nlm-citation></ref><ref id="ref42"><label>42</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Brelet</surname><given-names>L</given-names> </name><name name-style="western"><surname>Flaudias</surname><given-names>V</given-names> </name><name name-style="western"><surname>D&#x00E9;sert</surname><given-names>M</given-names> </name><name name-style="western"><surname>Guillaume</surname><given-names>S</given-names> </name><name name-style="western"><surname>Llorca</surname><given-names>PM</given-names> </name><name name-style="western"><surname>Boirie</surname><given-names>Y</given-names> </name></person-group><article-title>Stigmatization toward people with anorexia nervosa, bulimia nervosa, and binge eating disorder: a scoping review</article-title><source>Nutrients</source><year>2021</year><month>08</month><day>18</day><volume>13</volume><issue>8</issue><fpage>2834</fpage><pub-id pub-id-type="doi">10.3390/nu13082834</pub-id><pub-id pub-id-type="medline">34444994</pub-id></nlm-citation></ref><ref id="ref43"><label>43</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Cao</surname><given-names>Z</given-names> </name><name name-style="western"><surname>Cini</surname><given-names>E</given-names> </name><name name-style="western"><surname>Pellegrini</surname><given-names>D</given-names> </name><name name-style="western"><surname>Fragkos</surname><given-names>KC</given-names> </name></person-group><article-title>The association between sexual orientation and eating disorders-related eating behaviours in adolescents: a systematic review and meta-analysis</article-title><source>Eur Eat Disord Rev</source><year>2023</year><month>01</month><volume>31</volume><issue>1</issue><fpage>46</fpage><lpage>64</lpage><pub-id pub-id-type="doi">10.1002/erv.2952</pub-id><pub-id pub-id-type="medline">36367345</pub-id></nlm-citation></ref><ref id="ref44"><label>44</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Boisvert</surname><given-names>JA</given-names> </name><name name-style="western"><surname>Harrell</surname><given-names>WA</given-names> </name></person-group><article-title>Homosexuality as a risk factor for eating disorder symptomatology in men</article-title><source>J Men Stud</source><year>2010</year><month>06</month><volume>17</volume><issue>3</issue><fpage>210</fpage><lpage>225</lpage><pub-id pub-id-type="doi">10.3149/jms.1703.210</pub-id></nlm-citation></ref><ref id="ref45"><label>45</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Str&#x00FC;bel</surname><given-names>J</given-names> </name><name name-style="western"><surname>Petrie</surname><given-names>TA</given-names> </name></person-group><article-title>Sexual orientation, eating disorder classification, and men&#x2019;s psychosocial well-being</article-title><source>Psychol Men Masculinities</source><year>2020</year><volume>21</volume><issue>2</issue><fpage>190</fpage><lpage>200</lpage><pub-id pub-id-type="doi">10.1037/men0000224</pub-id></nlm-citation></ref><ref id="ref46"><label>46</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Dotan</surname><given-names>A</given-names> </name><name name-style="western"><surname>Bachner-Melman</surname><given-names>R</given-names> </name><name name-style="western"><surname>Dahlenburg</surname><given-names>SC</given-names> </name></person-group><article-title>Sexual orientation and disordered eating in women: a meta-analysis</article-title><source>Eat Weight Disord</source><year>2021</year><volume>26</volume><issue>1</issue><fpage>13</fpage><lpage>25</lpage><pub-id pub-id-type="doi">10.1007/s40519-019-00824-3</pub-id></nlm-citation></ref><ref id="ref47"><label>47</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Garc&#x00ED;a-Anaya</surname><given-names>M</given-names> </name><name name-style="western"><surname>Caballero-Romo</surname><given-names>A</given-names> </name><name name-style="western"><surname>Gonz&#x00E1;lez-Mac&#x00ED;as</surname><given-names>L</given-names> </name></person-group><article-title>Parent-focused psychotherapy for the preventive management of chronicity in anorexia nervosa: a case series</article-title><source>Int J Environ Res Public Health</source><year>2022</year><month>08</month><day>3</day><volume>19</volume><issue>15</issue><fpage>15</fpage><pub-id pub-id-type="doi">10.3390/ijerph19159522</pub-id><pub-id pub-id-type="medline">35954879</pub-id></nlm-citation></ref><ref id="ref48"><label>48</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Olson</surname><given-names>AF</given-names> </name></person-group><article-title>Outpatient management of electrolyte imbalances associated with anorexia nervosa and bulimia nervosa</article-title><source>J Infus Nurs</source><year>2005</year><volume>28</volume><issue>2</issue><fpage>118</fpage><lpage>122</lpage><pub-id pub-id-type="doi">10.1097/00129804-200503000-00005</pub-id><pub-id pub-id-type="medline">15785332</pub-id></nlm-citation></ref><ref id="ref49"><label>49</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Gurevich</surname><given-names>MI</given-names> </name><name name-style="western"><surname>Chung</surname><given-names>MK</given-names> </name><name name-style="western"><surname>LaRiccia</surname><given-names>PJ</given-names> </name></person-group><article-title>Resolving bulimia nervosa using an innovative neural therapy approach: two case reports</article-title><source>Clin Case Rep</source><year>2018</year><month>02</month><volume>6</volume><issue>2</issue><fpage>278</fpage><lpage>282</lpage><pub-id pub-id-type="doi">10.1002/ccr3.1326</pub-id><pub-id pub-id-type="medline">29445463</pub-id></nlm-citation></ref><ref id="ref50"><label>50</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Manuelli</surname><given-names>M</given-names> </name><name name-style="western"><surname>Franzini</surname><given-names>A</given-names> </name><name name-style="western"><surname>Galentino</surname><given-names>R</given-names> </name><etal/></person-group><article-title>Changes in eating behavior after deep brain stimulation for anorexia nervosa. A case study</article-title><source>Eat Weight Disord</source><year>2020</year><month>10</month><volume>25</volume><issue>5</issue><fpage>1481</fpage><lpage>1486</lpage><pub-id pub-id-type="doi">10.1007/s40519-019-00742-4</pub-id><pub-id pub-id-type="medline">31290029</pub-id></nlm-citation></ref><ref id="ref51"><label>51</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Gonz&#x00E1;lez-Mac&#x00ED;as</surname><given-names>L</given-names> </name><name name-style="western"><surname>Caballero-Romo</surname><given-names>A</given-names> </name><name name-style="western"><surname>Garc&#x00ED;a-Anaya</surname><given-names>M</given-names> </name></person-group><article-title>Group family psychotherapy during relapse. Case report of a novel intervention for severe and enduring anorexia nervosa</article-title><source>Salud Mental</source><year>2021</year><month>02</month><day>9</day><volume>44</volume><issue>1</issue><fpage>31</fpage><lpage>37</lpage><pub-id pub-id-type="doi">10.17711/SM.0185-3325.2021.006</pub-id></nlm-citation></ref><ref id="ref52"><label>52</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Safer</surname><given-names>DL</given-names> </name><name name-style="western"><surname>Telch</surname><given-names>CF</given-names> </name><name name-style="western"><surname>Agras</surname><given-names>WS</given-names> </name></person-group><article-title>Dialectical behavior therapy adapted for bulimia: a case report</article-title><source>Int J Eat Disord</source><year>2001</year><month>07</month><volume>30</volume><issue>1</issue><fpage>101</fpage><lpage>106</lpage><pub-id pub-id-type="doi">10.1002/eat.1059</pub-id><pub-id pub-id-type="medline">11439414</pub-id></nlm-citation></ref><ref id="ref53"><label>53</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Srinivasa</surname><given-names>P</given-names> </name><name name-style="western"><surname>Chandrashekar</surname><given-names>M</given-names> </name><name name-style="western"><surname>Harish</surname><given-names>N</given-names> </name><name name-style="western"><surname>Gowda</surname><given-names>MR</given-names> </name><name name-style="western"><surname>Durgoji</surname><given-names>S</given-names> </name></person-group><article-title>Case report on anorexia nervosa</article-title><source>Indian J Psychol Med</source><year>2015</year><volume>37</volume><issue>2</issue><fpage>236</fpage><lpage>238</lpage><pub-id pub-id-type="doi">10.4103/0253-7176.155655</pub-id><pub-id pub-id-type="medline">25969616</pub-id></nlm-citation></ref><ref id="ref54"><label>54</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Berman</surname><given-names>MI</given-names> </name><name name-style="western"><surname>Boutelle</surname><given-names>KN</given-names> </name><name name-style="western"><surname>Crow</surname><given-names>SJ</given-names> </name></person-group><article-title>A case series investigating acceptance and commitment therapy as a treatment for previously treated, unremitted patients with anorexia nervosa</article-title><source>Eur Eat Disord Rev</source><year>2009</year><month>11</month><volume>17</volume><issue>6</issue><fpage>426</fpage><lpage>434</lpage><pub-id pub-id-type="doi">10.1002/erv.962</pub-id><pub-id pub-id-type="medline">19760625</pub-id></nlm-citation></ref><ref id="ref55"><label>55</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Viseu</surname><given-names>M</given-names> </name><name name-style="western"><surname>Oliveira</surname><given-names>A</given-names> </name><name name-style="western"><surname>Barbosa Pinto</surname><given-names>M</given-names> </name><name name-style="western"><surname>Sousa</surname><given-names>R</given-names> </name></person-group><article-title>A case report of anorexia nervosa&#x2014;the &#x201C;perfect&#x201C; woman</article-title><source>Eur Psychiatr</source><year>2022</year><month>06</month><volume>65</volume><issue>S1</issue><fpage>S583</fpage><lpage>S584</lpage><pub-id pub-id-type="doi">10.1192/j.eurpsy.2022.1495</pub-id></nlm-citation></ref><ref id="ref56"><label>56</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>Laser</surname><given-names>E</given-names> </name><name name-style="western"><surname>Sassack</surname><given-names>M</given-names> </name></person-group><article-title>Treating bulimia with hypnosis and low-level light therapy: a case report</article-title><conf-name>SPIE BiOS</conf-name><conf-date>Jan 21-26, 2012</conf-date><conf-loc>San Francisco, CA, United States</conf-loc><pub-id pub-id-type="doi">10.1117/12.905375</pub-id></nlm-citation></ref><ref id="ref57"><label>57</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Morgan</surname><given-names>CD</given-names> </name><name name-style="western"><surname>Marsh</surname><given-names>C</given-names> </name></person-group><article-title>Bulimia nervosa in an elderly male: a case report</article-title><source>Int J Eat Disord</source><year>2006</year><month>03</month><volume>39</volume><issue>2</issue><fpage>170</fpage><lpage>171</lpage><pub-id pub-id-type="doi">10.1002/eat.20212</pub-id><pub-id pub-id-type="medline">16252279</pub-id></nlm-citation></ref><ref id="ref58"><label>58</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Sansone</surname><given-names>RA</given-names> </name><name name-style="western"><surname>Naqvi</surname><given-names>A</given-names> </name><name name-style="western"><surname>Sansone</surname><given-names>LA</given-names> </name></person-group><article-title>An unusual cause of dizziness in bulimia nervosa: a case report</article-title><source>Int J Eat Disord</source><year>2005</year><month>05</month><volume>37</volume><issue>4</issue><fpage>364</fpage><lpage>366</lpage><pub-id pub-id-type="doi">10.1002/eat.20095</pub-id><pub-id pub-id-type="medline">15856497</pub-id></nlm-citation></ref><ref id="ref59"><label>59</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Hays</surname><given-names>RD</given-names> </name><name name-style="western"><surname>Sherbourne</surname><given-names>CD</given-names> </name><name name-style="western"><surname>Mazel</surname><given-names>RM</given-names> </name></person-group><article-title>The RAND 36-Item Health Survey 1.0</article-title><source>Health Econ</source><year>1993</year><month>10</month><volume>2</volume><issue>3</issue><fpage>217</fpage><lpage>227</lpage><pub-id pub-id-type="doi">10.1002/hec.4730020305</pub-id><pub-id pub-id-type="medline">8275167</pub-id></nlm-citation></ref><ref id="ref60"><label>60</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Jenkins</surname><given-names>PE</given-names> </name><name name-style="western"><surname>Hoste</surname><given-names>RR</given-names> </name><name name-style="western"><surname>Doyle</surname><given-names>AC</given-names> </name><etal/></person-group><article-title>Health-related quality of life among adolescents with eating disorders</article-title><source>J Psychosom Res</source><year>2014</year><month>01</month><volume>76</volume><issue>1</issue><fpage>1</fpage><lpage>5</lpage><pub-id pub-id-type="doi">10.1016/j.jpsychores.2013.11.006</pub-id><pub-id pub-id-type="medline">24360133</pub-id></nlm-citation></ref><ref id="ref61"><label>61</label><nlm-citation citation-type="book"><person-group person-group-type="author"><name name-style="western"><surname>Ware</surname><given-names>JE</given-names> </name></person-group><source>SF-36 Physical and Mental Health Summary Scales: A User&#x2019;s Manual</source><year>1994</year><publisher-name>The Health Institute, New England Medical Center Hospitals</publisher-name></nlm-citation></ref><ref id="ref62"><label>62</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Andersen</surname><given-names>JR</given-names> </name><name name-style="western"><surname>Breivik</surname><given-names>K</given-names> </name><name name-style="western"><surname>Engelund</surname><given-names>IE</given-names> </name><etal/></person-group><article-title>Correlated physical and mental health composite scores for the RAND-36 and RAND-12 health surveys: can we keep them simple?</article-title><source>Health Qual Life Outcomes</source><year>2022</year><month>06</month><day>3</day><volume>20</volume><issue>1</issue><fpage>89</fpage><pub-id pub-id-type="doi">10.1186/s12955-022-01992-0</pub-id><pub-id pub-id-type="medline">35659237</pub-id></nlm-citation></ref><ref id="ref63"><label>63</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Fairburn</surname><given-names>CG</given-names> </name><name name-style="western"><surname>Beglin</surname><given-names>SJ</given-names> </name></person-group><article-title>Assessment of eating disorders: interview or self-report questionnaire?</article-title><source>Int J Eat Disord</source><year>1994</year><month>12</month><volume>16</volume><issue>4</issue><fpage>363</fpage><lpage>370</lpage><pub-id pub-id-type="medline">7866415</pub-id></nlm-citation></ref><ref id="ref64"><label>64</label><nlm-citation citation-type="web"><source>RStudio: Integrated Development Environment for R</source><access-date>2025-02-24</access-date><comment><ext-link ext-link-type="uri" xlink:href="http://www.rstudio.com/">http://www.rstudio.com/</ext-link></comment></nlm-citation></ref><ref id="ref65"><label>65</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Bates</surname><given-names>D</given-names> </name><name name-style="western"><surname>M&#x00E4;chler</surname><given-names>M</given-names> </name><name name-style="western"><surname>Bolker</surname><given-names>B</given-names> </name><name name-style="western"><surname>Walker</surname><given-names>S</given-names> </name></person-group><article-title>Fitting linear mixed-effects models using lme4</article-title><source>J Stat Softw</source><year>2015</year><volume>67</volume><issue>1</issue><fpage>1</fpage><lpage>48</lpage><pub-id pub-id-type="doi">10.18637/jss.v067.i01</pub-id></nlm-citation></ref><ref id="ref66"><label>66</label><nlm-citation citation-type="book"><person-group person-group-type="author"><name name-style="western"><surname>Bliese</surname><given-names>PD</given-names> </name></person-group><article-title>Within-group agreement, non-independence, and reliability: implications for data aggregation and analysis</article-title><source>Multilevel Theory, Research, and Methods in Organizations: Foundations, Extensions, and New Directions</source><year>2000</year><publisher-name>Jossey-Bass/Wiley</publisher-name><fpage>349</fpage><lpage>381</lpage></nlm-citation></ref><ref id="ref67"><label>67</label><nlm-citation citation-type="book"><person-group person-group-type="author"><name name-style="western"><surname>Wickham</surname><given-names>H</given-names> </name></person-group><source>Data Analysis</source><year>2016</year><publisher-name>Springer</publisher-name></nlm-citation></ref><ref id="ref68"><label>68</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Dettori</surname><given-names>JR</given-names> </name><name name-style="western"><surname>Norvell</surname><given-names>DC</given-names> </name><name name-style="western"><surname>Chapman</surname><given-names>JR</given-names> </name></person-group><article-title>Clinically important difference: 4 tips toward a better understanding</article-title><source>Global Spine J</source><year>2022</year><month>07</month><volume>12</volume><issue>6</issue><fpage>1297</fpage><lpage>1298</lpage><pub-id pub-id-type="doi">10.1177/21925682221092721</pub-id><pub-id pub-id-type="medline">35393866</pub-id></nlm-citation></ref><ref id="ref69"><label>69</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Ferguson</surname><given-names>RJ</given-names> </name><name name-style="western"><surname>Robinson</surname><given-names>AB</given-names> </name><name name-style="western"><surname>Splaine</surname><given-names>M</given-names> </name></person-group><article-title>Use of the reliable change index to evaluate clinical significance in SF-36 outcomes</article-title><source>Qual Life Res</source><year>2002</year><month>09</month><volume>11</volume><issue>6</issue><fpage>509</fpage><lpage>516</lpage><pub-id pub-id-type="doi">10.1023/a:1016350431190</pub-id><pub-id pub-id-type="medline">12206571</pub-id></nlm-citation></ref><ref id="ref70"><label>70</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Samsa</surname><given-names>G</given-names> </name><name name-style="western"><surname>Edelman</surname><given-names>D</given-names> </name><name name-style="western"><surname>Rothman</surname><given-names>ML</given-names> </name><name name-style="western"><surname>Williams</surname><given-names>GR</given-names> </name><name name-style="western"><surname>Lipscomb</surname><given-names>J</given-names> </name><name name-style="western"><surname>Matchar</surname><given-names>D</given-names> </name></person-group><article-title>Determining clinically important differences in health status measures: a general approach with illustration to the Health Utilities Index Mark II</article-title><source>Pharmacoeconomics</source><year>1999</year><month>02</month><volume>15</volume><issue>2</issue><fpage>141</fpage><lpage>155</lpage><pub-id pub-id-type="doi">10.2165/00019053-199915020-00003</pub-id><pub-id pub-id-type="medline">10351188</pub-id></nlm-citation></ref><ref id="ref71"><label>71</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Padierna</surname><given-names>A</given-names> </name><name name-style="western"><surname>Quintana</surname><given-names>JM</given-names> </name><name name-style="western"><surname>Arostegui</surname><given-names>I</given-names> </name><name name-style="western"><surname>Gonzalez</surname><given-names>N</given-names> </name><name name-style="western"><surname>Horcajo</surname><given-names>MJ</given-names> </name></person-group><article-title>Changes in health related quality of life among patients treated for eating disorders</article-title><source>Qual Life Res</source><year>2002</year><month>09</month><volume>11</volume><issue>6</issue><fpage>545</fpage><lpage>552</lpage><pub-id pub-id-type="doi">10.1023/a:1016324527729</pub-id><pub-id pub-id-type="medline">12206575</pub-id></nlm-citation></ref><ref id="ref72"><label>72</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Jennings</surname><given-names>KM</given-names> </name><name name-style="western"><surname>Phillips</surname><given-names>KE</given-names> </name></person-group><article-title>Eating disorder examination-questionnaire (EDE-Q): norms for clinical sample of female adolescents with anorexia nervosa</article-title><source>Arch Psychiatr Nurs</source><year>2017</year><month>12</month><volume>31</volume><issue>6</issue><fpage>578</fpage><lpage>581</lpage><pub-id pub-id-type="doi">10.1016/j.apnu.2017.08.002</pub-id><pub-id pub-id-type="medline">29179824</pub-id></nlm-citation></ref><ref id="ref73"><label>73</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Aardoom</surname><given-names>JJ</given-names> </name><name name-style="western"><surname>Dingemans</surname><given-names>AE</given-names> </name><name name-style="western"><surname>Slof Op&#x2019;t Landt</surname><given-names>MCT</given-names> </name><name name-style="western"><surname>Van Furth</surname><given-names>EF</given-names> </name></person-group><article-title>Norms and discriminative validity of the Eating Disorder Examination Questionnaire (EDE-Q)</article-title><source>Eat Behav</source><year>2012</year><month>12</month><volume>13</volume><issue>4</issue><fpage>305</fpage><lpage>309</lpage><pub-id pub-id-type="doi">10.1016/j.eatbeh.2012.09.002</pub-id><pub-id pub-id-type="medline">23121779</pub-id></nlm-citation></ref><ref id="ref74"><label>74</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Jennings</surname><given-names>KM</given-names> </name><name name-style="western"><surname>Phillips</surname><given-names>KE</given-names> </name></person-group><article-title>Eating disorder examination-questionnaire (EDE-Q): norms for a clinical sample of males</article-title><source>Arch Psychiatr Nurs</source><year>2017</year><month>02</month><volume>31</volume><issue>1</issue><fpage>73</fpage><lpage>76</lpage><pub-id pub-id-type="doi">10.1016/j.apnu.2016.08.004</pub-id><pub-id pub-id-type="medline">28104062</pub-id></nlm-citation></ref><ref id="ref75"><label>75</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Padierna</surname><given-names>A</given-names> </name><name name-style="western"><surname>Quintana</surname><given-names>JM</given-names> </name><name name-style="western"><surname>Arostegui</surname><given-names>I</given-names> </name><name name-style="western"><surname>Gonzalez</surname><given-names>N</given-names> </name><name name-style="western"><surname>Horcajo</surname><given-names>MJ</given-names> </name></person-group><article-title>The health-related quality of life in eating disorders</article-title><source>Qual Life Res</source><year>2000</year><volume>9</volume><issue>6</issue><fpage>667</fpage><lpage>674</lpage><pub-id pub-id-type="doi">10.1023/a:1008973106611</pub-id><pub-id pub-id-type="medline">11236856</pub-id></nlm-citation></ref><ref id="ref76"><label>76</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Doll</surname><given-names>HA</given-names> </name><name name-style="western"><surname>Petersen</surname><given-names>SE</given-names> </name><name name-style="western"><surname>Stewart-Brown</surname><given-names>SL</given-names> </name></person-group><article-title>Eating disorders and emotional and physical well-being: associations between student self-reports of eating disorders and quality of life as measured by the SF-36</article-title><source>Qual Life Res</source><year>2005</year><month>04</month><volume>14</volume><issue>3</issue><fpage>705</fpage><lpage>717</lpage><pub-id pub-id-type="doi">10.1007/s11136-004-0792-0</pub-id><pub-id pub-id-type="medline">16022064</pub-id></nlm-citation></ref><ref id="ref77"><label>77</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>O&#x2019;Connor</surname><given-names>C</given-names> </name><name name-style="western"><surname>McNamara</surname><given-names>N</given-names> </name><name name-style="western"><surname>O&#x2019;Hara</surname><given-names>L</given-names> </name><name name-style="western"><surname>McNicholas</surname><given-names>M</given-names> </name><name name-style="western"><surname>McNicholas</surname><given-names>F</given-names> </name></person-group><article-title>How do people with eating disorders experience the stigma associated with their condition? A mixed-methods systematic review</article-title><source>J Ment Health</source><year>2021</year><month>07</month><day>4</day><volume>30</volume><issue>4</issue><fpage>454</fpage><lpage>469</lpage><pub-id pub-id-type="doi">10.1080/09638237.2019.1685081</pub-id></nlm-citation></ref><ref id="ref78"><label>78</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Bakkum</surname><given-names>MJ</given-names> </name><name name-style="western"><surname>Hartjes</surname><given-names>MG</given-names> </name><name name-style="western"><surname>Pi&#x00EB;t</surname><given-names>JD</given-names> </name><etal/></person-group><article-title>Using artificial intelligence to create diverse and inclusive medical case vignettes for education</article-title><source>Brit J Clinical Pharma</source><year>2024</year><month>03</month><volume>90</volume><issue>3</issue><fpage>640</fpage><lpage>648</lpage><pub-id pub-id-type="doi">10.1111/bcp.15977</pub-id></nlm-citation></ref><ref id="ref79"><label>79</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Li</surname><given-names>J</given-names> </name><name name-style="western"><surname>Dada</surname><given-names>A</given-names> </name><name name-style="western"><surname>Puladi</surname><given-names>B</given-names> </name><name name-style="western"><surname>Kleesiek</surname><given-names>J</given-names> </name><name name-style="western"><surname>Egger</surname><given-names>J</given-names> </name></person-group><article-title>ChatGPT in healthcare: a taxonomy and systematic review</article-title><source>Comput Methods Programs Biomed</source><year>2024</year><month>03</month><volume>245</volume><fpage>108013</fpage><pub-id pub-id-type="doi">10.1016/j.cmpb.2024.108013</pub-id></nlm-citation></ref><ref id="ref80"><label>80</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>Yang</surname><given-names>K</given-names> </name><name name-style="western"><surname>Zhang</surname><given-names>T</given-names> </name><name name-style="western"><surname>Kuang</surname><given-names>Z</given-names> </name><name name-style="western"><surname>Xie</surname><given-names>Q</given-names> </name><name name-style="western"><surname>Huang</surname><given-names>J</given-names> </name><name name-style="western"><surname>Ananiadou</surname><given-names>S</given-names> </name></person-group><article-title>MentaLLaMA: interpretable mental health analysis on social media with large language models</article-title><conf-name>WWW &#x2019;24: Proceedings of the ACM Web Conference 2024</conf-name><conf-date>May 13-17, 2024</conf-date><conf-loc>Singapore, Singapore</conf-loc><pub-id pub-id-type="doi">10.1145/3589334.3648137</pub-id></nlm-citation></ref><ref id="ref81"><label>81</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Liu</surname><given-names>F</given-names> </name><name name-style="western"><surname>Yang</surname><given-names>K</given-names> </name><name name-style="western"><surname>Hua</surname><given-names>Y</given-names> </name><etal/></person-group><article-title>Large language models in mental health care: a scoping review</article-title><source>arXiv</source><year>Preprint posted online on 2024</year><comment>arXiv:2401.02984</comment></nlm-citation></ref><ref id="ref82"><label>82</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Ray</surname><given-names>PP</given-names> </name></person-group><article-title>Benchmarking, ethical alignment, and evaluation framework for conversational AI: advancing responsible development of ChatGPT</article-title><source>BenchCouncil Transact Benchmark Stand Eval</source><year>2023</year><month>09</month><volume>3</volume><issue>3</issue><fpage>100136</fpage><pub-id pub-id-type="doi">10.1016/j.tbench.2023.100136</pub-id></nlm-citation></ref></ref-list><app-group><supplementary-material id="app1"><label>Multimedia Appendix 1</label><p>Additional analysis with MentaLLaMA.</p><media xlink:href="mental_v12i1e57986_app1.docx" xlink:title="DOCX File, 23 KB"/></supplementary-material></app-group></back></article>