<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article article-type="research-article" dtd-version="2.0" xmlns:xlink="http://www.w3.org/1999/xlink">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMH</journal-id>
      <journal-id journal-id-type="nlm-ta">JMIR Ment Health</journal-id>
      <journal-title>JMIR Mental Health</journal-title>
      <issn pub-type="epub">2368-7959</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v11i1e58129</article-id>
      <article-id pub-id-type="pmid">38876484</article-id>
      <article-id pub-id-type="doi">10.2196/58129</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Large Language Models Versus Expert Clinicians in Crisis Prediction Among Telemental Health Patients: Comparative Study</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Tal</surname>
            <given-names>Amir</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Malgaroli</surname>
            <given-names>Matteo</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Baker</surname>
            <given-names>Justin C</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Irigoyen-Otinano</surname>
            <given-names>Maria</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author">
          <name name-style="western">
            <surname>Lee</surname>
            <given-names>Christine</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-2729-3777</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author">
          <name name-style="western">
            <surname>Mohebbi</surname>
            <given-names>Matthew</given-names>
          </name>
          <degrees>BS</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0009-0006-4929-3483</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author">
          <name name-style="western">
            <surname>O'Callaghan</surname>
            <given-names>Erin</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-8212-9278</ext-link>
        </contrib>
        <contrib id="contrib4" contrib-type="author" corresp="yes">
          <name name-style="western">
            <surname>Winsberg</surname>
            <given-names>Mirène</given-names>
          </name>
          <degrees>MD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <address>
            <institution>Brightside Health</institution>
            <addr-line>2261 Market Street</addr-line>
            <addr-line>STE 10222</addr-line>
            <addr-line>San Francisco, CA, 94114</addr-line>
            <country>United States</country>
            <phone>1 415 279 2042</phone>
            <email>mimi.winsberg@brightside.com</email>
          </address>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-9637-8133</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>Brightside Health</institution>
        <addr-line>San Francisco, CA</addr-line>
        <country>United States</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Mirène Winsberg <email>mimi.winsberg@brightside.com</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <year>2024</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>2</day>
        <month>8</month>
        <year>2024</year>
      </pub-date>
      <volume>11</volume>
      <elocation-id>e58129</elocation-id>
      <history>
        <date date-type="received">
          <day>6</day>
          <month>3</month>
          <year>2024</year>
        </date>
        <date date-type="rev-request">
          <day>20</day>
          <month>4</month>
          <year>2024</year>
        </date>
        <date date-type="rev-recd">
          <day>11</day>
          <month>6</month>
          <year>2024</year>
        </date>
        <date date-type="accepted">
          <day>14</day>
          <month>6</month>
          <year>2024</year>
        </date>
      </history>
      <copyright-statement>©Christine Lee, Matthew Mohebbi, Erin O'Callaghan, Mirène Winsberg. Originally published in JMIR Mental Health (https://mental.jmir.org), 02.08.2024.</copyright-statement>
      <copyright-year>2024</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Mental Health, is properly cited. The complete bibliographic information, a link to the original publication on https://mental.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://mental.jmir.org/2024/1/e58129" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>Due to recent advances in artificial intelligence, large language models (LLMs) have emerged as a powerful tool for a variety of language-related tasks, including sentiment analysis and summarization of provider-patient interactions. However, there is limited research on these models in the area of crisis prediction.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>This study aimed to evaluate the performance of LLMs, specifically OpenAI’s generative pretrained transformer 4 (GPT-4), in predicting current and future mental health crisis episodes using patient-provided information at intake among users of a national telemental health platform.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>Deidentified patient-provided data were pulled from specific intake questions of the Brightside telehealth platform, including the chief complaint, for 140 patients who indicated suicidal ideation (SI), and another 120 patients who later indicated SI with a plan during the course of treatment. Similar data were pulled for 200 randomly selected patients, treated during the same time period, who never endorsed SI. In total, 6 senior Brightside clinicians (3 psychologists and 3 psychiatrists) were shown patients’ self-reported chief complaint and self-reported suicide attempt history but were blinded to the future course of treatment and other reported symptoms, including SI. They were asked a simple yes or no question regarding their prediction of endorsement of SI with plan, along with their confidence level about the prediction. GPT-4 was provided with similar information and asked to answer the same questions, enabling us to directly compare the performance of artificial intelligence and clinicians.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>Overall, the clinicians’ average precision (0.7) was higher than that of GPT-4 (0.6) in identifying the SI with plan at intake (n=140) versus no SI (n=200) when using the chief complaint alone, while sensitivity was higher for the GPT-4 (0.62) than the clinicians’ average (0.53). The addition of suicide attempt history increased the clinicians’ average sensitivity (0.59) and precision (0.77) while increasing the GPT-4 sensitivity (0.59) but decreasing the GPT-4 precision (0.54). Performance decreased comparatively when predicting future SI with plan (n=120) versus no SI (n=200) with a chief complaint only for the clinicians (average sensitivity=0.4; average precision=0.59) and the GPT-4 (sensitivity=0.46; precision=0.48). The addition of suicide attempt history increased performance comparatively for the clinicians (average sensitivity=0.46; average precision=0.69) and the GPT-4 (sensitivity=0.74; precision=0.48).</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>GPT-4, with a simple prompt design, produced results on some metrics that approached those of a trained clinician. Additional work must be done before such a model can be piloted in a clinical setting. The model should undergo safety checks for bias, given evidence that LLMs can perpetuate the biases of the underlying data on which they are trained. We believe that LLMs hold promise for augmenting the identification of higher-risk patients at intake and potentially delivering more timely care to patients.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>mental health</kwd>
        <kwd>telehealth</kwd>
        <kwd>PHQ-9</kwd>
        <kwd>Patient Health Questionnaire-9</kwd>
        <kwd>suicidal ideation</kwd>
        <kwd>AI</kwd>
        <kwd>LLM</kwd>
        <kwd>OpenAI</kwd>
        <kwd>GPT-4</kwd>
        <kwd>generative pretrained transformer 4</kwd>
        <kwd>tele-mental health</kwd>
        <kwd>large language model</kwd>
        <kwd>clinician</kwd>
        <kwd>clinicians</kwd>
        <kwd>artificial intelligence</kwd>
        <kwd>patient information</kwd>
        <kwd>suicide</kwd>
        <kwd>suicidal</kwd>
        <kwd>mental disorder</kwd>
        <kwd>suicide attempt</kwd>
        <kwd>psychologist</kwd>
        <kwd>psychologists</kwd>
        <kwd>psychiatrist</kwd>
        <kwd>psychiatrists</kwd>
        <kwd>psychiatry</kwd>
        <kwd>clinical setting</kwd>
        <kwd>self-reported</kwd>
        <kwd>treatment</kwd>
        <kwd>medication</kwd>
        <kwd>digital mental health</kwd>
        <kwd>machine learning</kwd>
        <kwd>language model</kwd>
        <kwd>suicide</kwd>
        <kwd>crisis</kwd>
        <kwd>telemental health</kwd>
        <kwd>tele health</kwd>
        <kwd>e-health</kwd>
        <kwd>digital health</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <sec>
        <title>Background</title>
        <p>Suicide is a serious public health concern. Suicide rates have risen at an alarming rate in the past 20 years, and in the United States, suicide is the second leading cause of death in adults aged 18-45 years [<xref ref-type="bibr" rid="ref1">1</xref>]. In 2021, approximately 50,000 people in the United States died by suicide, which marks the highest national rate of suicide in decades [<xref ref-type="bibr" rid="ref2">2</xref>]. As suicide rates increase, the behavioral health care workforce in the United States has not expanded enough to keep up with these mental health demands, limiting the timely access to care that is essential for suicide risk detection and prevention [<xref ref-type="bibr" rid="ref3">3</xref>].</p>
        <p>Suicide risk is difficult to predict. Research has demonstrated that there are numerous individual, relationship, community, and societal risk factors associated with suicide, such as history of previous suicide attempts, psychiatric diagnosis, sense of hopelessness, social isolation, community violence, and access to lethal means of suicide [<xref ref-type="bibr" rid="ref4">4</xref>-<xref ref-type="bibr" rid="ref9">9</xref>]. More recently, suicide theories and research suggest ideation-to-action pathways to help explain suicide risk, where people who think about suicide are at a higher risk of participating in suicidal behavior [<xref ref-type="bibr" rid="ref10">10</xref>-<xref ref-type="bibr" rid="ref13">13</xref>].</p>
        <p>Suicidal ideation (SI), which is defined as “thinking about, considering, or planning suicide” [<xref ref-type="bibr" rid="ref14">14</xref>], is common, with 12.3 million Americans aged 18 years and older having thoughts of suicide in 2021 [<xref ref-type="bibr" rid="ref15">15</xref>]. SI is predictive of suicide attempts and completed suicide [<xref ref-type="bibr" rid="ref16">16</xref>,<xref ref-type="bibr" rid="ref17">17</xref>]. SI is also a more sensitive predictor of lifetime risk for suicide than imminent risk [<xref ref-type="bibr" rid="ref18">18</xref>]. Research has suggested that among those exhibiting SI, there is a 29% conditional probability of making a suicide attempt [<xref ref-type="bibr" rid="ref19">19</xref>]. Other research has shown that those with nearly daily SI were 5 to 8 times more likely to attempt suicide and 3 to 11 times more likely to die by suicide within 30 days [<xref ref-type="bibr" rid="ref20">20</xref>].</p>
        <p>Artificial intelligence (AI) methods have been used for assessing mental health factors such as psychiatric symptom severity, diagnosis, and clinical risk using free text generated by the patient. Researchers using natural language processing (NLP) and machine learning (ML) were able to identify suicidal behavior from electronic medical records [<xref ref-type="bibr" rid="ref21">21</xref>] and detect SI in a variety of different free-text settings [<xref ref-type="bibr" rid="ref22">22</xref>]. In addition, an NLP-based system to determine the likelihood of crisis in patient chat messages to their clinicians was developed and implemented with reliable retrospective and prospective performance as a clinical support tool for a crisis specialist team [<xref ref-type="bibr" rid="ref23">23</xref>].</p>
        <p>Recent advances in AI methods, such as large language models (LLMs), have also shown success in a variety of medical applications. Both generalist LLMs, such as generative pretrained transformer 4 (GPT-4), and medical domain–specific LLMs, such as Med-PaLM 2, have exhibited medical competency on benchmarks such as the United States Medical Licensing Examination (USMLE) [<xref ref-type="bibr" rid="ref24">24</xref>,<xref ref-type="bibr" rid="ref25">25</xref>]. Generalist LLMs can sometimes outperform the domain-specific LLMs, as was recently found with GPT-4 outperforming Med-PaLM 2 on the MedQA medical benchmark [<xref ref-type="bibr" rid="ref25">25</xref>]. Finally, Med-PaLM 2 was also found to be effective at determining psychiatric functioning from free text, including patient-generated information during patient interviews [<xref ref-type="bibr" rid="ref26">26</xref>].</p>
      </sec>
      <sec>
        <title>Objective</title>
        <p>We seek to leverage the capabilities of LLMs to detect or predict SI with plan among patients enrolled in a national telemental health platform, using patient-generated free text at intake. We will benchmark the performance of this LLM-based prediction against a cohort of senior mental health clinician experts.</p>
      </sec>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Overview</title>
        <p>The study consisted of clinicians completing a digital questionnaire where they were asked to predict whether a patient would endorse SI with a plan during the course of their treatment, based on patient-generated text describing their chief complaint. The same chief complaint texts were then served to the LLM GPT-4 with the same questionnaire instructions. The classification performance of the clinicians and GPT-4 was evaluated and compared.</p>
        <sec>
          <title>Data Acquisition</title>
          <p>The retrospective patient data used in this study were collected as part of the standard of care at Brightside Health and deidentified for research purposes. All patients treated at Brightside consent at intake to the terms of use and privacy policy that include consenting to Brightside’s use of their data for research purposes.</p>
        </sec>
        <sec>
          <title>Inclusion Criteria</title>
          <p>Data from patients who completed intake on the Brightside platform after March 15, 2023, and endorsed current SI (at intake) or subsequent SI (post intake and during the course of treatment) were included in the study set, along with a random cohort of patients treated during the same time frame who never endorsed SI with plan. In order to be included in the study sample, patients had to attend at least 1 psychiatric or therapy appointment and complete the chief complaint section of their digital intake form. Patients who left the chief complaint section empty were excluded.</p>
        </sec>
        <sec>
          <title>Data and Outcome Variables</title>
          <p>Patient-generated free text (chief complaint) was extracted from patient intake as the answer to the question “In your own words, what are you feeling or experiencing?” and any personal identifiers (such as age, birthdate, name, location, email address, phone number, and social security number) within the free text were replaced with asterisks. In addition, patient data extracted from intake included age, gender identity, and history of previous suicide attempts. Clinicians and the LLM did not have access to the age or gender identity of the patients and were only shown deidentified patient-generated free text and then the patients’ self-reported history of suicide attempts.</p>
          <p>SI with plan was determined from answers to question 9 of the Patient Health Questionnaire-9 (PHQ-9). The PHQ-9 is a self-report questionnaire consisting of 9 questions that measure depression symptom severity within the past 2 weeks, each scored from 0 to 3 (not at all, several days, more than half the days, and nearly every day, respectively), and includes a specific question related to the frequency of suicidal thoughts (item 9). If a patient endorses SI on the Brightside platform (item 9 answer value &gt;0), a follow-up Brightside proprietary question asks whether the suicidal thoughts are something the patient has made specific plans for. At Brightside, the PHQ-9 is administered to all patients at intake and requested every 2 weeks during the course of treatment. PHQ-9 answers at intake and the date of the first SI with plan relative to intake were also extracted for this study.</p>
        </sec>
        <sec>
          <title>Classification Label Definitions</title>
          <p>The patients positive for SI with plan were defined as those who endorsed SI in the PHQ-9 at intake or at any point during the later course of treatment and subsequently responded that the SI was something they had made specific plans for. Patients negative for SI with plan were defined as those with no PHQ-9 item 9 values &gt;0, that is, those who had never endorsed SI in their PHQ-9 screenings.</p>
        </sec>
        <sec>
          <title>Clinician Questionnaire Design</title>
          <p>After the creation of the study data set, 6 clinicians employed at Brightside Health were recruited and all consented to participate in the study. Clinicians 1, 2, and 3 are senior psychiatrists with 18 to 30 years of clinical experience. Clinicians 4, 5, and 6 are senior psychologists with 10 to 23 years of clinical experience.</p>
          <p>Each clinician was presented with the same questionnaire with the same randomized order of questions. Presented with a patient’s deidentified chief complaint, they were asked to answer the following questions: (1) do you expect this patient to endorse SI with a plan in the course of their treatment? (yes or no) and (2) how confident are you? (high, medium, or low).</p>
          <p>The clinicians were then presented with additional information as to whether the patient endorsed a previous suicide attempt and reprompted with the same questions. All chief complaints and questions were displayed one at a time. Clinicians were given 2 weeks to complete the questionnaire with no other instructions or training and were not required to complete it in a single sitting.</p>
        </sec>
        <sec>
          <title>Large Language Model Prompt Design</title>
          <p>In this study, we evaluated OpenAI’s GPT-4 text-only model’s ability to predict whether a patient would endorse SI with plan during the course of treatment. All model results were produced in Python (Python Software Foundation) with OpenAI’s application programming interface and GPT-4 (“gpt-4-1106-preview” with default parameters) [<xref ref-type="bibr" rid="ref27">27</xref>].</p>
          <p>First, the model context was constructed using step-by-step instructions and few-shot prompting with 3 real examples of chief complaints and their respective correct, expected answers (<xref ref-type="boxed-text" rid="box1">Textbox 1</xref>). Note that the examples chosen for the few-shot prompting were not included in the study data set and were redacted for publication.</p>
          <boxed-text id="box1" position="float">
            <title>GPT-4 few-shot prompt template for predicting suicidal ideation with plan in chief complaint text.</title>
            <p>You are a trained psychiatric professional. You will be presented with a patient’s answer to the question “In your own words, what are you feeling or experiencing?” also referred to as a patient’s chief complaint.</p>
            <p>Your task is to determine based on a patient’s chief complaint, if that patient will endorse suicidal ideation with plan in the course of their treatment.</p>
            <p>You will generate your answer as JSON: {“at_risk”: “”, “confidence”: “”, “risk_indicators”: “[]”}</p>
            <p>Use the following step-by-step instructions to determine your answer:</p>
            <list list-type="bullet">
              <list-item>
                <p>Step 1. Answer in the key “at_risk” with only the values Yes or No</p>
              </list-item>
              <list-item>
                <p>Step 2. Answer in the key “confidence” with only the values High, Medium, or Low, how confident you are in your answer.</p>
              </list-item>
              <list-item>
                <p>Step 3. Answer in the key “risk_indicators” with one or more values from the list of possible risk indicators below that determined your Yes or No answer.</p>
              </list-item>
            </list>
            <p>Separate risk indicators with a “; ”.</p>
            <p>If Other, specify your answer as “Other-&lt;insert your answer&gt;”. If no risk indicators are identified, answer with None.</p>
            <p>List of possible risk indicators values:</p>
            <list list-type="bullet">
              <list-item>
                <p>Recent Stress, Loss, or Trauma</p>
              </list-item>
              <list-item>
                <p>History of Trauma</p>
              </list-item>
              <list-item>
                <p>Chronic medical conditions</p>
              </list-item>
              <list-item>
                <p>Substance use</p>
              </list-item>
              <list-item>
                <p>Previous suicide attempt</p>
              </list-item>
              <list-item>
                <p>Lack or loss of relationships or support</p>
              </list-item>
              <list-item>
                <p>Social isolation</p>
              </list-item>
              <list-item>
                <p>Family history of suicide</p>
              </list-item>
              <list-item>
                <p>Impulsive or aggressive language</p>
              </list-item>
              <list-item>
                <p>Explicit mentions of suicide, suicidal thoughts, or self harm</p>
              </list-item>
              <list-item>
                <p>Death imagery or metaphors</p>
              </list-item>
              <list-item>
                <p>Apathy, indifference or emotional detachment</p>
              </list-item>
              <list-item>
                <p>Sense of Hopelessness</p>
              </list-item>
              <list-item>
                <p>Other</p>
              </list-item>
            </list>
            <p>Here is an example of a chief complaint with a Yes to suicidal ideation with plan:</p>
            <p>“&lt;<italic>text redacted for publication</italic>&gt; ”</p>
            <p>Your answer would be:{“risk_indicators”: “Sense of Hopelessness; Social isolation; Explicit mentions of suicide, suicidal thoughts, or self harm”, “at_risk”: “Yes”, “confidence”: “High”}</p>
            <p>Here is an example of a chief complaint with a No to suicidal ideation with plan: “&lt;<italic>text redacted for publication</italic>&gt;”</p>
            <p>Your answer would be: {“risk_indicators”: “None”, “at_risk”: “No”, “confidence”: “High”}</p>
            <p>Here is an example of a chief complaint with a No to suicidal ideation with plan:</p>
            <p>“&lt;<italic>text redacted for publication</italic>&gt;”</p>
            <p>Your answer would be: {“risk_indicators”: “None”, “at_risk”: “No”,“confidence”: “High”}</p>
          </boxed-text>
          <p>Next, the output format of the model was specified as JavaScript Object Notation for ease of analysis. In addition to the prediction of SI with plan during the course of treatment, the model was also asked to provide a confidence level (high, medium, or low) for the prediction (similar to the clinicians’ questionnaire) and to provide reasoning from a list of explicitly provided risk indicators.</p>
          <p>Finally, the deidentified patient-generated chief complaint text was given to the model in the user prompt. Each chief complaint was provided independently and then the LLM was reset back to the original context.</p>
          <p>In order to evaluate the model’s performance when served the additional information of patient self-reported previous suicide attempts, the sentence “I have attempted suicide before” or “I have never attempted suicide before” was appended to the end of the chief complaint and served as the prompt with the same context.</p>
        </sec>
        <sec>
          <title>Performance Analysis</title>
          <p>All analyses were performed in Python 3.8.12 with the package scikit-learn version 1.3.1 [<xref ref-type="bibr" rid="ref28">28</xref>]. For comparison of performance, analyses were performed on patients positive for SI with plan at intake versus patients negative for SI during the entire course of treatment, as well as on patients positive for SI with plan post intake versus the same data set of patients negative for SI during treatment.</p>
        </sec>
        <sec>
          <title>Classification and Predictive Performance</title>
          <p>Clinician and model performances in the ability to predict whether a chief complaint text sample was positive for SI with plan, at intake, and post intake, were evaluated for accuracy, sensitivity, specificity, and precision. Accuracy was defined as the proportion of correctly predicted samples over the total number of samples. Precision (or positive predictive value) was defined as the proportion of correctly predicted positive samples over the total number of predicted positive samples. Sensitivity was defined as the proportion of correctly predicted positive samples over the total number of positive samples. Specificity was defined as the proportion of correctly predicted negative samples over the total number of negative samples. As an additional baseline reference, previous suicide attempt information (yes or no) as a stand-alone predictor was also included in the evaluation.</p>
        </sec>
        <sec>
          <title>Clinician and Large Language Model Agreement</title>
          <p>To measure the agreement between the clinicians’ and GPT-4’s predictions, the Cohen κ statistic, which measures interrater agreement for categorical data, was calculated for each clinician and GPT-4 pairing.</p>
        </sec>
        <sec>
          <title>Clinical Consensus and Confidence</title>
          <p>Clinical consensus was defined as instances in which all clinicians answered with the same predicted outcome for a given sample, regardless of whether the prediction was correct. Rates of clinical consensus and rates of confidence were calculated to measure the variability and difficulty of clinical assessments on the given samples.</p>
        </sec>
      </sec>
      <sec>
        <title>Accuracy of Clinical Consensus Influence on Large Language Model Performance</title>
        <p>To measure the influence of the accuracy of clinical consensus on GPT-4 performance, subsets of chief complaint text samples where at least 1, 2, 3, 4, 5, or all 6 clinicians not only agreed but also correctly predicted the outcome for a given sample were evaluated for GPT-4 accuracy, sensitivity, specificity, and precision.</p>
      </sec>
      <sec>
        <title>Risk Indicator Language and Clinician Performance</title>
        <p>The GPT-4 prompt included a request to provide the rationale for its prediction from a list of explicitly provided risk indicators (<xref ref-type="boxed-text" rid="box1">Textbox 1</xref>). Clinician performance was then re-evaluated on patient chief complaints with no GPT-4–identified risk indicators as a way to understand how difficult these cases were for clinical experts.</p>
        <p>Due to the generative nature of an LLM, GPT-4 occasionally will produce an answer that is not from the list of those that are explicitly defined in the instructions. For the purpose of this analysis, only the following explicit risk indicators defined as exact string match were assessed: “recent stress, loss, or trauma,” “history of trauma,” “chronic medical conditions,” “substance use,” “previous suicide attempt,” “lack or loss of relationships or support,” “social isolation,” “family history of suicide,” “impulsive or aggressive language,” “explicit mentions of suicide, suicidal thoughts, or self-harm,” “death imagery or metaphors,” “apathy, indifference or emotional detachment,” and “sense of hopelessness.”</p>
      </sec>
      <sec>
        <title>Ethical Considerations</title>
        <p>This study was conducted according to the guidelines of the Declaration of Helsinki and approved by the Institutional Review Board of WCG (protocol 20240207).</p>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>Overview</title>
        <p>At the conclusion of the study (December 13, 2023), 260 patients met inclusion criteria and were positive for SI with plan. A total of 140 patients were positive for SI with plan at the time of intake and 120 patients were positive for SI with plan post intake in their subsequent treatment. A random subset of 200 patients was selected from those who met the inclusion criteria and were negative for SI with plan. A summary of the data can be found in <xref ref-type="table" rid="table1">Table 1</xref>.</p>
        <table-wrap position="float" id="table1">
          <label>Table 1</label>
          <caption>
            <p>Summary of data for patients with no SI with plan (n=200), SI with plan indicated at intake (n=140), and SI with plan indicated post intake (n=120).</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="310"/>
            <col width="200"/>
            <col width="220"/>
            <col width="240"/>
            <thead>
              <tr valign="top">
                <td colspan="2">
                  <break/>
                </td>
                <td>No SI with plan (n=200)</td>
                <td>SI with plan at intake (n=140)</td>
                <td>SI with plan post intake (n=120)</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="2">Age (years), mean (95% CI)</td>
                <td>37.2 (35.7-38.9)</td>
                <td>34.4 (32.5-36.3)</td>
                <td>32.4 (30.3-34.5)</td>
              </tr>
              <tr valign="top">
                <td colspan="5">
                  <bold>Gender identity, n (%)</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Women</td>
                <td>135 (67.5)</td>
                <td>76 (54.3)</td>
                <td>59 (49.2)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Men</td>
                <td>64 (32)</td>
                <td>57 (40.7)</td>
                <td>59 (49.2)</td>
              </tr>
              <tr valign="top">
                <td colspan="5">
                  <bold>Ethnicity, n (%)</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>White</td>
                <td>152 (76)</td>
                <td>94 (67.1)</td>
                <td>73 (60.8)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Hispanic</td>
                <td>16 (8)</td>
                <td>20 (14.3)</td>
                <td>14 (11.7)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Black</td>
                <td>13 (6.5)</td>
                <td>13 (9.3)</td>
                <td>16 (13.3)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Asian</td>
                <td>10 (5)</td>
                <td>6 (4.3)</td>
                <td>8 (6.7)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Other</td>
                <td>9 (4.5)</td>
                <td>7 (5)</td>
                <td>9 (7.5)</td>
              </tr>
              <tr valign="top">
                <td colspan="2">Average chief complaint word count (95% CI)</td>
                <td>49.6 (41.3-57.9)</td>
                <td>58 (33-83.1)</td>
                <td>57.2 (44.2-70.3)</td>
              </tr>
              <tr valign="top">
                <td colspan="2">Average days between first SI with plan date and chief complaint (95% CI)</td>
                <td>—<sup>a</sup></td>
                <td>0 (0)</td>
                <td>62.6 (52.4-72.8)</td>
              </tr>
              <tr valign="top">
                <td colspan="2">Average PHQ-9<sup>b</sup> total score at first SI with plan (95% CI)</td>
                <td>—</td>
                <td>21.1 (20.2-21.9)</td>
                <td>19.0 (17.8-20.2)</td>
              </tr>
              <tr valign="top">
                <td colspan="5">
                  <bold>Number of patients with PHQ-9 item 9 score value at first SI with plan, n (%)</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>0</td>
                <td>—</td>
                <td>0 (0)</td>
                <td>0 (0)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>1</td>
                <td>—</td>
                <td>32 (22.9)</td>
                <td>34 (28.3)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>2</td>
                <td>—</td>
                <td>34 (24.3)</td>
                <td>29 (24.2)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>3</td>
                <td>—</td>
                <td>74 (52.9)</td>
                <td>57 (47.5)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>With specific plan</td>
                <td>—</td>
                <td>140 (100)</td>
                <td>120 (100)</td>
              </tr>
              <tr valign="top">
                <td colspan="2">Average PHQ-9 total score at intake (95% CI)</td>
                <td>13.5 (12.7-14.2)</td>
                <td>20.9 (20.1-21.7)</td>
                <td>18.3 (17.2-19.4)</td>
              </tr>
              <tr valign="top">
                <td colspan="5">
                  <bold>Number of patients with PHQ-9 item 9 score value at intake, n (%)</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>0</td>
                <td>200 (100)</td>
                <td>0 (0)</td>
                <td>34 (28.3)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>1</td>
                <td>0 (0)</td>
                <td>32 (22.9)</td>
                <td>34 (28.3)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>2</td>
                <td>0 (0)</td>
                <td>34 (24.3)</td>
                <td>20 (16.7)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>3</td>
                <td>0 (0)</td>
                <td>74 (52.9)</td>
                <td>32 (26.7)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>With specific plan</td>
                <td>0 (0)</td>
                <td>140 (100)</td>
                <td>0 (0)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Previous suicide attempt</td>
                <td>14 (7)</td>
                <td>55 (39.3)</td>
                <td>40 (33.3)</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table1fn1">
              <p><sup>a</sup>Not applicable.</p>
            </fn>
            <fn id="table1fn2">
              <p><sup>b</sup>PHQ-9: Patient Health Questionnaire-9.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
      <sec>
        <title>Prediction Performance</title>
        <sec>
          <title>Predicting SI With Plan at Intake</title>
          <p>Using a previous suicide attempt alone to predict SI with plan at the time of intake yielded performance similar to that of both GPT-4 and the clinicians, except for a low sensitivity of 0.39 (<xref ref-type="table" rid="table2">Table 2</xref>).</p>
          <p>GPT-4 performed with similar accuracy (0.67) and higher sensitivity (0.62) in predicting SI with plan at the time of intake based on the chief complaint text only, as compared with the average accuracy (0.7) and sensitivity (0.53) across our 6 clinician participants (<xref ref-type="table" rid="table2">Table 2</xref>). However, GPT-4 performed with lower specificity (0.71) and precision (0.6) than the average clinician specificity (0.82) and precision (0.7). The interrater agreement between GPT-4 and each clinician was moderate as indicated by an average Cohen κ of 0.49.</p>
          <p>Additional knowledge of the previous suicide attempt increased overall performance across clinicians (accuracy=0.75; sensitivity=0.59; specificity=0.86; precision=0.77). Additional knowledge of the previous suicide attempts significantly increased sensitivity for GPT-4 but decreased accuracy, specificity, and precision (accuracy=0.64; sensitivity=0.84; specificity=0.51; precision=0.54). The interrater agreement between GPT-4 and each clinician also decreased to an average Cohen κ of 0.39 with the additional information of the previous suicide attempts.</p>
          <table-wrap position="float" id="table2">
            <label>Table 2</label>
            <caption>
              <p>Performance results for predicting suicidal ideation with a plan at the time of intake and predicting suicidal ideation with a plan in the future post intake based solely on chief complaint versus chief complaint plus knowledge of the previous attempt for GPT-4 and 6 clinicians. The performance of the previous suicide attempt alone as a predictor is included for baseline reference.</p>
            </caption>
            <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
              <col width="30"/>
              <col width="30"/>
              <col width="130"/>
              <col width="0"/>
              <col width="90"/>
              <col width="0"/>
              <col width="90"/>
              <col width="0"/>
              <col width="90"/>
              <col width="0"/>
              <col width="90"/>
              <col width="0"/>
              <col width="80"/>
              <col width="0"/>
              <col width="90"/>
              <col width="0"/>
              <col width="90"/>
              <col width="0"/>
              <col width="90"/>
              <col width="0"/>
              <col width="100"/>
              <thead>
                <tr valign="top">
                  <td colspan="4">
                    <break/>
                  </td>
                  <td colspan="2">True negative, n</td>
                  <td colspan="2">False positive, n</td>
                  <td colspan="2">False negative, n</td>
                  <td colspan="2">True positive, n</td>
                  <td colspan="2">Accuracy</td>
                  <td colspan="2">Sensitivity</td>
                  <td colspan="2">Specificity</td>
                  <td colspan="2">Precision</td>
                  <td>Cohen κ with GPT-4</td>
                </tr>
              </thead>
              <tbody>
                <tr valign="top">
                  <td colspan="21">
                    <bold>SI with plan at intake (n=140) versus no SI with plan (n=200)</bold>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td colspan="2">Baseline for comparison: previous suicide attempts only</td>
                  <td colspan="2">186</td>
                  <td colspan="2">14</td>
                  <td colspan="2">85</td>
                  <td colspan="2">55</td>
                  <td colspan="2">0.71</td>
                  <td colspan="2">0.39</td>
                  <td colspan="2">0.93</td>
                  <td colspan="2">0.8</td>
                  <td colspan="2">—<sup>a</sup></td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td colspan="20">
                    <bold>Chief complaint text only</bold>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>GPT-4</td>
                  <td colspan="2">141</td>
                  <td colspan="2">59</td>
                  <td colspan="2">53</td>
                  <td colspan="2">87</td>
                  <td colspan="2">0.67</td>
                  <td colspan="2">0.62</td>
                  <td colspan="2">0.71</td>
                  <td colspan="2">0.6</td>
                  <td colspan="2">—</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>Clinician 1</td>
                  <td colspan="2">160</td>
                  <td colspan="2">40</td>
                  <td colspan="2">58</td>
                  <td colspan="2">82</td>
                  <td colspan="2">0.71</td>
                  <td colspan="2">0.59</td>
                  <td colspan="2">0.8</td>
                  <td colspan="2">0.67</td>
                  <td colspan="2">0.53</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>Clinician 2</td>
                  <td colspan="2">189</td>
                  <td colspan="2">11</td>
                  <td colspan="2">95</td>
                  <td colspan="2">45</td>
                  <td colspan="2">0.69</td>
                  <td colspan="2">0.32</td>
                  <td colspan="2">0.95</td>
                  <td colspan="2">0.8</td>
                  <td colspan="2">0.36</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>Clinician 3</td>
                  <td colspan="2">138</td>
                  <td colspan="2">62</td>
                  <td colspan="2">48</td>
                  <td colspan="2">92</td>
                  <td colspan="2">0.68</td>
                  <td colspan="2">0.66</td>
                  <td colspan="2">0.69</td>
                  <td colspan="2">0.6</td>
                  <td colspan="2">0.56</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>Clinician 4</td>
                  <td colspan="2">183</td>
                  <td colspan="2">17</td>
                  <td colspan="2">85</td>
                  <td colspan="2">55</td>
                  <td colspan="2">0.7</td>
                  <td colspan="2">0.39</td>
                  <td colspan="2">0.92</td>
                  <td colspan="2">0.76</td>
                  <td colspan="2">0.44</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>Clinician 5</td>
                  <td colspan="2">162</td>
                  <td colspan="2">38</td>
                  <td colspan="2">58</td>
                  <td colspan="2">82</td>
                  <td colspan="2">0.72</td>
                  <td colspan="2">0.59</td>
                  <td colspan="2">0.81</td>
                  <td colspan="2">0.68</td>
                  <td colspan="2">0.5</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>Clinician 6</td>
                  <td colspan="2">156</td>
                  <td colspan="2">44</td>
                  <td colspan="2">52</td>
                  <td colspan="2">88</td>
                  <td colspan="2">0.72</td>
                  <td colspan="2">0.63</td>
                  <td colspan="2">0.78</td>
                  <td colspan="2">0.67</td>
                  <td colspan="2">0.54</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>Average across clinicians</td>
                  <td colspan="2">—</td>
                  <td colspan="2">—</td>
                  <td colspan="2">—</td>
                  <td colspan="2">—</td>
                  <td colspan="2">0.7</td>
                  <td colspan="2">0.53</td>
                  <td colspan="2">0.82</td>
                  <td colspan="2">0.7</td>
                  <td colspan="2">0.49</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td colspan="20">
                    <bold>Chief complaint text + previous suicide attempt knowledge</bold>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>GPT-4</td>
                  <td colspan="2">102</td>
                  <td colspan="2">98</td>
                  <td colspan="2">23</td>
                  <td colspan="2">117</td>
                  <td colspan="2">0.64</td>
                  <td colspan="2">0.84</td>
                  <td colspan="2">0.51</td>
                  <td colspan="2">0.54</td>
                  <td colspan="2">—</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>Clinician 1</td>
                  <td colspan="2">163</td>
                  <td colspan="2">37</td>
                  <td colspan="2">49</td>
                  <td colspan="2">91</td>
                  <td colspan="2">0.75</td>
                  <td colspan="2">0.65</td>
                  <td colspan="2">0.82</td>
                  <td colspan="2">0.71</td>
                  <td colspan="2">0.46</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>Clinician 2</td>
                  <td colspan="2">194</td>
                  <td colspan="2">6</td>
                  <td colspan="2">89</td>
                  <td colspan="2">51</td>
                  <td colspan="2">0.72</td>
                  <td colspan="2">0.36</td>
                  <td colspan="2">0.97</td>
                  <td colspan="2">0.9</td>
                  <td colspan="2">0.21</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>Clinician 3</td>
                  <td colspan="2">152</td>
                  <td colspan="2">48</td>
                  <td colspan="2">39</td>
                  <td colspan="2">101</td>
                  <td colspan="2">0.74</td>
                  <td colspan="2">0.72</td>
                  <td colspan="2">0.76</td>
                  <td colspan="2">0.68</td>
                  <td colspan="2">0.5</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>Clinician 4</td>
                  <td colspan="2">187</td>
                  <td colspan="2">13</td>
                  <td colspan="2">67</td>
                  <td colspan="2">73</td>
                  <td colspan="2">0.77</td>
                  <td colspan="2">0.52</td>
                  <td colspan="2">0.94</td>
                  <td colspan="2">0.85</td>
                  <td colspan="2">0.33</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>Clinician 5</td>
                  <td colspan="2">173</td>
                  <td colspan="2">27</td>
                  <td colspan="2">53</td>
                  <td colspan="2">87</td>
                  <td colspan="2">0.77</td>
                  <td colspan="2">0.62</td>
                  <td colspan="2">0.87</td>
                  <td colspan="2">0.76</td>
                  <td colspan="2">0.4</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>Clinician 6</td>
                  <td colspan="2">159</td>
                  <td colspan="2">41</td>
                  <td colspan="2">47</td>
                  <td colspan="2">93</td>
                  <td colspan="2">0.74</td>
                  <td colspan="2">0.66</td>
                  <td colspan="2">0.8</td>
                  <td colspan="2">0.69</td>
                  <td colspan="2">0.42</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>Average across clinicians</td>
                  <td colspan="2">—</td>
                  <td colspan="2">—</td>
                  <td colspan="2">—</td>
                  <td colspan="2">—</td>
                  <td colspan="2">0.75</td>
                  <td colspan="2">0.59</td>
                  <td colspan="2">0.86</td>
                  <td colspan="2">0.77</td>
                  <td colspan="2">0.39</td>
                </tr>
                <tr valign="top">
                  <td colspan="21">
                    <bold>SI with plan post intake (n=120) versus no SI with plan (n=200)</bold>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td colspan="2">Baseline for comparison: previous suicide attempt only</td>
                  <td colspan="2">186</td>
                  <td colspan="2">14</td>
                  <td colspan="2">80</td>
                  <td colspan="2">40</td>
                  <td colspan="2">0.71</td>
                  <td colspan="2">0.33</td>
                  <td colspan="2">0.93</td>
                  <td colspan="2">0.74</td>
                  <td colspan="2">—</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td colspan="20">
                    <bold>Chief complaint text only</bold>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>GPT-4</td>
                  <td colspan="2">141</td>
                  <td colspan="2">—</td>
                  <td colspan="2">65</td>
                  <td colspan="2">55</td>
                  <td colspan="2">0.61</td>
                  <td colspan="2">0.46</td>
                  <td colspan="2">0.71</td>
                  <td colspan="2">0.48</td>
                  <td colspan="2">—</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>Clinician 1</td>
                  <td colspan="2">160</td>
                  <td colspan="2">—</td>
                  <td colspan="2">69</td>
                  <td colspan="2">51</td>
                  <td colspan="2">0.66</td>
                  <td colspan="2">0.43</td>
                  <td colspan="2">0.8</td>
                  <td colspan="2">0.56</td>
                  <td colspan="2">0.44</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>Clinician 2</td>
                  <td colspan="2">189</td>
                  <td colspan="2">—</td>
                  <td colspan="2">100</td>
                  <td colspan="2">20</td>
                  <td colspan="2">0.65</td>
                  <td colspan="2">0.17</td>
                  <td colspan="2">0.95</td>
                  <td colspan="2">0.65</td>
                  <td colspan="2">0.26</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>Clinician 3</td>
                  <td colspan="2">138</td>
                  <td colspan="2">—</td>
                  <td colspan="2">54</td>
                  <td colspan="2">66</td>
                  <td colspan="2">0.64</td>
                  <td colspan="2">0.55</td>
                  <td colspan="2">0.69</td>
                  <td colspan="2">0.52</td>
                  <td colspan="2">0.44</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>Clinician 4</td>
                  <td colspan="2">183</td>
                  <td colspan="2">—</td>
                  <td colspan="2">84</td>
                  <td colspan="2">36</td>
                  <td colspan="2">0.68</td>
                  <td colspan="2">0.3</td>
                  <td colspan="2">0.92</td>
                  <td colspan="2">0.68</td>
                  <td colspan="2">0.34</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>Clinician 5</td>
                  <td colspan="2">162</td>
                  <td colspan="2">—</td>
                  <td colspan="2">70</td>
                  <td colspan="2">50</td>
                  <td colspan="2">0.66</td>
                  <td colspan="2">0.42</td>
                  <td colspan="2">0.81</td>
                  <td colspan="2">0.57</td>
                  <td colspan="2">0.43</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>Clinician 6</td>
                  <td colspan="2">156</td>
                  <td colspan="2">—</td>
                  <td colspan="2">56</td>
                  <td colspan="2">64</td>
                  <td colspan="2">0.69</td>
                  <td colspan="2">0.53</td>
                  <td colspan="2">0.78</td>
                  <td colspan="2">0.59</td>
                  <td colspan="2">0.5</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>Average across clinicians</td>
                  <td colspan="2">—</td>
                  <td colspan="2">—</td>
                  <td colspan="2">—</td>
                  <td colspan="2">—</td>
                  <td colspan="2">0.66</td>
                  <td colspan="2">0.4</td>
                  <td colspan="2">0.82</td>
                  <td colspan="2">0.59</td>
                  <td colspan="2">0.4</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td colspan="20">
                    <bold>Chief complaint text + previous suicide attempt knowledge</bold>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>GPT-4</td>
                  <td colspan="2">102</td>
                  <td colspan="2">—</td>
                  <td colspan="2">31</td>
                  <td colspan="2">89</td>
                  <td colspan="2">0.6</td>
                  <td colspan="2">0.74</td>
                  <td colspan="2">0.51</td>
                  <td colspan="2">0.48</td>
                  <td colspan="2">—</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>Clinician 1</td>
                  <td colspan="2">163</td>
                  <td colspan="2">—</td>
                  <td colspan="2">59</td>
                  <td colspan="2">61</td>
                  <td colspan="2">0.7</td>
                  <td colspan="2">0.51</td>
                  <td colspan="2">0.82</td>
                  <td colspan="2">0.62</td>
                  <td colspan="2">0.37</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>Clinician 2</td>
                  <td colspan="2">194</td>
                  <td colspan="2">—</td>
                  <td colspan="2">90</td>
                  <td colspan="2">30</td>
                  <td colspan="2">0.7</td>
                  <td colspan="2">0.25</td>
                  <td colspan="2">0.97</td>
                  <td colspan="2">0.83</td>
                  <td colspan="2">0.17</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>Clinician 3</td>
                  <td colspan="2">152</td>
                  <td colspan="2">—</td>
                  <td colspan="2">49</td>
                  <td colspan="2">71</td>
                  <td colspan="2">0.7</td>
                  <td colspan="2">0.59</td>
                  <td colspan="2">0.76</td>
                  <td colspan="2">0.6</td>
                  <td colspan="2">0.45</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>Clinician 4</td>
                  <td colspan="2">187</td>
                  <td colspan="2">—</td>
                  <td colspan="2">76</td>
                  <td colspan="2">44</td>
                  <td colspan="2">0.72</td>
                  <td colspan="2">0.37</td>
                  <td colspan="2">0.94</td>
                  <td colspan="2">0.77</td>
                  <td colspan="2">0.27</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>Clinician 5</td>
                  <td colspan="2">173</td>
                  <td colspan="2">—</td>
                  <td colspan="2">63</td>
                  <td colspan="2">57</td>
                  <td colspan="2">0.72</td>
                  <td colspan="2">0.48</td>
                  <td colspan="2">0.87</td>
                  <td colspan="2">0.68</td>
                  <td colspan="2">0.36</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>Clinician 6</td>
                  <td colspan="2">159</td>
                  <td colspan="2">—</td>
                  <td colspan="2">54</td>
                  <td colspan="2">66</td>
                  <td colspan="2">0.7</td>
                  <td colspan="2">0.55</td>
                  <td colspan="2">0.8</td>
                  <td colspan="2">0.62</td>
                  <td colspan="2">0.35</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>Average across clinicians</td>
                  <td colspan="2">—</td>
                  <td colspan="2">—</td>
                  <td colspan="2">—</td>
                  <td colspan="2">—</td>
                  <td colspan="2">0.71</td>
                  <td colspan="2">0.46</td>
                  <td colspan="2">0.86</td>
                  <td colspan="2">0.69</td>
                  <td colspan="2">0.33</td>
                </tr>
              </tbody>
            </table>
            <table-wrap-foot>
              <fn id="table2fn1">
                <p><sup>a</sup>Not applicable.</p>
              </fn>
            </table-wrap-foot>
          </table-wrap>
        </sec>
        <sec>
          <title>Predicting SI With Plan Post Intake</title>
          <p>Performance decreased for both clinicians and GPT-4 when predicting future SI with plan post intake. Note that specificity results were consistent with predicting SI with plan at intake, as there was no change in the negative samples.</p>
          <p>GPT-4 performed with similar accuracy (0.61) and higher, but still poor, sensitivity (0.46) in predicting SI with plan post intake based solely on the chief complaint compared with the average accuracy (0.66) and sensitivity (0.4) across the 6 clinicians (<xref ref-type="table" rid="table2">Table 2</xref>). GPT-4 performed with lower precision (0.48) than the average clinician precision (0.59). The interrater agreement between GPT-4 and each clinician remained moderate at an average Cohen κ of 0.4.</p>
          <p>Additional knowledge of the previous suicide attempts increased performance across all clinicians (accuracy=0.71; sensitivity=0.46; precision=0.69). Additional knowledge of the previous suicide attempt significantly increased sensitivity for GPT-4 but decreased accuracy and precision (accuracy=0.6; sensitivity=0.74; precision=0.48). The interrater agreement between GPT-4 and each clinician was lower, with an average Cohen κ of 0.33 with the additional information.</p>
        </sec>
      </sec>
      <sec>
        <title>Clinical Consensus and Confidence</title>
        <p>Clinical consensus was defined as instances in which all 6 clinicians agreed on the predicted outcome for a given sample, regardless of whether the prediction was correct. Clinical consensus occurred in 52% (104/200) of “no SI with plan” samples, 40.7% (57/140) of “SI with plan at intake” samples, and 40% (48/120) of “SI with plan postintake” samples (<xref ref-type="table" rid="table3">Table 3</xref>). For SI with plan samples with a clinical consensus, the agreed-upon prediction was correct 61.4% (35/57) of the time for “SI with plan at intake” versus much lower at 25% (12/48) of the time for “SI with plan postintake.” For the “no SI with plan” samples, the clinicians’ agreed-upon prediction was correct at a high rate of 98.1% (102/104).</p>
        <table-wrap position="float" id="table3">
          <label>Table 3</label>
          <caption>
            <p>Rates of clinical consensus, defined as instances in which all 6 clinicians agreed on the predicted outcome for a given sample.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="360"/>
            <col width="190"/>
            <col width="220"/>
            <col width="230"/>
            <thead>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>No SI with plan (n=200), n (%)</td>
                <td>SI with plan at intake (n=140), n (%)</td>
                <td>SI with plan post intake (n=120), n (%)</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Number of samples with clinical consensus</td>
                <td>104 (52)</td>
                <td>57 (40.7)</td>
                <td>48 (40)</td>
              </tr>
              <tr valign="top">
                <td>Clinical consensus predicted SI with plan</td>
                <td>2 (1.9)</td>
                <td>35 (61.4)</td>
                <td>12 (25)</td>
              </tr>
              <tr valign="top">
                <td>Clinical consensus predicted no SI with plan</td>
                <td>102 (98.1)</td>
                <td>22 (38.6)</td>
                <td>36 (75)</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
        <p>In addition, clinicians, on average, had lower rates of high confidence (even when answers were correct) compared with GPT-4 (<xref ref-type="table" rid="table4">Table 4</xref>). On average, clinicians correctly answered “no with high confidence” in 9.5% (19/200) of “no SI with plan” samples, whereas GPT-4 answered “no with high confidence” in 35% (70/200). Clinicians correctly answered “yes with high confidence” in 15.7% (22/140) of “SI with plan at intake” samples versus 29.3% (41/140) for GPT-4. Rates of correctly answered “yes with high confidence” were lower in “SI with plan postintake” samples but were higher for GPT-4 compared with average clinician rates (13.3%, 16/120 vs 7.2%, 8.7/120).</p>
        <table-wrap position="float" id="table4">
          <label>Table 4</label>
          <caption>
            <p>Rates of high confidence answers.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="220"/>
            <col width="130"/>
            <col width="130"/>
            <col width="0"/>
            <col width="130"/>
            <col width="130"/>
            <col width="0"/>
            <col width="130"/>
            <col width="130"/>
            <thead>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="3">No SI<sup>a</sup> with plan (n=200)</td>
                <td colspan="3">SI with plan at intake (n=140)</td>
                <td colspan="2">SI with plan post intake (n=120)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Answered yes with high confidence, n (%)</td>
                <td>Answered no with high confidence, n (%)</td>
                <td colspan="2">Answered yes with high confidence, n (%)</td>
                <td>Answered no with high confidence, n (%)</td>
                <td colspan="2">Answered yes with high confidence, n (%)</td>
                <td>Answered no with high confidence, n (%)</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Clinician 1</td>
                <td>5 (2.5)</td>
                <td>6 (3)</td>
                <td colspan="2">45 (32.1)</td>
                <td>1 (0.7)</td>
                <td colspan="2">16 (13.3)</td>
                <td>2 (1.7)</td>
              </tr>
              <tr valign="top">
                <td>Clinician 2</td>
                <td>0 (0)</td>
                <td>19 (9.5)</td>
                <td colspan="2">5 (3.6)</td>
                <td>7 (5.0)</td>
                <td colspan="2">1 (0.8)</td>
                <td>4 (3.3)</td>
              </tr>
              <tr valign="top">
                <td>Clinician 3</td>
                <td>2 (1)</td>
                <td>41 (20.5)</td>
                <td colspan="2">20 (14.3)</td>
                <td>9 (6.4)</td>
                <td colspan="2">9 (7.5)</td>
                <td>6 (5)</td>
              </tr>
              <tr valign="top">
                <td>Clinician 4</td>
                <td>0 (0)</td>
                <td>0 (0)</td>
                <td colspan="2">1 (0.7)</td>
                <td>0 (0)</td>
                <td colspan="2">0 (0)</td>
                <td>0 (0)</td>
              </tr>
              <tr valign="top">
                <td>Clinician 5</td>
                <td>0 (0)</td>
                <td>2 (1)</td>
                <td colspan="2">23 (16.4)</td>
                <td>0 (0)</td>
                <td colspan="2">5 (4.2)</td>
                <td>3 (2.5)</td>
              </tr>
              <tr valign="top">
                <td>Clinician 6</td>
                <td>2 (1)</td>
                <td>46 (23)</td>
                <td colspan="2">38 (27.1)</td>
                <td>13 (9.3)</td>
                <td colspan="2">21 (17.5)</td>
                <td>12 (10)</td>
              </tr>
              <tr valign="top">
                <td>Average across clinicians (%)</td>
                <td>1.5 (0.75)</td>
                <td>19 (9.5)</td>
                <td colspan="2">22 (15.7)</td>
                <td>5 (3.6)</td>
                <td colspan="2">8.7 (7.2)</td>
                <td>4.5 (3.8)</td>
              </tr>
              <tr valign="top">
                <td>GPT-4<sup>b</sup></td>
                <td>1 (0.5)</td>
                <td>70 (35.0)</td>
                <td colspan="2">41 (29.3)</td>
                <td>17 (12.1)</td>
                <td colspan="2">16 (13.3)</td>
                <td>14 (11.7)</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table4fn1">
              <p><sup>a</sup>SI: suicidal ideation.</p>
            </fn>
            <fn id="table4fn2">
              <p><sup>b</sup>GPT-4: generative pretrained transformer 4.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
      <sec>
        <title>Accuracy of Clinical Consensus and GPT-4 Performance</title>
        <p>A range of accurate clinical consensus samples was defined as samples where several clinicians, ranging from at least 1 to all 6, not only agreed on the predicted outcome but also correctly predicted the outcome. There were 316 samples of the “SI with plan at intake” and “no SI with plan” samples where at least 1 clinician predicted the outcome correctly versus 137 samples where all 6 clinicians predicted the outcome correctly (<xref ref-type="table" rid="table5">Table 5</xref>). There were 282 samples of the “SI with plan postintake” and “no SI with plan” samples where at least 1 clinician predicted the outcome correctly versus 114 samples where all 6 clinicians predicted the outcome correctly.</p>
        <table-wrap position="float" id="table5">
          <label>Table 5</label>
          <caption>
            <p>Performance results for GPT-4 solely on the chief complaint in samples where at least 1, 2, 3, 4, 5, or all 6 clinicians correctly predicted the outcome of those samples.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="90"/>
            <col width="0"/>
            <col width="100"/>
            <col width="0"/>
            <col width="110"/>
            <col width="0"/>
            <col width="0"/>
            <col width="110"/>
            <col width="0"/>
            <col width="0"/>
            <col width="110"/>
            <col width="0"/>
            <col width="0"/>
            <col width="110"/>
            <col width="0"/>
            <col width="0"/>
            <col width="80"/>
            <col width="0"/>
            <col width="0"/>
            <col width="90"/>
            <col width="0"/>
            <col width="0"/>
            <col width="90"/>
            <col width="0"/>
            <col width="0"/>
            <col width="80"/>
            <thead>
              <tr valign="top">
                <td colspan="3">Number of clinicians correctly predicting samples’ consensus threshold</td>
                <td colspan="2">Number of samples</td>
                <td colspan="3">True negative</td>
                <td colspan="3">False positive</td>
                <td colspan="3">False negative</td>
                <td colspan="3">True positive</td>
                <td colspan="3">Accuracy</td>
                <td colspan="3">Sensitivity</td>
                <td colspan="3">Specificity</td>
                <td>Precision</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="27">
                  <bold>SI with plan at intake (original n=140) versus no SI with plan (original n=200)</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>≥1</td>
                <td colspan="2">316</td>
                <td colspan="3">141</td>
                <td colspan="3">57</td>
                <td colspan="3">32</td>
                <td colspan="3">86</td>
                <td colspan="3">0.72</td>
                <td colspan="3">0.73</td>
                <td colspan="3">0.71</td>
                <td colspan="2">0.60</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>≥2</td>
                <td colspan="2">284</td>
                <td colspan="3">141</td>
                <td colspan="3">52</td>
                <td colspan="3">14</td>
                <td colspan="3">77</td>
                <td colspan="3">0.77</td>
                <td colspan="3">0.85</td>
                <td colspan="3">0.73</td>
                <td colspan="2">0.60</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>≥3</td>
                <td colspan="2">259</td>
                <td colspan="3">137</td>
                <td colspan="3">42</td>
                <td colspan="3">7</td>
                <td colspan="3">73</td>
                <td colspan="3">0.81</td>
                <td colspan="3">0.91</td>
                <td colspan="3">0.77</td>
                <td colspan="2">0.64</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>≥4</td>
                <td colspan="2">236</td>
                <td colspan="3">133</td>
                <td colspan="3">36</td>
                <td colspan="3">2</td>
                <td colspan="3">65</td>
                <td colspan="3">0.84</td>
                <td colspan="3">0.97</td>
                <td colspan="3">0.79</td>
                <td colspan="2">0.64</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>≥5</td>
                <td colspan="2">200</td>
                <td colspan="3">123</td>
                <td colspan="3">24</td>
                <td colspan="3">0</td>
                <td colspan="3">53</td>
                <td colspan="3">0.88</td>
                <td colspan="3">1</td>
                <td colspan="3">0.84</td>
                <td colspan="2">0.69</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>6</td>
                <td colspan="2">137</td>
                <td colspan="3">89</td>
                <td colspan="3">13</td>
                <td colspan="3">0</td>
                <td colspan="3">35</td>
                <td colspan="3">0.91</td>
                <td colspan="3">1</td>
                <td colspan="3">0.87</td>
                <td colspan="2">0.73</td>
              </tr>
              <tr valign="top">
                <td colspan="27">
                  <bold>SI with plan post intake (original n=120) versus no SI with plan (original n=200)</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>≥1</td>
                <td colspan="2">282</td>
                <td colspan="2">141</td>
                <td colspan="3">57</td>
                <td colspan="3">31</td>
                <td colspan="3">53</td>
                <td colspan="3">0.69</td>
                <td colspan="3">0.63</td>
                <td colspan="3">0.71</td>
                <td colspan="3">0.48</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>≥2</td>
                <td colspan="2">266</td>
                <td colspan="2">141</td>
                <td colspan="3">52</td>
                <td colspan="3">23</td>
                <td colspan="3">50</td>
                <td colspan="3">0.72</td>
                <td colspan="3">0.69</td>
                <td colspan="3">0.73</td>
                <td colspan="3">0.49</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>≥3</td>
                <td colspan="2">233</td>
                <td colspan="2">137</td>
                <td colspan="3">42</td>
                <td colspan="3">10</td>
                <td colspan="3">44</td>
                <td colspan="3">0.78</td>
                <td colspan="3">0.82</td>
                <td colspan="3">0.77</td>
                <td colspan="3">0.51</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>≥4</td>
                <td colspan="2">211</td>
                <td colspan="2">133</td>
                <td colspan="3">36</td>
                <td colspan="3">6</td>
                <td colspan="3">36</td>
                <td colspan="3">0.80</td>
                <td colspan="3">0.86</td>
                <td colspan="3">0.79</td>
                <td colspan="3">0.5</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>≥5</td>
                <td colspan="2">169</td>
                <td colspan="2">123</td>
                <td colspan="3">24</td>
                <td colspan="3">1</td>
                <td colspan="3">21</td>
                <td colspan="3">0.85</td>
                <td colspan="3">0.96</td>
                <td colspan="3">0.84</td>
                <td colspan="3">0.47</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>6</td>
                <td colspan="2">114</td>
                <td colspan="2">89</td>
                <td colspan="3">13</td>
                <td colspan="3">0</td>
                <td colspan="3">12</td>
                <td colspan="3">0.89</td>
                <td colspan="3">1</td>
                <td colspan="3">0.87</td>
                <td colspan="3">0.48</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
        <p>As the accurate clinical consensus threshold increased, GPT-4 performance increased significantly in those samples (<xref ref-type="table" rid="table5">Table 5</xref>). When assessing the “SI with plan at intake” and “no SI with plan” samples with a clinical consensus of 3 or more and correct predictions, GPT-4 performed with an accuracy of 0.81, sensitivity of 0.91, specificity of 0.77, and precision of 0.64. When assessing the “SI with plan postintake” and “no SI with plan” samples with a clinical consensus of 3 or more and correct predictions, GPT-4 performed with an accuracy of 0.78, sensitivity of 0.82, and precision of 0.51.</p>
      </sec>
      <sec>
        <title>Risk Indicators Identified in Chief Complaint Text by GPT-4</title>
        <p>At least 1 risk indicator was identified in the chief complaint text by GPT-4 on 45.5% (91/200) of “no SI with plan” samples (<xref ref-type="table" rid="table6">Table 6</xref>). A total of 70% (98/140) of “SI with plan at intake” samples and 54.2% (65/120) of “SI with plan postintake” samples had at least 1 GPT-4–identified risk indicator. The most common risk indicator in “SI with plan at intake” samples identified by GPT-4 was “sense of hopelessness” (in 40% [56/140] of samples, compared with 27.5% [33/120] of “SI with plan postintake” and 16.5% [33/200] of “no SI with plan”). The most common risk indicator in “no SI with plan” samples was “recent stress, loss, or trauma” (in 25.5% [51/200] of samples, compared with 22.1% [31/140] of “SI with plan at intake” samples and 17.5% [21/120] of “SI with plan postintake” samples). In addition, the rate of identification of “social isolation” as a risk factor in “SI with plan postintake” samples (15/120, 12.5%) was higher than in both “no SI with plan” samples (13/200, 6.5%) and “SI with plan at intake” samples (8/140, 5.7%).</p>
        <table-wrap position="float" id="table6">
          <label>Table 6</label>
          <caption>
            <p>Number of samples per explicit risk indicator identified by GPT-4.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="330"/>
            <col width="180"/>
            <col width="220"/>
            <col width="240"/>
            <thead>
              <tr valign="top">
                <td colspan="2">
                  <break/>
                </td>
                <td>No SI with plan (n=200)</td>
                <td>SI with plan at intake (n=140)</td>
                <td>SI with plan post intake (n=120)</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="5">
                  <bold>Number of risk indicators identified by GPT-4, n (%)</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>0</td>
                <td>109 (54.5)</td>
                <td>42 (30)</td>
                <td>55 (45.8)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>1</td>
                <td>34 (17)</td>
                <td>28 (20)</td>
                <td>22 (18.3)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>2</td>
                <td>34 (17)</td>
                <td>37 (26.4)</td>
                <td>18 (15)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>3</td>
                <td>16 (8)</td>
                <td>22 (15.7)</td>
                <td>15 (12.5)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>4</td>
                <td>4 (2)</td>
                <td>6 (4.3)</td>
                <td>8 (6.7)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>5</td>
                <td>3 (1.5)</td>
                <td>3 (2.1)</td>
                <td>1 (0.8)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>6</td>
                <td>0 (0)</td>
                <td>2 (1.4)</td>
                <td>1 (0.8)</td>
              </tr>
              <tr valign="top">
                <td colspan="5">
                  <bold>Risk indicator identified by GPT-4, n (%)</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Sense of hopelessness</td>
                <td>33 (16.5)</td>
                <td>56 (40)</td>
                <td>33 (27.5)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Explicit mentions of suicide, suicidal thoughts, or self-harm</td>
                <td>2 (1)</td>
                <td>38 (27.1)</td>
                <td>19 (15.8)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Recent stress, loss, or trauma</td>
                <td>51 (25.5)</td>
                <td>31 (22.1)</td>
                <td>21 (17.5)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Apathy, indifference, or emotional detachment</td>
                <td>19 (9.5)</td>
                <td>22 (15.7)</td>
                <td>19 (15.8)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Lack or loss of relationships or support</td>
                <td>22 (11)</td>
                <td>17 (12.1)</td>
                <td>12 (10)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Social isolation</td>
                <td>13 (6.5)</td>
                <td>8 (5.7)</td>
                <td>15 (12.5)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Chronic medical conditions</td>
                <td>13 (6.5)</td>
                <td>13 (9.3)</td>
                <td>8 (6.7)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>History of trauma</td>
                <td>13 (6.5)</td>
                <td>10 (7.1)</td>
                <td>8 (6.7)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Impulsive or aggressive language</td>
                <td>3 (1.5)</td>
                <td>8 (5.7)</td>
                <td>6 (5)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Previous suicide attempt</td>
                <td>0 (0)</td>
                <td>9 (6.4)</td>
                <td>1 (0.8)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Substance use</td>
                <td>10 (5)</td>
                <td>6 (4.3)</td>
                <td>3 (2.5)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Family history of suicide</td>
                <td>0 (0)</td>
                <td>0 (0)</td>
                <td>1 (0.8)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Death imagery or metaphors</td>
                <td>2 (1)</td>
                <td>1 (0.7)</td>
                <td>0 (0)</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
      </sec>
      <sec>
        <title>Chief Complaints With No Risk Indicators and Clinician Performance</title>
        <p>Assessing the clinicians’ performance on samples where GPT-4 identified no explicit risk indicators in the chief complaint text, the average clinician sensitivity was found to be low for both “SI with plan at intake” and “SI with plan postintake” at 0.22 and 0.17, respectively (<xref ref-type="table" rid="table7">Table 7</xref>). The average clinician specificity and precision were high for both “SI with plan at intake” and “SI with plan postintake” at 0.93 and 0.63 versus 0.93 and 0.6, respectively. While the sample size in this analysis was significantly decreased, n=109/200 (54.5%) for “no SI with plan,” n=42/140 (30%) for “SI with plan at intake,” and n=55/120 (45.8%) for “SI with plan postintake,” clinicians’ performance resulted in fewer false positives and a lower rate of positive prediction, indicating that clinicians are less likely to predict SI with plan in patients where GPT did not identify any risk factors.</p>
        <table-wrap position="float" id="table7">
          <label>Table 7</label>
          <caption>
            <p>Performance results for chief complaint text-only samples where GPT-4 identified zero explicit risk indicators.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="190"/>
            <col width="110"/>
            <col width="110"/>
            <col width="110"/>
            <col width="110"/>
            <col width="80"/>
            <col width="90"/>
            <col width="90"/>
            <col width="80"/>
            <thead>
              <tr valign="top">
                <td colspan="2">
                  <break/>
                </td>
                <td>True negative</td>
                <td>False positive</td>
                <td>False negative</td>
                <td>True positive</td>
                <td>Accuracy</td>
                <td>Sensitivity</td>
                <td>Specificity</td>
                <td>Precision</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="10">
                  <bold>SI<sup>a</sup> with plan at intake (n=42) versus no SI with plan (n=109)</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>GPT-4</td>
                <td>109</td>
                <td>0</td>
                <td>40</td>
                <td>2</td>
                <td>0.74</td>
                <td>0.05</td>
                <td>1</td>
                <td>1</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Clinician 1</td>
                <td>100</td>
                <td>9</td>
                <td>33</td>
                <td>9</td>
                <td>0.72</td>
                <td>0.21</td>
                <td>0.92</td>
                <td>0.5</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Clinician 2</td>
                <td>108</td>
                <td>1</td>
                <td>40</td>
                <td>2</td>
                <td>0.73</td>
                <td>0.05</td>
                <td>0.99</td>
                <td>0.67</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Clinician 3</td>
                <td>91</td>
                <td>18</td>
                <td>27</td>
                <td>15</td>
                <td>0.70</td>
                <td>0.36</td>
                <td>0.84</td>
                <td>0.46</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Clinician 4</td>
                <td>109</td>
                <td>0</td>
                <td>39</td>
                <td>3</td>
                <td>0.74</td>
                <td>0.07</td>
                <td>1</td>
                <td>1</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Clinician 5</td>
                <td>101</td>
                <td>8</td>
                <td>28</td>
                <td>14</td>
                <td>0.76</td>
                <td>0.33</td>
                <td>0.93</td>
                <td>0.64</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Clinician 6</td>
                <td>96</td>
                <td>13</td>
                <td>29</td>
                <td>13</td>
                <td>0.72</td>
                <td>0.31</td>
                <td>0.88</td>
                <td>0.5</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Average across clinicians</td>
                <td>—<sup>b</sup></td>
                <td>—</td>
                <td>—</td>
                <td>—</td>
                <td>0.73</td>
                <td>0.22</td>
                <td>0.93</td>
                <td>0.63</td>
              </tr>
              <tr valign="top">
                <td colspan="10">
                  <bold>SI with plan postintake (n=55) versus no SI with plan (n=109)</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>GPT-4</td>
                <td>109</td>
                <td>0</td>
                <td>54</td>
                <td>1</td>
                <td>0.67</td>
                <td>0.02</td>
                <td>1</td>
                <td>1</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Clinician 1</td>
                <td>100</td>
                <td>9</td>
                <td>45</td>
                <td>10</td>
                <td>0.67</td>
                <td>0.18</td>
                <td>0.92</td>
                <td>0.53</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Clinician 2</td>
                <td>108</td>
                <td>1</td>
                <td>54</td>
                <td>1</td>
                <td>0.67</td>
                <td>0.02</td>
                <td>0.99</td>
                <td>0.5</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Clinician 3</td>
                <td>91</td>
                <td>18</td>
                <td>37</td>
                <td>18</td>
                <td>0.67</td>
                <td>0.33</td>
                <td>0.84</td>
                <td>0.5</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Clinician 4</td>
                <td>109</td>
                <td>0</td>
                <td>51</td>
                <td>4</td>
                <td>0.69</td>
                <td>0.07</td>
                <td>1</td>
                <td>1</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Clinician 5</td>
                <td>101</td>
                <td>8</td>
                <td>44</td>
                <td>11</td>
                <td>0.68</td>
                <td>0.2</td>
                <td>0.93</td>
                <td>0.58</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Clinician 6</td>
                <td>96</td>
                <td>13</td>
                <td>43</td>
                <td>12</td>
                <td>0.66</td>
                <td>0.22</td>
                <td>0.88</td>
                <td>0.48</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Average across clinicians</td>
                <td>—</td>
                <td>—</td>
                <td>—</td>
                <td>—</td>
                <td>0.67</td>
                <td>0.17</td>
                <td>0.93</td>
                <td>0.6</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table7fn1">
              <p><sup>a</sup>SI: suicidal ideation.</p>
            </fn>
            <fn id="table7fn2">
              <p><sup>b</sup>Not applicable.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Overview</title>
        <p>The objective of this study was to evaluate the performance of the foundation LLM GPT-4 compared with experienced mental health clinicians in predicting SI with plan based on a patient-generated chief complaint–free text at intake on a national telemental health platform. This study supports previous research that LLMs are able to perform comparably to clinicians in medical applications and that generalist models such as GPT-4 are able to deliver comparable performance without specialized fine-tuning or domain expertise [<xref ref-type="bibr" rid="ref24">24</xref>,<xref ref-type="bibr" rid="ref25">25</xref>].</p>
      </sec>
      <sec>
        <title>Findings</title>
        <p>GPT-4 is capable of predicting the risk of SI with plan using patient-generated chief complaint–free text without extensive work on prompt design and without being trained explicitly on this task. The performance of these GPT-4–based predictions approaches that of the clinicians on a variety of measures.</p>
        <p>The variability in clinicians’ performance and agreement indicates that identifying SI with plan in patient text alone is a difficult problem even for clinical experts. However, using the clinical experts in this study as a benchmark, GPT-4 was still able to perform comparably in sensitivity but with lower specificity and precision. When assessing GPT-4 on samples with high clinician agreement and performance, this study found that GPT-4 was capable of significantly high sensitivity as well as specificity. These results support that models such as GPT-4, without large amounts of time spent on highly complex data cleaning or model training, are capable of identifying the risk of crisis comparable to the average clinician.</p>
        <p>This study also explored the use of GPT-4 as an NLP technique for the extraction of meaningful clinical information. GPT-4 was able to identify and return explicit indicators of risk in text, such as “sense of hopelessness,” that could further assist in crisis triaging and resourcing.</p>
        <p>In addition, while not a specific aim or analysis in this study, the average clinician took approximately 3 hours to evaluate the 460 samples of text provided. GPT-4 completed the full evaluation in less than 10 minutes, without optimization for computing or memory, highlighting the possible increased operational efficiency that could be leveraged by automating a tedious and emotionally trying manual task.</p>
        <p>Taking into consideration the current behavioral health care workforce shortage, and the increasing rates of suicide, there is a need for scalable, efficient, technology-enabled screening techniques, such as the one used in this study, to assist with suicide risk detection. More efficient risk detection will allow for faster delivery of interventions to help prevent suicide attempts. The use of technology for this purpose would also be a cost-saving and efficient way to more broadly screen for suicide risk. Patients deemed at high risk might be triaged by clinicians with greater expertise in managing suicidality.</p>
        <p>Responsible integration and the use of generative AI as a screening tool for predicting the likelihood of crisis would depend on achieving at least similar accuracy to a team of clinicians and should always be followed by review from a clinician, who would be given additional context behind the GPT-4–based prediction and have access to additional clinical data.</p>
        <p>Overall, GPT-4 shows promise as a solution to help clinicians deliver more timely care.</p>
      </sec>
      <sec>
        <title>Limitations</title>
        <p>We do not intend for this study, the LLM choice, or the prompt design to be viewed as a generalizable solution to predict and identify suicidal risk. Instead, we have shown how the capabilities of these LLMs can be tailored to specific psychiatric assessments and how they compare to the limitations of expert clinician predictions. We hope that the findings encourage further research.</p>
        <p>Several limitations in this study must be addressed before the results of such a system could be applied in practice. Addressing them would require, among other things, data from a larger or more diverse population, use of other LLMs, and in particular, LLMs that were built for application in the medical domain, and a greater exploration of prompt design and its impact on performance. Similar to the use of real-time clinical decision support for precision prescribing at Brightside, which is reliant on medical decision-making by trained clinicians, the use of LLMs for triage would be limited to suggestions and distillation of information for further clinician assessment [<xref ref-type="bibr" rid="ref29">29</xref>].</p>
        <p>Suicide has been notoriously difficult to predict. Due to the difficult nature of identifying or predicting future SI with plan, precision uncertainties are a reality in treating higher-severity behavioral health patients. This can be seen by the number of false positives and lower precision across several clinicians. Due to this uncertainty, awareness of risk does not necessarily dictate treatment decisions but might influence triage to a provider with more expertise in treating suicidality.</p>
        <p>GPT-4 was on the higher end for false positives with chief complaint text only relative to the clinicians, and when previous attempt knowledge was added, this rate was almost doubled, making this metric comparable to that of the worst-performing clinician. While work should be done to further align this GPT-4–based system with the expert clinicians, especially with previous attempt information, these false positives are clearly a reality in treating patients today.</p>
        <p>GPT-4 was on the lower end for false negatives relative to the clinicians, in some cases having half as many false negatives as the worst-performing clinicians. It is our view that increasing awareness around potential risk through the use of systems such as this is valuable, especially for clinicians who have less expertise.</p>
        <p>Finally, as previously discussed, LLMs have tendencies to perpetuate biases inherent in the data on which they are trained [<xref ref-type="bibr" rid="ref30">30</xref>]. Future work should explore how these biases may influence the quality of the prediction within different subpopulations of patients [<xref ref-type="bibr" rid="ref31">31</xref>].</p>
      </sec>
      <sec>
        <title>Conclusions</title>
        <p>The use of ML and LLMs to analyze speech and language patterns offers an opportunity for behavioral health clinicians and researchers to explore technologies such as these to assist with the detection and prediction of mental health conditions, along with specific symptoms such as suicidal thoughts, intent, and behaviors [<xref ref-type="bibr" rid="ref32">32</xref>]. This study served as a model for comparing the predictive value of generative AI to clinician (imperfect) predictions when both were given access to the same limited data set. Research evaluating applications of AI technology to human speech, language, and behavior is in its infancy, but findings such as the ones presented in this study may help clinicians and researchers leverage the potential of LLMs to help those struggling with mental illness. Generative AI has the potential to transform areas of mental health care that might otherwise be overlooked. However, great care must be taken by both developers of this technology and the clinicians who deploy it to ensure that the benefits far outweigh the safety challenges and risks.</p>
        <p>Further research is encouraged in this area, with consideration of the ethical and clinical implications of the use of AI for detecting and predicting mental health issues [<xref ref-type="bibr" rid="ref32">32</xref>]. This research will assist in setting standards and guidelines for how such use could be deployed.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group/>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">AI</term>
          <def>
            <p>artificial intelligence</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">GPT-4</term>
          <def>
            <p>generative pretrained transformer 4</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">LLM</term>
          <def>
            <p>large language model</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">ML</term>
          <def>
            <p>machine learning</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">NLP</term>
          <def>
            <p>natural language processing</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb6">PHQ-9</term>
          <def>
            <p>Patient Health Questionnaire-9</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb7">SI</term>
          <def>
            <p>suicidal ideation</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb8">USMLE</term>
          <def>
            <p>United States Medical Licensing Examination</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>The authors would like to thank the 6 clinicians who contributed their time to participate in data collection for this study.</p>
    </ack>
    <fn-group>
      <fn fn-type="conflict">
        <p>All the authors hold stock in and are employees of Brightside Health, Inc. The authors declare that this study received funding from Brightside Health. Aside from the employment status, the funder was not involved in the study design, interpretation of data, or the decision to submit for publication.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="web">
          <source>WISQARS (Web-based injury statistics query and reporting system)</source>
          <year>2023</year>
          <access-date>2024-01-20</access-date>
          <publisher-loc>Atlanta, GA</publisher-loc>
          <publisher-name>Centers for Disease Control and Prevention</publisher-name>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.cdc.gov/injury/wisqars/index.html">https://www.cdc.gov/injury/wisqars/index.html</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="web">
          <source>Suicide data and statistics. Suicide prevention</source>
          <year>2023</year>
          <access-date>2024-01-20</access-date>
          <publisher-loc>Atlanta, GA</publisher-loc>
          <publisher-name>Centers for Disease Control and Prevention</publisher-name>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.cdc.gov/suicide/suicide-data-statistics.html">https://www.cdc.gov/suicide/suicide-data-statistics.html</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="web">
          <source>Understanding the U.S. Behavioral Health Workforce shortage</source>
          <access-date>2024-06-27</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.commonwealthfund.org/publications/explainer/2023/may/understanding-us-behavioral-health-workforce-shortage">https://www.commonwealthfund.org/publications/explainer/2023/may/understanding-us-behavioral-health-workforce-shortage</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Beautrais</surname>
              <given-names>AL</given-names>
            </name>
            <name name-style="western">
              <surname>Joyce</surname>
              <given-names>PR</given-names>
            </name>
            <name name-style="western">
              <surname>Mulder</surname>
              <given-names>RT</given-names>
            </name>
            <name name-style="western">
              <surname>Fergusson</surname>
              <given-names>DM</given-names>
            </name>
            <name name-style="western">
              <surname>Deavoll</surname>
              <given-names>BJ</given-names>
            </name>
            <name name-style="western">
              <surname>Nightingale</surname>
              <given-names>SK</given-names>
            </name>
          </person-group>
          <article-title>Prevalence and comorbidity of mental disorders in persons making serious suicide attempts: a case-control study</article-title>
          <source>Am J Psychiatry</source>
          <year>1996</year>
          <volume>153</volume>
          <issue>8</issue>
          <fpage>1009</fpage>
          <lpage>1014</lpage>
          <pub-id pub-id-type="doi">10.1176/ajp.153.8.1009</pub-id>
          <pub-id pub-id-type="medline">8678168</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="web">
          <source>Risk and protective factors. Suicide prevention</source>
          <year>2023</year>
          <access-date>2024-01-20</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.cdc.gov/suicide/factors/index.html">https://www.cdc.gov/suicide/factors/index.html</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ribeiro</surname>
              <given-names>JD</given-names>
            </name>
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Fox</surname>
              <given-names>KR</given-names>
            </name>
            <name name-style="western">
              <surname>Franklin</surname>
              <given-names>JC</given-names>
            </name>
          </person-group>
          <article-title>Depression and hopelessness as risk factors for suicide ideation, attempts and death: meta-analysis of longitudinal studies</article-title>
          <source>Br J Psychiatry</source>
          <year>2018</year>
          <volume>212</volume>
          <issue>5</issue>
          <fpage>279</fpage>
          <lpage>286</lpage>
          <pub-id pub-id-type="doi">10.1192/bjp.2018.27</pub-id>
          <pub-id pub-id-type="medline">29587888</pub-id>
          <pub-id pub-id-type="pii">S0007125018000272</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Motillon-Toudic</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Walter</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Séguin</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Carrier</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Berrouiguet</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Lemey</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Social isolation and suicide risk: literature review and perspectives</article-title>
          <source>Eur Psychiatry</source>
          <year>2022</year>
          <volume>65</volume>
          <issue>1</issue>
          <fpage>e65</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/36216777"/>
          </comment>
          <pub-id pub-id-type="doi">10.1192/j.eurpsy.2022.2320</pub-id>
          <pub-id pub-id-type="medline">36216777</pub-id>
          <pub-id pub-id-type="pii">S0924933822023203</pub-id>
          <pub-id pub-id-type="pmcid">PMC9641655</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Castellví</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Miranda‐Mendizábal</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Parés‐Badell</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Almenara</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Alonso</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Blasco</surname>
              <given-names>MJ</given-names>
            </name>
            <name name-style="western">
              <surname>Cebrià</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Gabilondo</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Gili</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Lagares</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Piqueras</surname>
              <given-names>JA</given-names>
            </name>
            <name name-style="western">
              <surname>Roca</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Rodríguez‐Marín</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Rodríguez‐Jimenez</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Soto‐Sanz</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Alonso</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Exposure to violence, a risk for suicide in youths and young adults. A meta‐analysis of longitudinal studies</article-title>
          <source>Acta Psychiatr Scand</source>
          <year>2016</year>
          <volume>135</volume>
          <issue>3</issue>
          <fpage>195</fpage>
          <lpage>211</lpage>
          <pub-id pub-id-type="doi">10.1111/acps.12679</pub-id>
          <pub-id pub-id-type="medline">27995627</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Irigoyen</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Porras-Segovia</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Galván</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Puigdevall</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Giner</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>De Leon</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Baca-García</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>Predictors of re-attempt in a cohort of suicide attempters: a survival analysis</article-title>
          <source>J Affect Disord</source>
          <year>2019</year>
          <volume>247</volume>
          <fpage>20</fpage>
          <lpage>28</lpage>
          <pub-id pub-id-type="doi">10.1016/j.jad.2018.12.050</pub-id>
          <pub-id pub-id-type="medline">30640026</pub-id>
          <pub-id pub-id-type="pii">S0165-0327(18)31383-1</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hubers</surname>
              <given-names>AAM</given-names>
            </name>
            <name name-style="western">
              <surname>Moaddine</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Peersmann</surname>
              <given-names>SHM</given-names>
            </name>
            <name name-style="western">
              <surname>Stijnen</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>van Duijn</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>van der Mast</surname>
              <given-names>RC</given-names>
            </name>
            <name name-style="western">
              <surname>Dekkers</surname>
              <given-names>OM</given-names>
            </name>
            <name name-style="western">
              <surname>Giltay</surname>
              <given-names>EJ</given-names>
            </name>
          </person-group>
          <article-title>Suicidal ideation and subsequent completed suicide in both psychiatric and non-psychiatric populations: a meta-analysis</article-title>
          <source>Epidemiol Psychiatr Sci</source>
          <year>2018</year>
          <volume>27</volume>
          <issue>2</issue>
          <fpage>186</fpage>
          <lpage>198</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/27989254"/>
          </comment>
          <pub-id pub-id-type="doi">10.1017/S2045796016001049</pub-id>
          <pub-id pub-id-type="medline">27989254</pub-id>
          <pub-id pub-id-type="pii">S2045796016001049</pub-id>
          <pub-id pub-id-type="pmcid">PMC6998965</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Jobes</surname>
              <given-names>DA</given-names>
            </name>
            <name name-style="western">
              <surname>Joiner</surname>
              <given-names>TE</given-names>
            </name>
          </person-group>
          <article-title>Reflections on suicidal ideation</article-title>
          <source>Crisis</source>
          <year>2019</year>
          <volume>40</volume>
          <issue>4</issue>
          <fpage>227</fpage>
          <lpage>230</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://econtent.hogrefe.com/doi/abs/10.1027/0227-5910/a000615?url_ver=Z39.88-2003&amp;rfr_id=ori:rid:crossref.org&amp;rfr_dat=cr_pub%20%200pubmed"/>
          </comment>
          <pub-id pub-id-type="doi">10.1027/0227-5910/a000615</pub-id>
          <pub-id pub-id-type="medline">31274031</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Nock</surname>
              <given-names>MK</given-names>
            </name>
            <name name-style="western">
              <surname>Borges</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Bromet</surname>
              <given-names>EJ</given-names>
            </name>
            <name name-style="western">
              <surname>Cha</surname>
              <given-names>CB</given-names>
            </name>
            <name name-style="western">
              <surname>Kessler</surname>
              <given-names>RC</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Suicide and suicidal behavior</article-title>
          <source>Epidemiol Rev</source>
          <year>2008</year>
          <volume>30</volume>
          <issue>1</issue>
          <fpage>133</fpage>
          <lpage>154</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/18653727"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/epirev/mxn002</pub-id>
          <pub-id pub-id-type="medline">18653727</pub-id>
          <pub-id pub-id-type="pii">mxn002</pub-id>
          <pub-id pub-id-type="pmcid">PMC2576496</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>O'Connor</surname>
              <given-names>RC</given-names>
            </name>
            <name name-style="western">
              <surname>Kirtley</surname>
              <given-names>OJ</given-names>
            </name>
          </person-group>
          <article-title>The integrated motivational-volitional model of suicidal behaviour</article-title>
          <source>Philos Trans R Soc Lond B Biol Sci</source>
          <year>2018</year>
          <volume>373</volume>
          <issue>1754</issue>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://royalsocietypublishing.org/doi/abs/10.1098/rstb.2017.0268?url_ver=Z39.88-2003&amp;rfr_id=ori:rid:crossref.org&amp;rfr_dat=cr_pub%20%200pubmed"/>
          </comment>
          <pub-id pub-id-type="doi">10.1098/rstb.2017.0268</pub-id>
          <pub-id pub-id-type="medline">30012735</pub-id>
          <pub-id pub-id-type="pii">rstb.2017.0268</pub-id>
          <pub-id pub-id-type="pmcid">PMC6053985</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="web">
          <source>Suicide - National Institute of Mental Health (NIMH)</source>
          <access-date>2024-01-20</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.nimh.nih.gov/health/statistics/suicide">https://www.nimh.nih.gov/health/statistics/suicide</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="web">
          <source>Suicide statistics</source>
          <access-date>2024-01-20</access-date>
          <publisher-name>American Foundation for Suicide Prevention</publisher-name>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://afsp.org/suicide-statistics/">https://afsp.org/suicide-statistics/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Simon</surname>
              <given-names>GE</given-names>
            </name>
            <name name-style="western">
              <surname>Rutter</surname>
              <given-names>CM</given-names>
            </name>
            <name name-style="western">
              <surname>Peterson</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Oliver</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Whiteside</surname>
              <given-names>U</given-names>
            </name>
            <name name-style="western">
              <surname>Operskalski</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Ludman</surname>
              <given-names>EJ</given-names>
            </name>
          </person-group>
          <article-title>Does response on the PHQ-9 depression questionnaire predict subsequent suicide attempt or suicide death?</article-title>
          <source>Psychiatr Serv</source>
          <year>2013</year>
          <volume>64</volume>
          <issue>12</issue>
          <fpage>1195</fpage>
          <lpage>1202</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/24036589"/>
          </comment>
          <pub-id pub-id-type="doi">10.1176/appi.ps.201200587</pub-id>
          <pub-id pub-id-type="medline">24036589</pub-id>
          <pub-id pub-id-type="pii">1738338</pub-id>
          <pub-id pub-id-type="pmcid">PMC4086215</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Simon</surname>
              <given-names>GE</given-names>
            </name>
            <name name-style="western">
              <surname>Yarborough</surname>
              <given-names>BJ</given-names>
            </name>
            <name name-style="western">
              <surname>Rossom</surname>
              <given-names>RC</given-names>
            </name>
            <name name-style="western">
              <surname>Lawrence</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Lynch</surname>
              <given-names>FL</given-names>
            </name>
            <name name-style="western">
              <surname>Waitzfelder</surname>
              <given-names>BE</given-names>
            </name>
            <name name-style="western">
              <surname>Ahmedani</surname>
              <given-names>BK</given-names>
            </name>
            <name name-style="western">
              <surname>Shortreed</surname>
              <given-names>SM</given-names>
            </name>
          </person-group>
          <article-title>Self-reported suicidal ideation as a predictor of suicidal behavior among outpatients with diagnoses of psychotic disorders</article-title>
          <source>Psychiatr Serv</source>
          <year>2019</year>
          <volume>70</volume>
          <issue>3</issue>
          <fpage>176</fpage>
          <lpage>183</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/30526341"/>
          </comment>
          <pub-id pub-id-type="doi">10.1176/appi.ps.201800381</pub-id>
          <pub-id pub-id-type="medline">30526341</pub-id>
          <pub-id pub-id-type="pmcid">PMC6520048</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ursano</surname>
              <given-names>RJ</given-names>
            </name>
            <name name-style="western">
              <surname>Heeringa</surname>
              <given-names>SG</given-names>
            </name>
            <name name-style="western">
              <surname>Stein</surname>
              <given-names>MB</given-names>
            </name>
            <name name-style="western">
              <surname>Jain</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Raman</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Sun</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Chiu</surname>
              <given-names>WT</given-names>
            </name>
            <name name-style="western">
              <surname>Colpe</surname>
              <given-names>LJ</given-names>
            </name>
            <name name-style="western">
              <surname>Fullerton</surname>
              <given-names>CS</given-names>
            </name>
            <name name-style="western">
              <surname>Gilman</surname>
              <given-names>SE</given-names>
            </name>
            <name name-style="western">
              <surname>Hwang</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Naifeh</surname>
              <given-names>JA</given-names>
            </name>
            <name name-style="western">
              <surname>Nock</surname>
              <given-names>MK</given-names>
            </name>
            <name name-style="western">
              <surname>Rosellini</surname>
              <given-names>AJ</given-names>
            </name>
            <name name-style="western">
              <surname>Sampson</surname>
              <given-names>NA</given-names>
            </name>
            <name name-style="western">
              <surname>Schoenbaum</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Zaslavsky</surname>
              <given-names>AM</given-names>
            </name>
            <name name-style="western">
              <surname>Kessler</surname>
              <given-names>RC</given-names>
            </name>
          </person-group>
          <article-title>Prevalence and correlates of suicidal behavior among new soldiers in the US Army: results from the army study to assess risk and resilience in service members (Army STARRS)</article-title>
          <source>Depress Anxiety</source>
          <year>2015</year>
          <month>01</month>
          <volume>32</volume>
          <issue>1</issue>
          <fpage>3</fpage>
          <lpage>12</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://hdl.handle.net/2027.42/110590"/>
          </comment>
          <pub-id pub-id-type="doi">10.1002/da.22317</pub-id>
          <pub-id pub-id-type="medline">25338964</pub-id>
          <pub-id pub-id-type="pmcid">PMC5113817</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rossom</surname>
              <given-names>RC</given-names>
            </name>
            <name name-style="western">
              <surname>Coleman</surname>
              <given-names>KJ</given-names>
            </name>
            <name name-style="western">
              <surname>Ahmedani</surname>
              <given-names>BK</given-names>
            </name>
            <name name-style="western">
              <surname>Beck</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Johnson</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Oliver</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Simon</surname>
              <given-names>GE</given-names>
            </name>
          </person-group>
          <article-title>Suicidal ideation reported on the PHQ9 and risk of suicidal behavior across age groups</article-title>
          <source>J Affect Disord</source>
          <year>2017</year>
          <volume>215</volume>
          <fpage>77</fpage>
          <lpage>84</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/28319695"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jad.2017.03.037</pub-id>
          <pub-id pub-id-type="medline">28319695</pub-id>
          <pub-id pub-id-type="pii">S0165-0327(16)31768-2</pub-id>
          <pub-id pub-id-type="pmcid">PMC5412508</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Stone</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Laughren</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Jones</surname>
              <given-names>ML</given-names>
            </name>
            <name name-style="western">
              <surname>Levenson</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Holland</surname>
              <given-names>PC</given-names>
            </name>
            <name name-style="western">
              <surname>Hughes</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Hammad</surname>
              <given-names>TA</given-names>
            </name>
            <name name-style="western">
              <surname>Temple</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Rochester</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Risk of suicidality in clinical trials of antidepressants in adults: analysis of proprietary data submitted to US Food and Drug Administration</article-title>
          <source>BMJ</source>
          <year>2009</year>
          <volume>339</volume>
          <fpage>b2880</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/19671933"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/bmj.b2880</pub-id>
          <pub-id pub-id-type="medline">19671933</pub-id>
          <pub-id pub-id-type="pii">bmj.b2880</pub-id>
          <pub-id pub-id-type="pmcid">PMC2725270</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Carson</surname>
              <given-names>NJ</given-names>
            </name>
            <name name-style="western">
              <surname>Mullin</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Sanchez</surname>
              <given-names>MJ</given-names>
            </name>
            <name name-style="western">
              <surname>Lu</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Menezes</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Cook</surname>
              <given-names>BL</given-names>
            </name>
          </person-group>
          <article-title>Identification of suicidal behavior among psychiatrically hospitalized adolescents using natural language processing and machine learning of electronic health records</article-title>
          <source>PLoS One</source>
          <year>2019</year>
          <volume>14</volume>
          <issue>2</issue>
          <fpage>e0211116</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dx.plos.org/10.1371/journal.pone.0211116"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pone.0211116</pub-id>
          <pub-id pub-id-type="medline">30779800</pub-id>
          <pub-id pub-id-type="pii">PONE-D-18-15627</pub-id>
          <pub-id pub-id-type="pmcid">PMC6380543</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Arowosegbe</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Oyelade</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>Application of natural language processing (NLP) in detecting and preventing suicide ideation: a systematic review</article-title>
          <source>Int J Environ Res Public Health</source>
          <year>2023</year>
          <volume>20</volume>
          <issue>2</issue>
          <fpage>1514</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.mdpi.com/resolver?pii=ijerph20021514"/>
          </comment>
          <pub-id pub-id-type="doi">10.3390/ijerph20021514</pub-id>
          <pub-id pub-id-type="medline">36674270</pub-id>
          <pub-id pub-id-type="pii">ijerph20021514</pub-id>
          <pub-id pub-id-type="pmcid">PMC9859480</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Swaminathan</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>López</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Mar</surname>
              <given-names>RAG</given-names>
            </name>
            <name name-style="western">
              <surname>Heist</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>McClintock</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Caoili</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Grace</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Rubashkin</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Boggs</surname>
              <given-names>MN</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>JH</given-names>
            </name>
            <name name-style="western">
              <surname>Gevaert</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Mou</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Nock</surname>
              <given-names>MK</given-names>
            </name>
          </person-group>
          <article-title>Natural language processing system for rapid detection and intervention of mental health crisis chat messages</article-title>
          <source>NPJ Digit Med</source>
          <year>2023</year>
          <volume>6</volume>
          <issue>1</issue>
          <fpage>213</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/s41746-023-00951-3"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41746-023-00951-3</pub-id>
          <pub-id pub-id-type="medline">37990134</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41746-023-00951-3</pub-id>
          <pub-id pub-id-type="pmcid">PMC10663535</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Singhal</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Azizi</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Tu</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Mahdavi</surname>
              <given-names>SS</given-names>
            </name>
            <name name-style="western">
              <surname>Wei</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Chung</surname>
              <given-names>HW</given-names>
            </name>
            <name name-style="western">
              <surname>Scales</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Tanwani</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Cole-Lewis</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Pfohl</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Payne</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Seneviratne</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Gamble</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Kelly</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Babiker</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Schärli</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Chowdhery</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Mansfield</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Demner-Fushman</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Agüera Y Arcas</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Webster</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Corrado</surname>
              <given-names>GS</given-names>
            </name>
            <name name-style="western">
              <surname>Matias</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Chou</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Gottweis</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Tomasev</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Rajkomar</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Barral</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Semturs</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Karthikesalingam</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Natarajan</surname>
              <given-names>V</given-names>
            </name>
          </person-group>
          <article-title>Large language models encode clinical knowledge</article-title>
          <source>Nature</source>
          <year>2023</year>
          <month>08</month>
          <volume>620</volume>
          <issue>7972</issue>
          <fpage>172</fpage>
          <lpage>180</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/37438534"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41586-023-06291-2</pub-id>
          <pub-id pub-id-type="medline">37438534</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41586-023-06291-2</pub-id>
          <pub-id pub-id-type="pmcid">PMC10396962</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Nori</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Carignan</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Edgar</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Fusi</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>King</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Larson</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Luo</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>McKinney</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Ness</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Poon</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Qin</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Usuyama</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>White</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Horvitz</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <source>Can generalist foundation models outcompete special-purpose tuning? Case study in medicine</source>
          <access-date>2023-12-04</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://arxiv.org/abs/2311.16452">http://arxiv.org/abs/2311.16452</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Galatzer-Levy</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>McDuff</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Natarajan</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Karthikesalingam</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>The capability of large language models to measure psychiatric functioning</article-title>
          <comment>Preprint posted online on August 3, 2023</comment>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/abs/2308.01834"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <collab>OpenAI</collab>
          </person-group>
          <article-title>GPT-4 technical report</article-title>
          <comment>Preprint posted online on March 15, 2023</comment>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/abs/2303.08774"/>
          </comment>
          <pub-id pub-id-type="doi">10.48550/ARXIV.2303.08774</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Abraham</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Pedregosa</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Eickenberg</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Gervais</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Mueller</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Kossaifi</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Gramfort</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Thirion</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Varoquaux</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Machine learning for neuroimaging with scikit-learn</article-title>
          <source>Front Neuroinform</source>
          <year>2014</year>
          <volume>8</volume>
          <fpage>14</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/24600388"/>
          </comment>
          <pub-id pub-id-type="doi">10.3389/fninf.2014.00014</pub-id>
          <pub-id pub-id-type="medline">24600388</pub-id>
          <pub-id pub-id-type="pmcid">PMC3930868</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>O'Callaghan</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Sullivan</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Gupta</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Belanger</surname>
              <given-names>HG</given-names>
            </name>
            <name name-style="western">
              <surname>Winsberg</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Feasibility and acceptability of a novel telepsychiatry-delivered precision prescribing intervention for anxiety and depression</article-title>
          <source>BMC Psychiatry</source>
          <year>2022</year>
          <volume>22</volume>
          <issue>1</issue>
          <fpage>483</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcpsychiatry.biomedcentral.com/articles/10.1186/s12888-022-04113-9"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12888-022-04113-9</pub-id>
          <pub-id pub-id-type="medline">35854281</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12888-022-04113-9</pub-id>
          <pub-id pub-id-type="pmcid">PMC9297585</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ray</surname>
              <given-names>PP</given-names>
            </name>
          </person-group>
          <article-title>ChatGPT: a comprehensive review on background, applications, key challenges, bias, ethics, limitations and future scope</article-title>
          <source>Internet of Things and Cyber-Physical Systems</source>
          <year>2023</year>
          <volume>3</volume>
          <fpage>121</fpage>
          <lpage>154</lpage>
          <pub-id pub-id-type="doi">10.1016/j.iotcps.2023.04.003</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Timmons</surname>
              <given-names>AC</given-names>
            </name>
            <name name-style="western">
              <surname>Duong</surname>
              <given-names>JB</given-names>
            </name>
            <name name-style="western">
              <surname>Simo Fiallo</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Vo</surname>
              <given-names>HPQ</given-names>
            </name>
            <name name-style="western">
              <surname>Ahle</surname>
              <given-names>MW</given-names>
            </name>
            <name name-style="western">
              <surname>Comer</surname>
              <given-names>JS</given-names>
            </name>
            <name name-style="western">
              <surname>Brewer</surname>
              <given-names>LC</given-names>
            </name>
            <name name-style="western">
              <surname>Frazier</surname>
              <given-names>SL</given-names>
            </name>
            <name name-style="western">
              <surname>Chaspari</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>A call to action on assessing and mitigating bias in artificial intelligence applications for mental health</article-title>
          <source>Perspect Psychol Sci</source>
          <year>2023</year>
          <volume>18</volume>
          <issue>5</issue>
          <fpage>1062</fpage>
          <lpage>1096</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/36490369"/>
          </comment>
          <pub-id pub-id-type="doi">10.1177/17456916221134490</pub-id>
          <pub-id pub-id-type="medline">36490369</pub-id>
          <pub-id pub-id-type="pmcid">PMC10250563</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Diaz-Asper</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Hauglid</surname>
              <given-names>MK</given-names>
            </name>
            <name name-style="western">
              <surname>Chandler</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Cohen</surname>
              <given-names>AS</given-names>
            </name>
            <name name-style="western">
              <surname>Foltz</surname>
              <given-names>PW</given-names>
            </name>
            <name name-style="western">
              <surname>Elvevåg</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>A framework for language technologies in behavioral research and clinical applications: ethical challenges, implications, and solutions</article-title>
          <source>Am Psychol</source>
          <year>2024</year>
          <volume>79</volume>
          <issue>1</issue>
          <fpage>79</fpage>
          <lpage>91</lpage>
          <pub-id pub-id-type="doi">10.1037/amp0001195</pub-id>
          <pub-id pub-id-type="medline">38236217</pub-id>
          <pub-id pub-id-type="pii">2024-44313-007</pub-id>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
