<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMH</journal-id>
      <journal-id journal-id-type="nlm-ta">JMIR Ment Health</journal-id>
      <journal-title>JMIR Mental Health</journal-title>
      <issn pub-type="epub">2368-7959</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v9i1e24699</article-id>
      <article-id pub-id-type="pmid">35072648</article-id>
      <article-id pub-id-type="doi">10.2196/24699</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Acoustic and Facial Features From Clinical Interviews for Machine Learning–Based Psychiatric Diagnosis: Algorithm Development</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Torous</surname>
            <given-names>John</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Hudon</surname>
            <given-names>Alexandre</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Hidalgo-Mazzei</surname>
            <given-names>Diego</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Fulford</surname>
            <given-names>Daniel</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Wright</surname>
            <given-names>Abigail</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author" corresp="yes" equal-contrib="yes">
          <name name-style="western">
            <surname>Birnbaum</surname>
            <given-names>Michael L</given-names>
          </name>
          <degrees>MD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <address>
            <institution>Department of Psychiatry</institution>
            <institution>The Zucker Hillside Hospital</institution>
            <institution>Northwell Health</institution>
            <addr-line>75-59 263rd St</addr-line>
            <addr-line>Glen Oaks, NY, 11004</addr-line>
            <country>United States</country>
            <phone>1 7184708305</phone>
            <email>mbirnbaum@northwell.edu</email>
          </address>
          <xref rid="aff2" ref-type="aff">2</xref>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-4285-7868</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Abrami</surname>
            <given-names>Avner</given-names>
          </name>
          <degrees>MSc</degrees>
          <xref rid="aff4" ref-type="aff">4</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-3387-5607</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author">
          <name name-style="western">
            <surname>Heisig</surname>
            <given-names>Stephen</given-names>
          </name>
          <degrees>BSc</degrees>
          <xref rid="aff5" ref-type="aff">5</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-8096-1730</ext-link>
        </contrib>
        <contrib id="contrib4" contrib-type="author">
          <name name-style="western">
            <surname>Ali</surname>
            <given-names>Asra</given-names>
          </name>
          <degrees>MA</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-8552-330X</ext-link>
        </contrib>
        <contrib id="contrib5" contrib-type="author">
          <name name-style="western">
            <surname>Arenare</surname>
            <given-names>Elizabeth</given-names>
          </name>
          <degrees>BA</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-0911-3207</ext-link>
        </contrib>
        <contrib id="contrib6" contrib-type="author">
          <name name-style="western">
            <surname>Agurto</surname>
            <given-names>Carla</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff4" ref-type="aff">4</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-0617-4488</ext-link>
        </contrib>
        <contrib id="contrib7" contrib-type="author">
          <name name-style="western">
            <surname>Lu</surname>
            <given-names>Nathaniel</given-names>
          </name>
          <degrees>MA</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-9695-2249</ext-link>
        </contrib>
        <contrib id="contrib8" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Kane</surname>
            <given-names>John M</given-names>
          </name>
          <degrees>MD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff2" ref-type="aff">2</xref>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-2628-9442</ext-link>
        </contrib>
        <contrib id="contrib9" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Cecchi</surname>
            <given-names>Guillermo</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff4" ref-type="aff">4</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-1013-8348</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>Department of Psychiatry</institution>
        <institution>The Zucker Hillside Hospital</institution>
        <institution>Northwell Health</institution>
        <addr-line>Glen Oaks, NY</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff2">
        <label>2</label>
        <institution>The Feinstein Institute for Medical Research</institution>
        <institution>Northwell Health</institution>
        <addr-line>Manhasset, NY</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff3">
        <label>3</label>
        <institution>The Donald and Barbara Zucker School of Medicine at Hofstra/Northwell</institution>
        <addr-line>Hempstead, NY</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff4">
        <label>4</label>
        <institution>Computational Biology Center</institution>
        <institution>IBM Research</institution>
        <addr-line>Yorktown Heights, NY</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff5">
        <label>5</label>
        <institution>Icahn School of Medicine at Mount Sinai</institution>
        <addr-line>New York City, NY</addr-line>
        <country>United States</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Michael L Birnbaum <email>mbirnbaum@northwell.edu</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <month>1</month>
        <year>2022</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>24</day>
        <month>1</month>
        <year>2022</year>
      </pub-date>
      <volume>9</volume>
      <issue>1</issue>
      <elocation-id>e24699</elocation-id>
      <history>
        <date date-type="received">
          <day>1</day>
          <month>10</month>
          <year>2020</year>
        </date>
        <date date-type="rev-request">
          <day>14</day>
          <month>11</month>
          <year>2020</year>
        </date>
        <date date-type="rev-recd">
          <day>29</day>
          <month>4</month>
          <year>2021</year>
        </date>
        <date date-type="accepted">
          <day>1</day>
          <month>12</month>
          <year>2021</year>
        </date>
      </history>
      <copyright-statement>©Michael L Birnbaum, Avner Abrami, Stephen Heisig, Asra Ali, Elizabeth Arenare, Carla Agurto, Nathaniel Lu, John M Kane, Guillermo Cecchi. Originally published in JMIR Mental Health (https://mental.jmir.org), 24.01.2022.</copyright-statement>
      <copyright-year>2022</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Mental Health, is properly cited. The complete bibliographic information, a link to the original publication on https://mental.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://mental.jmir.org/2022/1/e24699" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>In contrast to all other areas of medicine, psychiatry is still nearly entirely reliant on subjective assessments such as patient self-report and clinical observation. The lack of objective information on which to base clinical decisions can contribute to reduced quality of care. Behavioral health clinicians need objective and reliable patient data to support effective targeted interventions.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>We aimed to investigate whether reliable inferences—psychiatric signs, symptoms, and diagnoses—can be extracted from audiovisual patterns in recorded evaluation interviews of participants with schizophrenia spectrum disorders and bipolar disorder.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>We obtained audiovisual data from 89 participants (mean age 25.3 years; male: 48/89, 53.9%; female: 41/89, 46.1%): individuals with schizophrenia spectrum disorders (n=41), individuals with bipolar disorder (n=21), and healthy volunteers (n=27). We developed machine learning models based on acoustic and facial movement features extracted from participant interviews to predict diagnoses and detect clinician-coded neuropsychiatric symptoms, and we assessed model performance using area under the receiver operating characteristic curve (AUROC) in 5-fold cross-validation.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>The model successfully differentiated between schizophrenia spectrum disorders and bipolar disorder (AUROC 0.73) when aggregating face and voice features. Facial action units including cheek-raising muscle (AUROC 0.64) and chin-raising muscle (AUROC 0.74) provided the strongest signal for men. Vocal features, such as energy in the frequency band 1 to 4 kHz (AUROC 0.80) and spectral harmonicity (AUROC 0.78), provided the strongest signal for women. Lip corner–pulling muscle signal discriminated between diagnoses for both men (AUROC 0.61) and women (AUROC 0.62). Several psychiatric signs and symptoms were successfully inferred: blunted affect (AUROC 0.81), avolition (AUROC 0.72), lack of vocal inflection (AUROC 0.71), asociality (AUROC 0.63), and worthlessness (AUROC 0.61).</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>This study represents advancement in efforts to capitalize on digital data to improve diagnostic assessment and supports the development of a new generation of innovative clinical tools by employing acoustic and facial data analysis.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>audiovisual patterns</kwd>
        <kwd>speech analysis</kwd>
        <kwd>facial analysis</kwd>
        <kwd>psychiatry</kwd>
        <kwd>schizophrenia spectrum disorders</kwd>
        <kwd>bipolar disorder</kwd>
        <kwd>symptom prediction</kwd>
        <kwd>diagnostic prediction</kwd>
        <kwd>machine learning</kwd>
        <kwd>audiovisual</kwd>
        <kwd>speech</kwd>
        <kwd>schizophrenia</kwd>
        <kwd>spectrum disorders</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <p>Approximately 20% of individuals aged 15 years and older experience psychiatric illness annually [<xref ref-type="bibr" rid="ref1">1</xref>-<xref ref-type="bibr" rid="ref3">3</xref>]. Psychiatrists may see as many as 8 patients hourly and are often unable to obtain the detailed information necessary to make effective, evidence-based, and personalized clinical decisions [<xref ref-type="bibr" rid="ref4">4</xref>-<xref ref-type="bibr" rid="ref6">6</xref>]. In contrast to all other areas of medicine, psychiatry is still nearly entirely reliant on subjective assessments such as patient self-report and clinical observation [<xref ref-type="bibr" rid="ref7">7</xref>,<xref ref-type="bibr" rid="ref8">8</xref>]. There are few valid and reliable tests, biomarkers, and objective sources of collateral information available to support diagnostic procedures and assess health status. The lack of objective information on which to base clinical decisions can contribute to reduced quality of care, underrecognized signs and symptoms, and poorer treatment outcomes, including higher dropout rates, reduced medication adherence, and persistent substance abuse [<xref ref-type="bibr" rid="ref9">9</xref>,<xref ref-type="bibr" rid="ref10">10</xref>]. Behavioral health clinicians need access to objective and reliable, easily collected, and interpretable patient data to enable quick, effective, and targeted interventions [<xref ref-type="bibr" rid="ref11">11</xref>,<xref ref-type="bibr" rid="ref12">12</xref>].</p>
      <p>In recent years, progress has been made in audiovisual data processing [<xref ref-type="bibr" rid="ref13">13</xref>-<xref ref-type="bibr" rid="ref21">21</xref>]. Advances in this technology could play a pivotal role in supporting automated methods of collecting objective adjunctive patient data to inform diagnostic procedures, psychiatric symptom identification, and psychiatric symptom monitoring. Speech analysis, in particular, has been studied [<xref ref-type="bibr" rid="ref22">22</xref>-<xref ref-type="bibr" rid="ref36">36</xref>] because changes in both the content and acoustic properties of speech are known to be associated with several psychiatric conditions: disorganized speech in schizophrenia, pressured speech in mania, and slowed speech in depression [<xref ref-type="bibr" rid="ref7">7</xref>]. Moreover, speech represents a universal, easily extracted, and clinically meaningful biological process and is therefore well positioned to serve as an objective marker of psychiatric illness [<xref ref-type="bibr" rid="ref27">27</xref>]. Prior research has demonstrated the potential for the use of speech properties to distinguish between individuals with and without a variety of psychiatric disorders with high degrees of accuracy [<xref ref-type="bibr" rid="ref22">22</xref>-<xref ref-type="bibr" rid="ref36">36</xref>]. Acoustic analysis, for instance, has demonstrated that participants with schizophrenia tend to exhibit less total time talking, reduced speech rate, and higher pause duration [<xref ref-type="bibr" rid="ref23">23</xref>,<xref ref-type="bibr" rid="ref27">27</xref>,<xref ref-type="bibr" rid="ref33">33</xref>-<xref ref-type="bibr" rid="ref40">40</xref>] than healthy participants and that participants with bipolar disorder demonstrate increases in tonality [<xref ref-type="bibr" rid="ref41">41</xref>-<xref ref-type="bibr" rid="ref43">43</xref>].</p>
      <p>Concurrently, alterations in facial expressivity accompany several psychiatric illnesses: flat or inappropriate affect in individuals with schizophrenia, euphoric or labile affect in mania, and slowed or diminished facial movements in depression [<xref ref-type="bibr" rid="ref7">7</xref>]. Video analysis has accordingly emerged as a potentially objective and reliable method for capturing subtle head, face, and eye movements with greater precision than by clinical observation alone [<xref ref-type="bibr" rid="ref16">16</xref>,<xref ref-type="bibr" rid="ref44">44</xref>-<xref ref-type="bibr" rid="ref46">46</xref>]. Alterations in facial expressivity have demonstrated success in predicting the presence of various psychiatric illnesses including schizophrenia spectrum disorders [<xref ref-type="bibr" rid="ref47">47</xref>-<xref ref-type="bibr" rid="ref49">49</xref>], mood disorders [<xref ref-type="bibr" rid="ref49">49</xref>-<xref ref-type="bibr" rid="ref51">51</xref>], and autism spectrum disorders [<xref ref-type="bibr" rid="ref48">48</xref>].</p>
      <p>Audiovisual patterns represent easily extractable, naturalistic, universal, and objective data that could serve as viable digital biomarkers in psychiatry, contributing adjunctive information about a patient, beyond what can be assessed solely through traditional means. No study, to the best of our knowledge, has explored the potential for using audiovisual data to discriminate between a diagnosis of schizophrenia or bipolar disorder, a task which can be challenging for behavioral health clinicians given significant symptom overlap [<xref ref-type="bibr" rid="ref52">52</xref>,<xref ref-type="bibr" rid="ref53">53</xref>], especially during the early course of illness development. Additionally, few studies [<xref ref-type="bibr" rid="ref19">19</xref>,<xref ref-type="bibr" rid="ref54">54</xref>] have explored the relationship between audiovisual data and psychiatric symptoms, commonly used as primary outcome measures, to more efficiently and more effectively identify the presence of a specific psychiatric sign or symptom. Furthermore, research thus far has largely explored individual data sources in isolation [<xref ref-type="bibr" rid="ref19">19</xref>,<xref ref-type="bibr" rid="ref20">20</xref>]; however, advancing this critical work will now require integrating multiple streams of digital data.</p>
      <p>We aimed to differentiate between schizophrenia spectrum disorders and bipolar disorder using audiovisual data alone. We hypothesized that physiological data from voice acoustics and facial action units could be used to distinguish between individuals with schizophrenia spectrum disorders and individuals with bipolar disorder and that these signals would be associated with specific psychiatric signs and symptoms.</p>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Recruitment</title>
        <p>Participants between the ages of 15 and 35 years old diagnosed with schizophrenia spectrum disorders or bipolar disorder were recruited from Northwell Health Zucker Hillside Hospital’s inpatient and outpatient psychiatric departments. Diagnoses were based on clinical assessment of the most recent episode and were extracted from each participant’s medical record at the time of consent. Most participants with schizophrenia spectrum disorders were recruited from the Early Treatment Program, which is a specialized outpatient early psychosis intervention clinic. Individuals with psychiatric comorbidities (such as substance use disorders) were included. Participants with known physical impairments (such as paralysis or severe laryngitis) capable of impacting facial movements or acoustic capabilities were excluded. Eligible participants were recruited by a research staff member. Healthy volunteers who had already been screened for prior studies were also recruited. Recruitment occurred between September 2018 and July 2019. The study was approved by the institutional review board (18-0137) of Northwell Health. Written informed consent was obtained from adult participants and legal guardians of participants under 18 years. Assent was obtained from minors. All participants received treatment as usual.</p>
      </sec>
      <sec>
        <title>Interviews</title>
        <p>Participants were assessed at baseline and invited to return for optional quarterly assessments thereafter for a maximum of 12 months. Healthy volunteers were assessed at baseline and invited to return for optional assessments at month 6 and month 12. At each visit, all participants, including healthy volunteers, were interviewed by a trained and reliable research rater utilizing the Brief Psychiatric Rating Scale (BPRS) [<xref ref-type="bibr" rid="ref55">55</xref>], Scale for the Assessment of Negative Symptoms (SANS) [<xref ref-type="bibr" rid="ref56">56</xref>], Hamilton Depression Rating Scale (HAMD) [<xref ref-type="bibr" rid="ref57">57</xref>], and Young Mania Rating Scale (YMRS) [<xref ref-type="bibr" rid="ref58">58</xref>]. In addition, at each visit, participants were asked a series of 5 emotionally neutral, open-ended questions designed to encourage speech production. For example, participants were asked to describe a typical dinner, discuss a television show or movie that they had watched, or talk about a current or prior pet. Participants were instructed to talk freely and prompted to continue to talk as much as they liked for each response. Similar methods for speech extraction have been successfully implemented in prior research [<xref ref-type="bibr" rid="ref34">34</xref>]. Both the participant and the interviewer wore headsets with microphones connected to a 2 by 2 amplifier (TASCAM) to record audio. Video was recorded with an iPad Pro (Apple Inc) focused on participants’ facial expressions.</p>
        <p>Raw data were stored in a firewalled server and were never shared outside of Northwell Health. The processing of high-level features was implemented locally, and only those features were used for further analysis outside the raw data server. High-level feature data remained within Health Insurance Portability and Accountability Act–compliant servers.</p>
      </sec>
      <sec>
        <title>Data Preprocessing</title>
        <p>Before extracting acoustic features, saturation, if present, was removed by identifying time points with amplitudes higher than 99.99% of the maximum value. Given that recordings involved the use of two audio channels (one each for the participant and the interviewer), we extracted only the participant’s voice.</p>
        <p>Acoustic features were extracted using the OpenSMILE open-source toolbox [<xref ref-type="bibr" rid="ref59">59</xref>]. We used a predefined feature set [<xref ref-type="bibr" rid="ref60">60</xref>] for low-level descriptors. This configuration encompasses 150 features, which were computed with a fixed window size (ie, mel-frequency cepstral coefficients: 25 ms) but with a sampling interval of 10 ms (<xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>).</p>
        <p>For facial features, we used openFace software [<xref ref-type="bibr" rid="ref61">61</xref>]. This tool detects the presence and intensity of 18 facial expressions called action units (<xref ref-type="supplementary-material" rid="app2">Multimedia Appendix 2</xref>). The video sampling rate was 30 Hz.</p>
        <p>Both facial action units and acoustic time series were downsampled to 10 Hz (by taking the average value in each consecutive 0.1-second window) and aligned. We then fragmented each interview into consecutive 1.5-minute blocks. In each block, we derived 2 sets of aggregate features (one that was computed when the participant was listening, the other while speaking) to help ensure that the silence between answers did not have an effect on acoustic feature values and that the dynamics of facial action units in both conditions were captured by the models. Mean value and standard deviation were computed for each feature and for each 1.5-minute block. For better classification generalization and to reduce overfitting, we augmented each interview 25 times by selecting only 1 out of 2 consecutive blocks randomly for each block in the sequence.</p>
      </sec>
      <sec>
        <title>Classification Tasks</title>
        <p>We explored 2 main classification tasks: differential diagnosis, assigning an interview as belonging to a specific group (either schizophrenia spectrum disorders or bipolar disorder) based purely on physiological patterns, and symptom detection, predicting the presence of a psychiatric sign or symptom. In total, 75 classification tasks were run, each corresponding to 1 of the 75 unique psychiatric signs and symptoms assessed with the BPRS (18 items), SANS (22 items), YMRS (11 items), and HAMD (24 items). For each classification task, participants were assigned to the positive class if their symptom score exceeded the clinical threshold of at least mild severity: score ≥3 on BPRS items (range 1-7), score ≥2 on SANS items (range 0-5), score ≥2 or ≥4 on YMRS items (with ranges 0-4 and 0-8, respectively), and score ≥2 or ≥1 on HAMD items (with ranges 0-4 and 0-2, respectively). Total scores could range from 18 to 126 for the BPRS, 0 to 110 for the SANS, 0 to 60 for the YMRS, and 0 to 76 for the HAMD.</p>
        <p>For each classification task, we computed 2 independent models, one for men and one for women. This was done to prevent possible sex-specific physiological confounds in voice and face from impacting the results, as the bipolar disorder group was composed of a majority of women. Additionally, we aimed to build models that were not individual-dependent.</p>
        <p>All inferences were undertaken using a gradient boosting classifier [<xref ref-type="bibr" rid="ref62">62</xref>] (Python; Scikit-learn library [<xref ref-type="bibr" rid="ref63">63</xref>]) (fixed seed 0, deviance loss, 0.1 learning rate, 100 weak learners, with 10% of all samples selected randomly used for fitting the individual base learners). All inferences were run in stratified 5-fold cross-validation (participants were divided into 5 nonoverlapping groups, and each group was used once as a validation set, while the 4 remaining groups formed the training set). Only the most predictive features—those achieving a leave-one-out area under the receiver operating characteristic curve (AUROC) greater than 0.6 on the training set of each fold—were used by the gradient boosting classifier.</p>
        <p>Finally, we ensured that each group (both in the positive and negative class) had similar average interview durations. We removed the final few minutes from the end of the lengthier interviews (corresponding to the difference between the average length in each class) to ensure that interview duration was not a confounding factor in classification performance, because longer interviews would provide greater statistical sampling of the features.</p>
      </sec>
      <sec>
        <title>Aggregating Different Modalities</title>
        <p>We investigated 3 different models including a Face model (all relevant facial action unit features), a Voice model (all relevant acoustic features), and a Face–Voice model, which was constructed by averaging the probability outputs of the Face model and the Voice model. For each inference, 5-fold AUROC, accuracy, accuracy chance (the accuracy one would get by randomly attributing the classes), and F scores (for both classes of the classification) were calculated. A threshold of 0.5 was used to compute accuracy and F scores. To rank features (to assess which ones were most predictive), we used a 5-fold AUROC for each feature sequence alone. We report the most successful models per modality (voice alone, face alone, or combined voice and face).</p>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>General</title>
        <p>In total, 89 participants (mean age 25.3 years; male: 48/89, 53.9%; female: 41/89, 46.1%) with schizophrenia spectrum disorders (n=41), bipolar disorder (n=21), and healthy volunteers (n=27) were included (<xref ref-type="table" rid="table1">Table 1</xref>), resulting in 146 interviews (mean 1.64, SD 0.84 interviews per participant). Total scores (representing aggregate scores from individual items) indicated that participants were predominantly in remission at the time of the assessments (<xref ref-type="table" rid="table2">Table 2</xref>); however, several participants scored moderate or severe on 1 or more items in the BPRS (schizophrenia spectrum disorders: 22/41, 54%; bipolar disorder: 8/21, 38%), SANS (schizophrenia spectrum disorders: 33/41, 80%; bipolar disorder: 14/21, 67%), YMRS (schizophrenia spectrum disorders: 18/41, 44%; bipolar disorder: 8/21, 38%), and HAMD (schizophrenia spectrum disorders: 32/41, 78%; bipolar disorder: 10/21, 48%). Participant assessments, including speech extraction and symptom rating scales, lasted a mean duration of 27 minutes (SD 11).</p>
        <table-wrap position="float" id="table1">
          <label>Table 1</label>
          <caption>
            <p>Demographic and clinical characteristics.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="180"/>
            <col width="0"/>
            <col width="280"/>
            <col width="0"/>
            <col width="170"/>
            <col width="0"/>
            <col width="190"/>
            <col width="0"/>
            <col width="150"/>
            <thead>
              <tr valign="top">
                <td colspan="3">Characteristic</td>
                <td colspan="2">Schizophrenia spectrum disorders (n=41)</td>
                <td colspan="2">Bipolar disorder (n=21)</td>
                <td colspan="2">Healthy volunteers (n=27)</td>
                <td>Full sample (n=89)</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="3">Age (in years), mean (SD)</td>
                <td colspan="2">23.7 (3.97)</td>
                <td colspan="2">25.3 (4.24)</td>
                <td colspan="2">28.5 (5.15)</td>
                <td>25.5 (4.83)</td>
              </tr>
              <tr valign="top">
                <td colspan="3">
                  <bold>Sex, n (%)</bold>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Male</td>
                <td colspan="2">29 (71)</td>
                <td colspan="2">7 (33)</td>
                <td colspan="2">12 (44)</td>
                <td colspan="2">48 (54)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Female</td>
                <td colspan="2">12 (29)</td>
                <td colspan="2">14 (67)</td>
                <td colspan="2">15 (56)</td>
                <td colspan="2">41 (46)</td>
              </tr>
              <tr valign="top">
                <td colspan="3">
                  <bold>Race/ethnicity, n (%)</bold>
                </td>
                <td colspan="2"/>
                <td colspan="2"/>
                <td colspan="2"/>
                <td/>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>African American/Black</td>
                <td colspan="2">24 (58)</td>
                <td colspan="2">3 (14)</td>
                <td colspan="2">8 (30)</td>
                <td colspan="2">35 (39)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Asian</td>
                <td colspan="2">6 (15)</td>
                <td colspan="2">4 (19)</td>
                <td colspan="2">6 (22)</td>
                <td colspan="2">16 (18)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Caucasian</td>
                <td colspan="2">10 (24)</td>
                <td colspan="2">9 (43)</td>
                <td colspan="2">10 (37)</td>
                <td colspan="2">29 (33)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Mixed race/other</td>
                <td colspan="2">1 (2)</td>
                <td colspan="2">5 (24)</td>
                <td colspan="2">2 (7)</td>
                <td colspan="2">8 (9)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Pacific Islander</td>
                <td colspan="2">0 (0)</td>
                <td colspan="2">0 (0)</td>
                <td colspan="2">1 (4)</td>
                <td colspan="2">1 (1)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Hispanic</td>
                <td colspan="2">5 (12)</td>
                <td colspan="2">3 (14)</td>
                <td colspan="2">1 (4)</td>
                <td colspan="2">9 (10)</td>
              </tr>
              <tr valign="top">
                <td colspan="3">
                  <bold>Diagnosis (most recent episode), n (%)</bold>
                </td>
                <td colspan="2"/>
                <td colspan="2"/>
                <td colspan="2"/>
                <td/>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Schizophrenia</td>
                <td colspan="2">19 (46)</td>
                <td colspan="2">N/A<sup>a</sup></td>
                <td colspan="2">N/A</td>
                <td colspan="2">19 (21)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Schizophreniform</td>
                <td colspan="2">10 (24)</td>
                <td colspan="2">N/A</td>
                <td colspan="2">N/A</td>
                <td colspan="2">10 (11)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Schizoaffective</td>
                <td colspan="2">7 (17)</td>
                <td colspan="2">N/A</td>
                <td colspan="2">N/A</td>
                <td colspan="2">7 (8)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Unspecified schizophrenia spectrum disorders</td>
                <td colspan="2">5 (12)</td>
                <td colspan="2">N/A</td>
                <td colspan="2">N/A</td>
                <td colspan="2">5 (6)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Bipolar disorder (manic)</td>
                <td colspan="2">N/A</td>
                <td colspan="2">16 (76)</td>
                <td colspan="2">N/A</td>
                <td colspan="2">16 (18)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Bipolar disorder (depressed)</td>
                <td colspan="2">N/A</td>
                <td colspan="2">3 (14)</td>
                <td colspan="2">N/A</td>
                <td colspan="2">3 (3)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Bipolar disorder (mixed)</td>
                <td colspan="2">N/A</td>
                <td colspan="2">2 (10)</td>
                <td colspan="2">N/A</td>
                <td colspan="2">2 (2)</td>
              </tr>
              <tr valign="top">
                <td colspan="3">
                  <bold>Interviews, n</bold>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Baseline</td>
                <td colspan="2">41</td>
                <td colspan="2">21</td>
                <td colspan="2">27</td>
                <td colspan="2">89</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Follow-up</td>
                <td colspan="2">33</td>
                <td colspan="2">17</td>
                <td colspan="2">7</td>
                <td colspan="2">57</td>
              </tr>
              <tr valign="top">
                <td colspan="3">Interview length (in minutes), mean (SD)</td>
                <td colspan="2">29.5 (13.1)</td>
                <td colspan="2">29.5 (9.3)</td>
                <td colspan="2">20.7 (6.1)</td>
                <td>27 (11)</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table1fn1">
              <p><sup>a</sup>N/A: not applicable.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <table-wrap position="float" id="table2">
          <label>Table 2</label>
          <caption>
            <p>Symptom rating scale scores for diagnostic and sex groups.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="170"/>
            <col width="0"/>
            <col width="200"/>
            <col width="0"/>
            <col width="200"/>
            <col width="0"/>
            <col width="200"/>
            <col width="0"/>
            <col width="200"/>
            <thead>
              <tr valign="top">
                <td colspan="3">Group</td>
                <td colspan="2">Brief Psychiatric Rating Scale score<sup>a</sup>, mean (SD)</td>
                <td colspan="2">Scale for the Assessment of Negative Symptoms score<sup>b</sup>, mean (SD)</td>
                <td colspan="2">Young Mania Rating Scale score<sup>c</sup>, mean (SD)</td>
                <td>Hamilton Depression Rating Scale score<sup>d</sup>, mean (SD)</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="3">
                  <bold>Schizophrenia spectrum disorders</bold>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>All</td>
                <td colspan="2">26.5 (6.8)</td>
                <td colspan="2">22.6 (12.3)</td>
                <td colspan="2">3.9 (3.6)</td>
                <td colspan="2">8.7 (6.3)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Men</td>
                <td colspan="2">28.1 (7.0)</td>
                <td colspan="2">25.5 (11.2)</td>
                <td colspan="2">4.6 (3.8)</td>
                <td colspan="2">9.8 (6.7)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Women</td>
                <td colspan="2">22.8 (4.4)</td>
                <td colspan="2">15.8 (12.1)</td>
                <td colspan="2">2.3 (2.1)</td>
                <td colspan="2">6.0 (4.1)</td>
              </tr>
              <tr valign="top">
                <td colspan="3">
                  <bold>Bipolar disorder</bold>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>All</td>
                <td colspan="2">26.8 (8.3)</td>
                <td colspan="2">14.0 (9.2)</td>
                <td colspan="2">7.5 (8.5)</td>
                <td colspan="2">9.4 (7.9)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Men</td>
                <td colspan="2">25.9 (5.7)</td>
                <td colspan="2">10.5 (8.8)</td>
                <td colspan="2">8.9 (9.1)</td>
                <td colspan="2">9.8 (10.3)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Women</td>
                <td colspan="2">27.3 (9.5)</td>
                <td colspan="2">16.2 (8.7)</td>
                <td colspan="2">6.7 (8.1)</td>
                <td colspan="2">9.2 (5.9)</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table2fn1">
              <p><sup>a</sup>The total score can range from 18-126.</p>
            </fn>
            <fn id="table2fn2">
              <p><sup>b</sup>The total score can range from 0-110.</p>
            </fn>
            <fn id="table2fn3">
              <p><sup>c</sup>The total score can range from 0-60.</p>
            </fn>
            <fn id="table2fn4">
              <p><sup>d</sup>The total score can range from 0-76.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
      <sec>
        <title>Differential Diagnosis</title>
        <p>Differential diagnosis classification performed well (5-fold AUROC 0.73) when aggregating features from both face and voice (<xref ref-type="table" rid="table3">Table 3</xref>). Facial action units, such as AU17 (<xref rid="figure1" ref-type="fig">Figure 1</xref>A), provided the strongest signal in discrimination between men with schizophrenia spectrum disorders and men with bipolar disorder. Men with schizophrenia spectrum disorders activated their chin-raising muscle (AU17: 5-fold AUROC 0.74) and lip corner–pulling muscle (AU12: 5-fold AUROC 0.61) more frequently than men with bipolar disorder, while demonstrating reduced activation of their cheek-raising muscle (AU6: 5-fold AUROC 0.64). In contrast, voice features, such as mean energy in the frequency band 1-4 kHz (<xref rid="figure1" ref-type="fig">Figure 1</xref>B), performed best for women. Women with schizophrenia spectrum disorders demonstrated reduced energy in the frequency band 1-4 kHz (5-fold AUROC 0.80), reduced spectral harmonicity (5-fold AUROC 0.78), and increased spectral slope (5-fold AUROC 0.77) compared with women with bipolar disorder. When comparing participants with schizophrenia spectrum disorders to healthy volunteers and bipolar disorder to healthy volunteers, we achieved a 5-fold AUROC of 0.78 for both classification tasks.</p>
        <p>We identified some features that discriminated well between schizophrenia spectrum disorders and bipolar disorder across both sexes: lip-corner pulling (AU12), which represented the movement of lip corners pulled diagonally by the zygomaticus major muscle (5-fold AUROC men: 0.61; women: 0.62) for which the mean value was higher on average for participants with schizophrenia spectrum disorders than for participants with bipolar disorder (<xref rid="figure2" ref-type="fig">Figure 2</xref>). The timing of this feature was observed to be important to classification performance—AU12 values were higher on average at the beginning of the interview and decreased over time.</p>
        <table-wrap position="float" id="table3">
          <label>Table 3</label>
          <caption>
            <p>Diagnostic classification.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="170"/>
            <col width="170"/>
            <col width="170"/>
            <col width="170"/>
            <col width="170"/>
            <col width="150"/>
            <thead>
              <tr valign="top">
                <td>Features</td>
                <td>AUROC<sup>a</sup></td>
                <td>Accuracy</td>
                <td>Accuracy chance</td>
                <td colspan="2">F score</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Schizophrenia spectrum disorders</td>
                <td>Bipolar disorder</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Voice</td>
                <td>0.65</td>
                <td>0.71</td>
                <td>0.55</td>
                <td>0.80</td>
                <td>0.46</td>
              </tr>
              <tr valign="top">
                <td>Face</td>
                <td>0.68</td>
                <td>0.72</td>
                <td>N/A<sup>b</sup></td>
                <td>0.80</td>
                <td>0.56</td>
              </tr>
              <tr valign="top">
                <td>Face and voice</td>
                <td>0.73</td>
                <td>0.72</td>
                <td>N/A</td>
                <td>0.80</td>
                <td>0.56</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table3fn1">
              <p><sup>a</sup>AUROC: area under the receiver operating characteristic curve.</p>
            </fn>
            <fn id="table3fn2">
              <p><sup>b</sup>N/A: not applicable.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <fig id="figure1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>Sex-specific features that discriminate between schizophrenia spectrum disorders and bipolar disorder: (A) mean activation of AU17 (chin raising while speaking), and (B) mean value of the energy in the frequency band 1-4 kHz. BD: bipolar disorder; SSD: schizophrenia spectrum disorders.</p>
          </caption>
          <graphic xlink:href="mental_v9i1e24699_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <fig id="figure2" position="float">
          <label>Figure 2</label>
          <caption>
            <p>AU12 (lip-corner pulling while speaking) feature. For each signal, the 25th percentile, median, and 75th percentile values are shown for each 1.5-minute window. Bipolar disorder is represented in blue, schizophrenia spectrum disorders are represented in yellow, and on the adjacent plot, healthy volunteers are represented in black. BD: bipolar disorder; SSD: schizophrenia spectrum disorders.</p>
          </caption>
          <graphic xlink:href="mental_v9i1e24699_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Symptom Classification</title>
        <p>Best performing models were derived from the SANS scale, predominantly from the affective flattening and blunting subgroup (global affective flattening, vocal inflection, paucity of expression, unchanging facial expression), avolition/apathy subgroup (physical anergia, role function level, global avolition), and asociality/anhedonia subgroup (sexual interest, asociality, intimacy). Two items passed the performance threshold from the BPRS (blunted affect and motor retardation), and 2 others were derived from the HAMD scale (work and interests and worthlessness). No signs or symptoms from the YMRS passed the performance threshold criteria.</p>
        <p>Voice outperformed facial action units for blunted affect (5-fold AUROC 0.81), whereas facial action units outperformed voice for unchanging facial expression (5-fold AUROC 0.64) (<xref ref-type="table" rid="table4">Table 4</xref>). Synergy between both modalities was observed for paucity of expression (5-fold AUROC 0.81).</p>
        <p>Voice alone outperformed facial action units for several items including asociality (5-fold AUROC 0.63) and work and interests (5-fold AUROC 0.64) (<xref ref-type="table" rid="table5">Table 5</xref>). Facial action units alone outperformed voice for worthlessness (5-fold AUROC 0.61). Synergy between both modalities was observed for several other symptoms including avolition (5-fold AUROC 0.72) and anergia (5-fold AUROC 0.68). Importantly, given that these symptoms represent self-reported experiences, their relationship with measured physiological signals is likely indirect and one hypothesis is that they are linked to observable symptoms. For example, we found a correlation (<italic>r</italic>=0.35; <italic>P</italic>&#60;.001) between work and interests and blunted affect, and a correlation (<italic>r</italic>=0.31; <italic>P</italic>&#60;.001) between avolition and affective flattening.</p>
        <p>Among the top acoustic features (<xref rid="figure3" ref-type="fig">Figure 3</xref>) for objectively observed symptoms (<xref ref-type="table" rid="table4">Table 4</xref>), the mean value of the energy in the frequency band 1-4 kHz was most indicative of paucity of expression (<italic>r</italic>= –0.27, <italic>P</italic>=.004). Specifically, a reduction in the average amount of energy in high frequencies was associated with the presence of this symptom. In addition to affecting voice quality or timbre (in the form of vocal overtones), high frequencies (1-4 kHz) are typical in shaping consonants through rapid air motion from the mouth and through the teeth. In contrast, vowels are generally in the lower frequencies (500 Hz) and contain the majority of the voice energy. Clinically, mismatch between the acoustic frequencies of vowels and consonants jeopardizes the natural sound of the voice and leads to a reduction in speech intelligibility. This observation is stable across sex.</p>
        <p>Among the top facial action unit features (<xref rid="figure4" ref-type="fig">Figure 4</xref>) for the objectively observed symptoms, the standard deviation of cheek raising muscle activation, often activated to form a smile, was most indicative of blunted affect for both men and women (<italic>r</italic>= –0.26, <italic>P</italic>=.002 during speaking). When the symptom is present, the standard deviation of this feature is decreased.</p>
        <p>Among the top features for self-reported symptoms (<xref ref-type="table" rid="table5">Table 5</xref>), the mean value of AU45 (blinking) during speaking is higher when the symptom feature worthlessness is present (<italic>r</italic>=0.30, <italic>P</italic>=.001, calculated over all participants) (<xref rid="figure5" ref-type="fig">Figure 5</xref>).</p>
        <table-wrap position="float" id="table4">
          <label>Table 4</label>
          <caption>
            <p>Objectively observed item classification.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="210"/>
            <col width="0"/>
            <col width="160"/>
            <col width="0"/>
            <col width="160"/>
            <col width="0"/>
            <col width="160"/>
            <col width="0"/>
            <col width="140"/>
            <col width="0"/>
            <col width="140"/>
            <thead>
              <tr valign="top">
                <td colspan="3">Symptom</td>
                <td colspan="2">Modality</td>
                <td colspan="2">AUROC<sup>a</sup></td>
                <td colspan="2">Accuracy (random)</td>
                <td colspan="3">F score</td>
              </tr>
              <tr valign="top">
                <td colspan="3">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">Above clinical threshold</td>
                <td>Below clinical threshold</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="3">
                  <bold>Brief Psychiatric Rating Scale</bold>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Blunted affect</td>
                <td colspan="2">Voice</td>
                <td colspan="2">0.81</td>
                <td colspan="2">0.95 (0.87)</td>
                <td colspan="2">0.40</td>
                <td colspan="2">0.97</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Motor retardation</td>
                <td colspan="2">Face</td>
                <td colspan="2">0.68</td>
                <td colspan="2">0.94 (0.88)</td>
                <td colspan="2">0.36</td>
                <td colspan="2">0.97</td>
              </tr>
              <tr valign="top">
                <td colspan="3">
                  <bold>Scale for the Assessment of Negative Symptoms</bold>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Paucity of expression</td>
                <td colspan="2">Voice, face</td>
                <td colspan="2">0.81</td>
                <td colspan="2">0.80 (0.66)</td>
                <td colspan="2">0.42</td>
                <td colspan="2">0.88</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Global affective flattening</td>
                <td colspan="2">Voice, face</td>
                <td colspan="2">0.79</td>
                <td colspan="2">0.82 (0.71)</td>
                <td colspan="2">0.44</td>
                <td colspan="2">0.89</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Lack of vocal inflection</td>
                <td colspan="2">Voice, face</td>
                <td colspan="2">0.71</td>
                <td colspan="2">0.88 (0.78)</td>
                <td colspan="2">0.43</td>
                <td colspan="2">0.94</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Unchanging facial expression</td>
                <td colspan="2">Face</td>
                <td colspan="2">0.64</td>
                <td colspan="2">0.83 (0.70)</td>
                <td colspan="2">0.39</td>
                <td colspan="2">0.90</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table4fn1">
              <p><sup>a</sup>AUROC: area under the receiver operating characteristic curve.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <table-wrap position="float" id="table5">
          <label>Table 5</label>
          <caption>
            <p>Self-reported items classification.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="210"/>
            <col width="160"/>
            <col width="160"/>
            <col width="160"/>
            <col width="140"/>
            <col width="140"/>
            <thead>
              <tr valign="top">
                <td colspan="2">Symptom</td>
                <td>Modality</td>
                <td>AUROC<sup>a</sup></td>
                <td>Accuracy (random)</td>
                <td colspan="2">F score</td>
              </tr>
              <tr valign="top">
                <td colspan="2">
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Above clinical threshold</td>
                <td>Below clinical threshold</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="2">
                  <bold>Scale for the Assessment of Negative Symptoms</bold>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Global avolition</td>
                <td>Voice, face</td>
                <td>0.72</td>
                <td>0.66 (0.53)</td>
                <td>0.75</td>
                <td>0.49</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Physical anergia</td>
                <td>Voice, face</td>
                <td>0.68</td>
                <td>0.63 (0.51)</td>
                <td>0.70</td>
                <td>0.53</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Role function level</td>
                <td>Voice, face</td>
                <td>0.65</td>
                <td>0.63 (0.58)</td>
                <td>0.75</td>
                <td>0.31</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Sexual interest</td>
                <td>Voice, face</td>
                <td>0.64</td>
                <td>0.62 (0.52)</td>
                <td>0.46</td>
                <td>0.70</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Intimacy</td>
                <td>Voice</td>
                <td>0.64</td>
                <td>0.63 (0.51)</td>
                <td>0.56</td>
                <td>0.67</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Asociality</td>
                <td>Voice</td>
                <td>0.63</td>
                <td>0.60 (0.51)</td>
                <td>0.54</td>
                <td>0.65</td>
              </tr>
              <tr valign="top">
                <td colspan="2">
                  <bold>Hamilton Depression Rating Scale</bold>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Work and interests</td>
                <td>Voice</td>
                <td>0.62</td>
                <td>0.65 (0.52)</td>
                <td>0.73</td>
                <td>0.52</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Worthlessness</td>
                <td>Face</td>
                <td>0.61</td>
                <td>0.88 (0.82)</td>
                <td>0.32</td>
                <td>0.94</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table5fn1">
              <p><sup>a</sup>AUROC: area under the receiver operating characteristic curve.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <fig id="figure3" position="float">
          <label>Figure 3</label>
          <caption>
            <p>Paucity of expression score as a function of the mean value of the energy in the high frequency band 1-4 kHz (log-scale) for healthy volunteers (blue), patient participants with symptom rating scale scores below symptom threshold (orange), and patient participants with symptom rating scale scores above symptom threshold (green). A lower value of this feature is indicative of a more severe symptom across sex. The black line indicates the median value of the feature.</p>
          </caption>
          <graphic xlink:href="mental_v9i1e24699_fig3.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <fig id="figure4" position="float">
          <label>Figure 4</label>
          <caption>
            <p>Blunted affect score as a function of the standard deviation of cheek raising (AU06) for healthy volunteers (blue), patient participants with symptom rating scale scores below symptom threshold (orange), and patient participants with symptom rating scale scores above symptom threshold (green). A lower value of this feature is indicative of a more severe symptom across sex. The black line indicates the median value of the feature.</p>
          </caption>
          <graphic xlink:href="mental_v9i1e24699_fig4.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <fig id="figure5" position="float">
          <label>Figure 5</label>
          <caption>
            <p>Worthlessness score as a function of the mean value of blinking (AU45) for healthy volunteers (blue), patient participants with symptom rating scale scores below symptom threshold (orange), and patient participants with symptom rating scale scores above symptom threshold (green). A higher value of this feature is indicative of a more severe symptom across sex. The black line indicates the median value of the feature.</p>
          </caption>
          <graphic xlink:href="mental_v9i1e24699_fig5.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <p>We aimed to explore the feasibility of utilizing audiovisual data extracted from participant interviews for psychiatric diagnoses and to predict the presence of psychiatric signs and symptoms. Our results indicate that computational algorithms developed from vocal acoustics and facial action units can successfully differentiate between participants with either schizophrenia spectrum disorders or bipolar disorder, as well as identify the presence of several psychiatric signs and symptoms with high degrees of accuracy. Both acoustic and facial action unit features could be independently used to differentiate between participants with schizophrenia spectrum disorders and bipolar disorder in our data set, and integrating the two modalities produced the strongest signal, as previously seen in studies of depression [<xref ref-type="bibr" rid="ref64">64</xref>-<xref ref-type="bibr" rid="ref66">66</xref>], suggesting a synergistic interaction. Importantly, different top features were identified for men and women. Specifically, the strongest signals separating men with schizophrenia spectrum disorders from men with bipolar disorder were derived from facial features, while the strongest signals for women were derived from acoustic features. These physiological differences may be partially explained by different distributions of psychiatric signs and symptoms among the diagnostic categories. For example, men with schizophrenia spectrum disorders rated higher on average on the BPRS and SANS than men with bipolar disorder, while women with schizophrenia spectrum disorders on average scored lower than women with bipolar disorder on all rating scales. 
Alternatively, notable sex-specific variations in the prevalence, onset, symptom profiles, and outcome have been identified in the literature and have been attributed to differences in premorbid functioning, psychosocial response to symptoms, and differing levels of circulating hormones and receptors [<xref ref-type="bibr" rid="ref67">67</xref>-<xref ref-type="bibr" rid="ref70">70</xref>]. Audiovisual data may therefore detect subtle physiological differences unique to each sex and present in the expression of psychiatric disorders. In either scenario, sex differences are clearly of utmost importance when performing voice and facial analyses and must be taken into consideration when conducting future research.</p>
      <p>We also identified audiovisual features common to both sexes that successfully differentiated between diagnostic categories. In line with prior work demonstrating altered facial expressivity in individuals with psychiatric disorders [<xref ref-type="bibr" rid="ref47">47</xref>-<xref ref-type="bibr" rid="ref51">51</xref>,<xref ref-type="bibr" rid="ref54">54</xref>,<xref ref-type="bibr" rid="ref71">71</xref>,<xref ref-type="bibr" rid="ref72">72</xref>], we found that participants with schizophrenia spectrum disorders were much more likely to activate the facial muscle responsible for pulling the corners of their lips than participants with bipolar disorder. While this muscle is activated for several reasons, including the formation of certain words while speaking, it is also commonly used to form a smile. Interestingly, many patients with schizophrenia spectrum disorders, including the participants in our sample, experienced facial blunting and diminished facial expressivity, and one would, therefore, expect reduced facial activity compared to that of participants with bipolar disorder. While this finding may initially appear counterintuitive, it is important to note that the presence of blunted affect was associated with reduced variation in the cheek-raising muscle, which is also activated during the formation of a smile. Participants with schizophrenia spectrum disorders, therefore, activate lip corner–pulling muscles more than participants with bipolar disorder (perhaps to form a smile), though the range of activation of cheek movement was reduced if blunting was present. These findings warrant additional research particularly to understand the clinical significance of increased activation of certain facial muscles alongside decreased variability throughout the interview and its relationship to a diagnosis of schizophrenia spectrum disorders.</p>
      <p>Some top features contributing to the diagnostic classification remained stable throughout the course of the interview, while others changed depending on the temporal pattern. For example, AU12 (lip-corner pulling) demonstrated a consistent downward trend for all participants, whereas the energy of the voice signal in the frequency band 1-4 kHz remained mostly flat. These same trends were noted in healthy volunteers as well, suggesting that the identified differences in facial activity and voice represent subtle pathological variations in the frequency or intensity of otherwise healthy activity. The amount of high frequency energy in the voice, for example, may represent a subtle state marker of psychiatric illness or perhaps a physiological response to certain medications, impacting speech intelligibility. Additionally, activating lip corner–pulling muscles more at the start of an assessment (perhaps to produce a smile) may represent a healthy behavior (as it was seen in the healthy volunteer population as well), though the frequency and degree of activation is what separates those with schizophrenia spectrum disorders from those with bipolar disorder.</p>
      <p>Our findings suggest that a tool capable of extracting and analyzing audiovisual data from newly identified psychiatric patients might offer valuable collateral clinical information, supporting a more reliable approach to differential diagnoses. Accurately diagnosing someone as having either schizophrenia spectrum disorders or bipolar disorder is a critical first step in selecting appropriate medications and therapeutic interventions, and a task that is often challenging to behavioral health clinicians given significant symptom overlap [<xref ref-type="bibr" rid="ref52">52</xref>,<xref ref-type="bibr" rid="ref53">53</xref>], especially during the early course of illness development. Leveraging audiovisual signals holds promise to overcome many of the challenges associated with current assessment methods [<xref ref-type="bibr" rid="ref73">73</xref>-<xref ref-type="bibr" rid="ref76">76</xref>], including inaccuracies and biases in self-report and recall, as well as substantial time constraints that limit the ability to effectively obtain necessary clinical information. Diagnoses, however, are complex entities, based on multiple psychiatric symptoms, each likely corresponding to several unique audiovisual features that will need to be integrated to achieve an accurate and reliable measure. Furthermore, each symptom may correspond to various alterations in audiovisual characteristics depending on multiple factors including the frequency and intensity of the experience, as well as the individual experiencing them. Future research will therefore require large clinical and computerized collaborative efforts to characterize psychiatric symptoms and diagnoses in an accurate and objective manner.</p>
      <p>Several psychiatric signs and symptom inferences were accurately made using features extracted from voice and face either individually or combined. Similar to the findings of prior studies [<xref ref-type="bibr" rid="ref36">36</xref>,<xref ref-type="bibr" rid="ref45">45</xref>,<xref ref-type="bibr" rid="ref71">71</xref>], the most successful models were derived from the SANS, and greater accuracy was achieved with externally observable psychiatric signs and symptoms such as blunted affect and lack of vocal inflection. Integrating audiovisual data into symptom assessment might, therefore, offer more efficient and objective methods to identify and track changes in negative symptoms, beyond what can be achieved through traditional clinical observation alone. A more challenging task will be to provide greater objectivity to the assessment of symptoms such as hallucinations, delusions, and suicidal thoughts. In contrast to the findings of prior research, we did not find an association between brow movements and delusions or depression [<xref ref-type="bibr" rid="ref54">54</xref>,<xref ref-type="bibr" rid="ref72">72</xref>]. One possibility is that the prevalence of negative symptoms (such as blunted affect and affective flattening) in our sample masked the expression (and, therefore, detection) of subtle physiological signals associated with these symptoms. Our findings do, however, suggest that audiovisual data can be representative of subjectively experienced symptoms, including worthlessness and avolition, though further research is required to uncover their complex correlational structure. For instance, the observed associations between audiovisual features and psychiatric symptoms may be justly considered as purely epiphenomenal, yet a mechanistic understanding of how the symptom is expressed in the feature is not obvious and may provide insights into the diagnostic conditions. 
When the severity of one symptom changes, it may affect the distribution of the other symptoms in a deterministic way. Consequently, it is possible to find correlations between symptoms and physiological data even if they are not causally linked. Those correlations, if confirmed in larger studies, would be very valuable as they offer indirect proxies to more subjective experiences that are not directly quantifiable. Further research is required to determine the clinical significance of physiological changes in voice and face, as well as how they might correspond to a particular psychiatric symptom to effectively incorporate audiovisual data into clinical care. A critical, though challenging, task for future research would be to maximize the level of isolated psychiatric symptoms while containing other symptoms to avoid confounding the signals that we aim to capture. Accordingly, comparing participants to themselves longitudinally as symptoms fluctuate over the course of various pathological states would also help reduce potential confounds in the signals. Future research should consider how physiological differences in facial expression and voice may manifest in other clinical settings and structured tasks as well, such as emotion elicitation [<xref ref-type="bibr" rid="ref77">77</xref>]. Lastly, follow-up studies should consider exploring participant response times, and other measures of interviewer–interviewee interaction by recording and analyzing the voice and facial expressions of the interviewer as well.</p>
      <p>There are several noteworthy limitations to our study. First, while prior analyses using machine learning on audio and visual features have enrolled comparable sample sizes [<xref ref-type="bibr" rid="ref19">19</xref>,<xref ref-type="bibr" rid="ref25">25</xref>,<xref ref-type="bibr" rid="ref48">48</xref>], a power analysis was not conducted given the exploratory nature of this project, and additional research with more participants is necessary to support generalizability. Second, many patients included in the project were clinically stable, experiencing mild to moderate symptoms and minimal symptom fluctuations throughout the trial, which limited our ability to assess audiovisual patterns as a function of symptom severity. It is also possible that predominant negative symptoms in our sample, such as facial blunting and lack of vocal inflection, limited our ability to detect a greater number of signs and symptoms from the BPRS, HAMD, and YMRS. Third, the effects of various medications on physiological changes in voice and facial movements in our sample remain unclear and were not taken into consideration. Further research will be needed to determine the impact of the class and dose of prescribed medications on audiovisual patterns, as well as their potential impact on behavior over the course of the interview. Furthermore, demographic variables differed among the 3 groups. Although sex differences were accounted for in our models, the potential impact of physiological differences stemming from age, race, and ethnicity (though much less likely [<xref ref-type="bibr" rid="ref61">61</xref>,<xref ref-type="bibr" rid="ref78">78</xref>]) warrants further exploration. Fourth, the interviewer was not blinded to diagnostic groups, which may have biased the ratings. However, the interviewer was highly trained to utilize rating scales and achieved high interrater reliability prior to study initiation. 
Fifth, diagnoses were clinically ascertained and extracted from the medical records. Future research should consider implementing more reliable and structured methods for diagnostic assessment, such as a structured clinical interview [<xref ref-type="bibr" rid="ref79">79</xref>], to ensure the most accurate diagnoses. Sixth, many top features contribute to each of the best performing models, both independently and combined. Given the very large number of relevant features, we chose to emphasize and illustrate a select few in the manuscript. Corresponding clinical interpretations may, therefore, be dependent on the features highlighted and additional research will be necessary to confirm findings before clinical conclusions can be drawn. Finally, we chose to focus our analysis on acoustic components of speech rather than content as they are less dependent on cultural, socioeconomic, and educational backgrounds. Our group is, however, engaged in ongoing research aimed at the integration of speech content in the analytics framework, which we anticipate will improve our ability to detect additional psychiatric signs and symptoms.</p>
      <p>Audiovisual data hold promise for gathering objective, scalable, noninvasive, and easily accessed indicators of psychiatric illness. Much like an x-ray or blood test is routinely used as adjunctive data to inform clinical care, integrating audiovisual data could change the way mental health clinicians diagnose and monitor patients, enabling faster, more accurate identification of illness and enhancing a personalized approach to medicine. This would be a significant step forward for psychiatry, which is limited by its reliance on largely retrospective, self-reported data.</p>
    </sec>
  </body>
  <back>
    <app-group>
      <supplementary-material id="app1">
        <label>Multimedia Appendix 1</label>
        <p>Voice features.</p>
        <media xlink:href="mental_v9i1e24699_app1.docx" xlink:title="DOCX File , 15 KB"/>
      </supplementary-material>
      <supplementary-material id="app2">
        <label>Multimedia Appendix 2</label>
        <p>Facial action units.</p>
        <media xlink:href="mental_v9i1e24699_app2.docx" xlink:title="DOCX File , 13 KB"/>
      </supplementary-material>
    </app-group>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">AUROC</term>
          <def>
            <p>area under the receiver operating characteristic curve</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">BPRS</term>
          <def>
            <p>Brief Psychiatric Rating Scale</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">HAMD</term>
          <def>
            <p>Hamilton Depression Rating Scale</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">SANS</term>
          <def>
            <p>Scale for the Assessment of Negative Symptoms</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">YMRS</term>
          <def>
            <p>Young Mania Rating Scale</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>The authors are thankful to the volunteer participants, without whose active involvement the present study would not have been possible. We would also like to thank Rachel Ostrand, PhD, who contributed to the development of the speech prompts utilized and helped set up the audiovisual data equipment.</p>
    </ack>
    <fn-group>
      <fn fn-type="con">
        <p>GC, SH, MB, and JK conceptualized and executed the project. AA designed and performed data analysis with input from GC, and MB, AA, SH, and CA performed data preprocessing. AFA and EA performed participant recruitment and data collection. AA and MB wrote the manuscript, and all authors reviewed and edited.</p>
      </fn>
      <fn fn-type="conflict">
        <p>AA, GC, and CA disclose that their employer, IBM Research, is the research branch of IBM Corporation.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Auerbach</surname>
              <given-names>RP</given-names>
            </name>
            <name name-style="western">
              <surname>Mortier</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Bruffaerts</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Alonso</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Benjet</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Cuijpers</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Demyttenaere</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Ebert</surname>
              <given-names>DD</given-names>
            </name>
            <name name-style="western">
              <surname>Green</surname>
              <given-names>JG</given-names>
            </name>
            <name name-style="western">
              <surname>Hasking</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Murray</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Nock</surname>
              <given-names>MK</given-names>
            </name>
            <name name-style="western">
              <surname>Pinder-Amaker</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Sampson</surname>
              <given-names>NA</given-names>
            </name>
            <name name-style="western">
              <surname>Stein</surname>
              <given-names>DJ</given-names>
            </name>
            <name name-style="western">
              <surname>Vilagut</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Zaslavsky</surname>
              <given-names>AM</given-names>
            </name>
            <name name-style="western">
              <surname>Kessler</surname>
              <given-names>RC</given-names>
            </name>
            <collab>WHO WMH-ICS Collaborators</collab>
          </person-group>
          <article-title>WHO world mental health surveys international college student project: prevalence and distribution of mental disorders</article-title>
          <source>J Abnorm Psychol</source>
          <year>2018</year>
          <month>10</month>
          <volume>127</volume>
          <issue>7</issue>
          <fpage>623</fpage>
          <lpage>638</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/30211576"/>
          </comment>
          <pub-id pub-id-type="doi">10.1037/abn0000362</pub-id>
          <pub-id pub-id-type="medline">30211576</pub-id>
          <pub-id pub-id-type="pii">2018-44951-001</pub-id>
          <pub-id pub-id-type="pmcid">PMC6193834</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Steel</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Marnane</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Iranpour</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Chey</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Jackson</surname>
              <given-names>JW</given-names>
            </name>
            <name name-style="western">
              <surname>Patel</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Silove</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>The global prevalence of common mental disorders: a systematic review and meta-analysis 1980-2013</article-title>
          <source>Int J Epidemiol</source>
          <year>2014</year>
          <month>04</month>
          <volume>43</volume>
          <issue>2</issue>
          <fpage>476</fpage>
          <lpage>93</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://ije.oxfordjournals.org/cgi/pmidlookup?view=long&#38;pmid=24648481"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/ije/dyu038</pub-id>
          <pub-id pub-id-type="medline">24648481</pub-id>
          <pub-id pub-id-type="pii">dyu038</pub-id>
          <pub-id pub-id-type="pmcid">PMC3997379</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Jones</surname>
              <given-names>PB</given-names>
            </name>
          </person-group>
          <article-title>Adult mental health disorders and their age at onset</article-title>
          <source>Br J Psychiatry Suppl</source>
          <year>2013</year>
          <month>01</month>
          <volume>54</volume>
          <fpage>s5</fpage>
          <lpage>10</lpage>
          <pub-id pub-id-type="doi">10.1192/bjp.bp.112.119164</pub-id>
          <pub-id pub-id-type="medline">23288502</pub-id>
          <pub-id pub-id-type="pii">202/s54/s5</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>O'Connor</surname>
              <given-names>Karen</given-names>
            </name>
            <name name-style="western">
              <surname>Muller Neff</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Pitman</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Burnout in mental health professionals: a systematic review and meta-analysis of prevalence and determinants</article-title>
          <source>Eur Psychiatry</source>
          <year>2018</year>
          <month>09</month>
          <day>26</day>
          <volume>53</volume>
          <fpage>74</fpage>
          <lpage>99</lpage>
          <pub-id pub-id-type="doi">10.1016/j.eurpsy.2018.06.003</pub-id>
          <pub-id pub-id-type="medline">29957371</pub-id>
          <pub-id pub-id-type="pii">S0924-9338(18)30127-5</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rotstein</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Hudaib</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Facey</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Kulkarni</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Psychiatrist burnout: a meta-analysis of Maslach burnout inventory means</article-title>
          <source>Australas Psychiatry</source>
          <year>2019</year>
          <month>06</month>
          <day>25</day>
          <volume>27</volume>
          <issue>3</issue>
          <fpage>249</fpage>
          <lpage>254</lpage>
          <pub-id pub-id-type="doi">10.1177/1039856219833800</pub-id>
          <pub-id pub-id-type="medline">30907115</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chan</surname>
              <given-names>MK</given-names>
            </name>
            <name name-style="western">
              <surname>Chew</surname>
              <given-names>QH</given-names>
            </name>
            <name name-style="western">
              <surname>Sim</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Burnout and associated factors in psychiatry residents: a systematic review</article-title>
          <source>Int J Med Educ</source>
          <year>2019</year>
          <month>07</month>
          <day>30</day>
          <volume>10</volume>
          <fpage>149</fpage>
          <lpage>160</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.ijme.net/pmid/31381505"/>
          </comment>
          <pub-id pub-id-type="doi">10.5116/ijme.5d21.b621</pub-id>
          <pub-id pub-id-type="medline">31381505</pub-id>
          <pub-id pub-id-type="pii">ijme.10.149160</pub-id>
          <pub-id pub-id-type="pmcid">PMC6766386</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <collab>American Psychiatric Association</collab>
          </person-group>
          <source>Diagnostic and Statistical Manual of Mental Disorders (5th ed)</source>
          <year>2013</year>
          <publisher-loc>Arlington, VA</publisher-loc>
          <publisher-name>American Psychiatric Association</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gaebel</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Zielasek</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Reed</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Mental and behavioural disorders in the ICD-11: concepts, methodologies, and current status</article-title>
          <source>Psychiatr Pol</source>
          <year>2017</year>
          <month>04</month>
          <day>30</day>
          <volume>51</volume>
          <issue>2</issue>
          <fpage>169</fpage>
          <lpage>195</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.12740/PP/69660"/>
          </comment>
          <pub-id pub-id-type="doi">10.12740/PP/69660</pub-id>
          <pub-id pub-id-type="medline">28581530</pub-id>
          <pub-id pub-id-type="pii">69660</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Fusar-Poli</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Hijazi</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Stahl</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Steyerberg</surname>
              <given-names>EW</given-names>
            </name>
          </person-group>
          <article-title>The science of prognosis in psychiatry: a review</article-title>
          <source>JAMA Psychiatry</source>
          <year>2018</year>
          <month>12</month>
          <day>01</day>
          <volume>75</volume>
          <issue>12</issue>
          <fpage>1289</fpage>
          <lpage>1297</lpage>
          <pub-id pub-id-type="doi">10.1001/jamapsychiatry.2018.2530</pub-id>
          <pub-id pub-id-type="medline">30347013</pub-id>
          <pub-id pub-id-type="pii">2707244</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Levchenko</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Nurgaliev</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Kanapin</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Samsonova</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Gainetdinov</surname>
              <given-names>RR</given-names>
            </name>
          </person-group>
          <article-title>Current challenges and possible future developments in personalized psychiatry with an emphasis on psychotic disorders</article-title>
          <source>Heliyon</source>
          <year>2020</year>
          <month>05</month>
          <volume>6</volume>
          <issue>5</issue>
          <fpage>e03990</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S2405-8440(20)30835-5"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.heliyon.2020.e03990</pub-id>
          <pub-id pub-id-type="medline">32462093</pub-id>
          <pub-id pub-id-type="pii">S2405-8440(20)30835-5</pub-id>
          <pub-id pub-id-type="pmcid">PMC7240336</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bzdok</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Meyer-Lindenberg</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Machine learning for precision psychiatry: opportunities and challenges</article-title>
          <source>Biol Psychiatry Cogn Neurosci Neuroimaging</source>
          <year>2018</year>
          <month>03</month>
          <volume>3</volume>
          <issue>3</issue>
          <fpage>223</fpage>
          <lpage>230</lpage>
          <pub-id pub-id-type="doi">10.1016/j.bpsc.2017.11.007</pub-id>
          <pub-id pub-id-type="medline">29486863</pub-id>
          <pub-id pub-id-type="pii">S2451-9022(17)30206-9</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Dwyer</surname>
              <given-names>DB</given-names>
            </name>
            <name name-style="western">
              <surname>Falkai</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Koutsouleris</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>Machine learning approaches for clinical psychology and psychiatry</article-title>
          <source>Annu Rev Clin Psychol</source>
          <year>2018</year>
          <month>05</month>
          <day>07</day>
          <volume>14</volume>
          <issue>1</issue>
          <fpage>91</fpage>
          <lpage>118</lpage>
          <pub-id pub-id-type="doi">10.1146/annurev-clinpsy-032816-045037</pub-id>
          <pub-id pub-id-type="medline">29401044</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pampouchidou</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Facial geometry and speech analysis for depression detection</article-title>
          <year>2017</year>
          <conf-name>39th Annual International Conference of the IEEE Engineering in Medicine and Biology Society</conf-name>
          <conf-date>July 11-15</conf-date>
          <conf-loc>Jeju, Korea</conf-loc>
          <pub-id pub-id-type="doi">10.1109/embc.2017.8037103</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Girard</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Cohn</surname>
              <given-names>JF</given-names>
            </name>
          </person-group>
          <article-title>Automated audiovisual depression analysis</article-title>
          <source>Curr Opin Psychol</source>
          <year>2015</year>
          <month>08</month>
          <volume>4</volume>
          <fpage>75</fpage>
          <lpage>79</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/26295056"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.copsyc.2014.12.010</pub-id>
          <pub-id pub-id-type="medline">26295056</pub-id>
          <pub-id pub-id-type="pmcid">PMC4539261</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Dibeklioğlu</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Hammal</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Cohn</surname>
              <given-names>JF</given-names>
            </name>
          </person-group>
          <article-title>Multimodal detection of depression in clinical interviews</article-title>
          <source>Proceedings of the 2015 ACM on International Conference on Multimodal Interaction</source>
          <year>2015</year>
          <conf-name>ACM International Conference on Multimodal Interaction</conf-name>
          <conf-date>November 9-13</conf-date>
          <conf-loc>Seattle, Washington</conf-loc>
          <fpage>307</fpage>
          <lpage>310</lpage>
          <pub-id pub-id-type="doi">10.1145/2818346.2820776</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Renfordt</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Busch</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>[New diagnostic strategies in psychiatry by means of video-technique. The use of time-blind video analysis for the evaluation of antidepressant drug trials (author's transl)]</article-title>
          <source>Pharmakopsychiatr Neuropsychopharmakol</source>
          <year>1976</year>
          <month>03</month>
          <day>20</day>
          <volume>9</volume>
          <issue>2</issue>
          <fpage>67</fpage>
          <lpage>75</lpage>
          <pub-id pub-id-type="doi">10.1055/s-0028-1094480</pub-id>
          <pub-id pub-id-type="medline">790410</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kring</surname>
              <given-names>AM</given-names>
            </name>
            <name name-style="western">
              <surname>Sloan</surname>
              <given-names>DM</given-names>
            </name>
          </person-group>
          <article-title>The facial expression coding system (FACES): development, validation, and utility</article-title>
          <source>Psychol Assess</source>
          <year>2007</year>
          <month>06</month>
          <volume>19</volume>
          <issue>2</issue>
          <fpage>210</fpage>
          <lpage>224</lpage>
          <pub-id pub-id-type="doi">10.1037/1040-3590.19.2.210</pub-id>
          <pub-id pub-id-type="medline">17563202</pub-id>
          <pub-id pub-id-type="pii">2007-07953-005</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Cummins</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Baird</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Schuller</surname>
              <given-names>BW</given-names>
            </name>
          </person-group>
          <article-title>Speech analysis for health: current state-of-the-art and the increasing impact of deep learning</article-title>
          <source>Methods</source>
          <year>2018</year>
          <month>12</month>
          <day>01</day>
          <volume>151</volume>
          <fpage>41</fpage>
          <lpage>54</lpage>
          <pub-id pub-id-type="doi">10.1016/j.ymeth.2018.07.007</pub-id>
          <pub-id pub-id-type="medline">30099083</pub-id>
          <pub-id pub-id-type="pii">S1046-2023(17)30371-7</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Low</surname>
              <given-names>DM</given-names>
            </name>
            <name name-style="western">
              <surname>Bentley</surname>
              <given-names>KH</given-names>
            </name>
            <name name-style="western">
              <surname>Ghosh</surname>
              <given-names>SS</given-names>
            </name>
          </person-group>
          <article-title>Automated assessment of psychiatric disorders using speech: a systematic review</article-title>
          <source>Laryngoscope Investig Otolaryngol</source>
          <year>2020</year>
          <month>01</month>
          <day>31</day>
          <volume>5</volume>
          <issue>1</issue>
          <fpage>96</fpage>
          <lpage>116</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/32128436"/>
          </comment>
          <pub-id pub-id-type="doi">10.1002/lio2.354</pub-id>
          <pub-id pub-id-type="medline">32128436</pub-id>
          <pub-id pub-id-type="pii">LIO2354</pub-id>
          <pub-id pub-id-type="pmcid">PMC7042657</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Scherer</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Stratou</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Mahmoud</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Boberg</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Gratch</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Automatic behavior descriptors for psychological disorder analysis</article-title>
          <year>2013</year>
          <conf-name>10th IEEE International Conference and Workshops on Automatic Face and Gesture Recognition</conf-name>
          <conf-date>April 22-26</conf-date>
          <conf-loc>Shanghai, China</conf-loc>
          <fpage>1</fpage>
          <lpage>8</lpage>
          <pub-id pub-id-type="doi">10.1109/fg.2013.6553789</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Abrami</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Gunzler</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Kilbane</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Ostrand</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Ho</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Cecchi</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Automated computer vision assessment of hypomimia in Parkinson disease: proof-of-principle pilot study</article-title>
          <source>J Med Internet Res</source>
          <year>2021</year>
          <month>02</month>
          <day>22</day>
          <volume>23</volume>
          <issue>2</issue>
          <fpage>e21037</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2021/2/e21037/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/21037</pub-id>
          <pub-id pub-id-type="medline">33616535</pub-id>
          <pub-id pub-id-type="pii">v23i2e21037</pub-id>
          <pub-id pub-id-type="pmcid">PMC7939934</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Fairbairn</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Cohn</surname>
              <given-names>JF</given-names>
            </name>
          </person-group>
          <article-title>Detecting depression severity from vocal prosody</article-title>
          <source>IEEE Trans Affect Comput</source>
          <year>2013</year>
          <volume>4</volume>
          <issue>2</issue>
          <fpage>142</fpage>
          <lpage>150</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/26985326"/>
          </comment>
          <pub-id pub-id-type="doi">10.1109/T-AFFC.2012.38</pub-id>
          <pub-id pub-id-type="medline">26985326</pub-id>
          <pub-id pub-id-type="pmcid">PMC4791067</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Automated verbal and nonverbal speech analysis of interviews of individuals with schizophrenia and depression</article-title>
          <year>2019</year>
          <conf-name>41st Annual International Conference of the IEEE Engineering in Medicine and Biology Society</conf-name>
          <conf-date>July 23-27</conf-date>
          <conf-loc>Berlin, Germany</conf-loc>
          <pub-id pub-id-type="doi">10.1109/embc.2019.8857071</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Minor</surname>
              <given-names>KS</given-names>
            </name>
            <name name-style="western">
              <surname>Bonfils</surname>
              <given-names>KA</given-names>
            </name>
            <name name-style="western">
              <surname>Luther</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Firmin</surname>
              <given-names>RL</given-names>
            </name>
            <name name-style="western">
              <surname>Kukla</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>MacLain</surname>
              <given-names>VR</given-names>
            </name>
            <name name-style="western">
              <surname>Buck</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Lysaker</surname>
              <given-names>PH</given-names>
            </name>
            <name name-style="western">
              <surname>Salyers</surname>
              <given-names>MP</given-names>
            </name>
          </person-group>
          <article-title>Lexical analysis in schizophrenia: how emotion and social word use informs our understanding of clinical presentation</article-title>
          <source>J Psychiatr Res</source>
          <year>2015</year>
          <month>05</month>
          <volume>64</volume>
          <fpage>74</fpage>
          <lpage>78</lpage>
          <pub-id pub-id-type="doi">10.1016/j.jpsychires.2015.02.024</pub-id>
          <pub-id pub-id-type="medline">25777474</pub-id>
          <pub-id pub-id-type="pii">S0022-3956(15)00068-0</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Cohen</surname>
              <given-names>AS</given-names>
            </name>
            <name name-style="western">
              <surname>Elvevåg</surname>
              <given-names>Brita</given-names>
            </name>
          </person-group>
          <article-title>Automated computerized analysis of speech in psychiatric disorders</article-title>
          <source>Curr Opin Psychiatry</source>
          <year>2014</year>
          <month>05</month>
          <volume>27</volume>
          <issue>3</issue>
          <fpage>203</fpage>
          <lpage>209</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/24613984"/>
          </comment>
          <pub-id pub-id-type="doi">10.1097/YCO.0000000000000056</pub-id>
          <pub-id pub-id-type="medline">24613984</pub-id>
          <pub-id pub-id-type="pmcid">PMC4212642</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>de Boer</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Voppel</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Begemann</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Schnack</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Wijnen</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Sommer</surname>
              <given-names>I</given-names>
            </name>
          </person-group>
          <article-title>Clinical use of semantic space models in psychiatry and neurology: a systematic review and meta-analysis</article-title>
          <source>Neurosci Biobehav Rev</source>
          <year>2018</year>
          <month>10</month>
          <volume>93</volume>
          <fpage>85</fpage>
          <lpage>92</lpage>
          <pub-id pub-id-type="doi">10.1016/j.neubiorev.2018.06.008</pub-id>
          <pub-id pub-id-type="medline">29890179</pub-id>
          <pub-id pub-id-type="pii">S0149-7634(18)30187-8</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rapcan</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>D'Arcy</surname>
              <given-names>Shona</given-names>
            </name>
            <name name-style="western">
              <surname>Yeap</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Afzal</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Thakore</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Reilly</surname>
              <given-names>RB</given-names>
            </name>
          </person-group>
          <article-title>Acoustic and temporal analysis of speech: a potential biomarker for schizophrenia</article-title>
          <source>Med Eng Phys</source>
          <year>2010</year>
          <month>11</month>
          <volume>32</volume>
          <issue>9</issue>
          <fpage>1074</fpage>
          <lpage>1079</lpage>
          <pub-id pub-id-type="doi">10.1016/j.medengphy.2010.07.013</pub-id>
          <pub-id pub-id-type="medline">20692864</pub-id>
          <pub-id pub-id-type="pii">S1350-4533(10)00165-7</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Vanello</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>Speech analysis for mood state characterization in bipolar patients</article-title>
          <year>2012</year>
          <conf-name>Annual International Conference of the IEEE Engineering in Medicine and Biology Society</conf-name>
          <conf-date>August 28-September 1</conf-date>
          <conf-loc>San Diego, California</conf-loc>
          <pub-id pub-id-type="doi">10.1109/embc.2012.6346375</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pan</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Gui</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Zhu</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Cui</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Detecting manic state of bipolar disorder based on support vector machine and gaussian mixture model using spontaneous speech</article-title>
          <source>Psychiatry Investig</source>
          <year>2018</year>
          <month>07</month>
          <volume>15</volume>
          <issue>7</issue>
          <fpage>695</fpage>
          <lpage>700</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://psychiatryinvestigation.org/journal/view.php?doi=10.30773/pi.2017.12.15"/>
          </comment>
          <pub-id pub-id-type="doi">10.30773/pi.2017.12.15</pub-id>
          <pub-id pub-id-type="medline">29969852</pub-id>
          <pub-id pub-id-type="pii">pi.2017.12.15</pub-id>
          <pub-id pub-id-type="pmcid">PMC6056700</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Faurholt-Jepsen</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Busk</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Frost</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Vinberg</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Christensen</surname>
              <given-names>EM</given-names>
            </name>
            <name name-style="western">
              <surname>Winther</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Bardram</surname>
              <given-names>JE</given-names>
            </name>
            <name name-style="western">
              <surname>Kessing</surname>
              <given-names>LV</given-names>
            </name>
          </person-group>
          <article-title>Voice analysis as an objective state marker in bipolar disorder</article-title>
          <source>Transl Psychiatry</source>
          <year>2016</year>
          <month>07</month>
          <day>19</day>
          <volume>6</volume>
          <issue>7</issue>
          <fpage>e856</fpage>
          <lpage>e856</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/tp.2016.123"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/tp.2016.123</pub-id>
          <pub-id pub-id-type="medline">27434490</pub-id>
          <pub-id pub-id-type="pii">tp2016123</pub-id>
          <pub-id pub-id-type="pmcid">PMC5545710</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Minor</surname>
              <given-names>KS</given-names>
            </name>
            <name name-style="western">
              <surname>Willits</surname>
              <given-names>JA</given-names>
            </name>
            <name name-style="western">
              <surname>Marggraf</surname>
              <given-names>MP</given-names>
            </name>
            <name name-style="western">
              <surname>Jones</surname>
              <given-names>MN</given-names>
            </name>
            <name name-style="western">
              <surname>Lysaker</surname>
              <given-names>PH</given-names>
            </name>
          </person-group>
          <article-title>Measuring disorganized speech in schizophrenia: automated analysis explains variance in cognitive deficits beyond clinician-rated scales</article-title>
          <source>Psychol Med</source>
          <year>2018</year>
          <month>04</month>
          <day>25</day>
          <volume>49</volume>
          <issue>3</issue>
          <fpage>440</fpage>
          <lpage>448</lpage>
          <pub-id pub-id-type="doi">10.1017/s0033291718001046</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Corcoran</surname>
              <given-names>CM</given-names>
            </name>
            <name name-style="western">
              <surname>Carrillo</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Fernández-Slezak</surname>
              <given-names>Diego</given-names>
            </name>
            <name name-style="western">
              <surname>Bedi</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Klim</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Javitt</surname>
              <given-names>DC</given-names>
            </name>
            <name name-style="western">
              <surname>Bearden</surname>
              <given-names>CE</given-names>
            </name>
            <name name-style="western">
              <surname>Cecchi</surname>
              <given-names>GA</given-names>
            </name>
          </person-group>
          <article-title>Prediction of psychosis across protocols and risk cohorts using automated language analysis</article-title>
          <source>World Psychiatry</source>
          <year>2018</year>
          <month>02</month>
          <day>19</day>
          <volume>17</volume>
          <issue>1</issue>
          <fpage>67</fpage>
          <lpage>75</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1002/wps.20491"/>
          </comment>
          <pub-id pub-id-type="doi">10.1002/wps.20491</pub-id>
          <pub-id pub-id-type="medline">29352548</pub-id>
          <pub-id pub-id-type="pmcid">PMC5775133</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>He</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Cao</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Automated depression analysis using convolutional neural networks from speech</article-title>
          <source>J Biomed Inform</source>
          <year>2018</year>
          <month>07</month>
          <volume>83</volume>
          <fpage>103</fpage>
          <lpage>111</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1532-0464(18)30090-X"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2018.05.007</pub-id>
          <pub-id pub-id-type="medline">29852317</pub-id>
          <pub-id pub-id-type="pii">S1532-0464(18)30090-X</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref34">
        <label>34</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mota</surname>
              <given-names>NB</given-names>
            </name>
            <name name-style="western">
              <surname>Vasconcelos</surname>
              <given-names>NAP</given-names>
            </name>
            <name name-style="western">
              <surname>Lemos</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Pieretti</surname>
              <given-names>AC</given-names>
            </name>
            <name name-style="western">
              <surname>Kinouchi</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Cecchi</surname>
              <given-names>GA</given-names>
            </name>
            <name name-style="western">
              <surname>Copelli</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Ribeiro</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Speech graphs provide a quantitative measure of thought disorder in psychosis</article-title>
          <source>PLoS One</source>
          <year>2012</year>
          <month>04</month>
          <day>9</day>
          <volume>7</volume>
          <issue>4</issue>
          <fpage>e34928</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dx.plos.org/10.1371/journal.pone.0034928"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pone.0034928</pub-id>
          <pub-id pub-id-type="medline">22506057</pub-id>
          <pub-id pub-id-type="pii">PONE-D-11-23505</pub-id>
          <pub-id pub-id-type="pmcid">PMC3322168</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref35">
        <label>35</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Cohen</surname>
              <given-names>AS</given-names>
            </name>
            <name name-style="western">
              <surname>Fedechko</surname>
              <given-names>TL</given-names>
            </name>
            <name name-style="western">
              <surname>Schwartz</surname>
              <given-names>EK</given-names>
            </name>
            <name name-style="western">
              <surname>Le</surname>
              <given-names>TP</given-names>
            </name>
            <name name-style="western">
              <surname>Foltz</surname>
              <given-names>PW</given-names>
            </name>
            <name name-style="western">
              <surname>Bernstein</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Cheng</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Holmlund</surname>
              <given-names>TB</given-names>
            </name>
            <name name-style="western">
              <surname>Elvevåg</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>Ambulatory vocal acoustics, temporal dynamics, and serious mental illness</article-title>
          <source>J Abnorm Psychol</source>
          <year>2019</year>
          <month>03</month>
          <volume>128</volume>
          <issue>2</issue>
          <fpage>97</fpage>
          <lpage>105</lpage>
          <pub-id pub-id-type="doi">10.1037/abn0000397</pub-id>
          <pub-id pub-id-type="medline">30714793</pub-id>
          <pub-id pub-id-type="pii">2019-05392-001</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref36">
        <label>36</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Cohen</surname>
              <given-names>AS</given-names>
            </name>
            <name name-style="western">
              <surname>Cowan</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Le</surname>
              <given-names>TP</given-names>
            </name>
            <name name-style="western">
              <surname>Schwartz</surname>
              <given-names>EK</given-names>
            </name>
            <name name-style="western">
              <surname>Kirkpatrick</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Raugh</surname>
              <given-names>IM</given-names>
            </name>
            <name name-style="western">
              <surname>Chapman</surname>
              <given-names>HC</given-names>
            </name>
            <name name-style="western">
              <surname>Strauss</surname>
              <given-names>GP</given-names>
            </name>
          </person-group>
          <article-title>Ambulatory digital phenotyping of blunted affect and alogia using objective facial and vocal analysis: proof of concept</article-title>
          <source>Schizophr Res</source>
          <year>2020</year>
          <month>06</month>
          <volume>220</volume>
          <fpage>141</fpage>
          <lpage>146</lpage>
          <pub-id pub-id-type="doi">10.1016/j.schres.2020.03.043</pub-id>
          <pub-id pub-id-type="medline">32247747</pub-id>
          <pub-id pub-id-type="pii">S0920-9964(20)30153-5</pub-id>
          <pub-id pub-id-type="pmcid">PMC7306442</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref37">
        <label>37</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kliper</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Vaizman</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Weinshall</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Portuguese</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Evidence for depression and schizophrenia in speech prosody</article-title>
          <year>2010</year>
          <conf-name>Third ISCA Workshop on Experimental Linguistics</conf-name>
          <conf-date>2010</conf-date>
          <conf-loc>Greece</conf-loc>
          <pub-id pub-id-type="doi">10.36505/exling-2010/03/0022/000142</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref38">
        <label>38</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kliper</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Portuguese</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Weinshall</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <person-group person-group-type="editor">
            <name name-style="western">
              <surname>Serino</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Matic</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Giakoumis</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Lopez</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Cipresso</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Prosodic analysis of speech and the underlying mental state</article-title>
          <source>Pervasive Computing Paradigms for Mental Health. MindCare 2015</source>
          <year>2016</year>
          <publisher-loc>Cham</publisher-loc>
          <publisher-name>Communications in Computer and Information Science, vol 604, Springer</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref39">
        <label>39</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Perlini</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Marini</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Garzitto</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Isola</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Cerruti</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Marinelli</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Rambaldelli</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Ferro</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Tomelleri</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Dusi</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Bellani</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Tansella</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Fabbro</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Brambilla</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Linguistic production and syntactic comprehension in schizophrenia and bipolar disorder</article-title>
          <source>Acta Psychiatr Scand</source>
          <year>2012</year>
          <month>11</month>
          <volume>126</volume>
          <issue>5</issue>
          <fpage>363</fpage>
          <lpage>376</lpage>
          <pub-id pub-id-type="doi">10.1111/j.1600-0447.2012.01864.x</pub-id>
          <pub-id pub-id-type="medline">22509998</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref40">
        <label>40</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tahir</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Chakraborty</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Thalmann</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Thalmann</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Maniam</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Binte Abdul Rashid</surname>
              <given-names>Nur Amirah</given-names>
            </name>
            <name name-style="western">
              <surname>Tan</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Lee Chee Keong</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Dauwels</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Non-verbal speech cues as objective measures for negative symptoms in patients with schizophrenia</article-title>
          <source>PLoS One</source>
          <year>2019</year>
          <month>04</month>
          <day>9</day>
          <volume>14</volume>
          <issue>4</issue>
          <fpage>e0214314</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dx.plos.org/10.1371/journal.pone.0214314"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pone.0214314</pub-id>
          <pub-id pub-id-type="medline">30964869</pub-id>
          <pub-id pub-id-type="pii">PONE-D-19-04262</pub-id>
          <pub-id pub-id-type="pmcid">PMC6456189</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref41">
        <label>41</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Guidi</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Schoentgen</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Bertschy</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Gentili</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Scilingo</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Vanello</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>Features of vocal frequency contour and speech rhythm in bipolar disorder</article-title>
          <source>Biomedical Signal Processing and Control</source>
          <year>2017</year>
          <month>08</month>
          <volume>37</volume>
          <fpage>23</fpage>
          <lpage>31</lpage>
          <pub-id pub-id-type="doi">10.1016/j.bspc.2017.01.017</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref42">
        <label>42</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Guidi</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Analysis of running speech for the characterization of mood state in bipolar patients</article-title>
          <year>2015</year>
          <conf-name>AEIT International Annual Conference</conf-name>
          <conf-date>October 14-16</conf-date>
          <conf-loc>Naples, Italy</conf-loc>
          <pub-id pub-id-type="doi">10.1109/aeit.2015.7415275</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref43">
        <label>43</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Pan</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Gui</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Xue</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Lin</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Zhu</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Cui</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Analysis on speech signal features of manic patients</article-title>
          <source>J Psychiatr Res</source>
          <year>2018</year>
          <month>03</month>
          <volume>98</volume>
          <fpage>59</fpage>
          <lpage>63</lpage>
          <pub-id pub-id-type="doi">10.1016/j.jpsychires.2017.12.012</pub-id>
          <pub-id pub-id-type="medline">29291581</pub-id>
          <pub-id pub-id-type="pii">S0022-3956(17)30481-8</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref44">
        <label>44</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hamm</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Kohler</surname>
              <given-names>CG</given-names>
            </name>
            <name name-style="western">
              <surname>Gur</surname>
              <given-names>RC</given-names>
            </name>
            <name name-style="western">
              <surname>Verma</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Automated facial action coding system for dynamic analysis of facial expressions in neuropsychiatric disorders</article-title>
          <source>J Neurosci Methods</source>
          <year>2011</year>
          <month>09</month>
          <day>15</day>
          <volume>200</volume>
          <issue>2</issue>
          <fpage>237</fpage>
          <lpage>256</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/21741407"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jneumeth.2011.06.023</pub-id>
          <pub-id pub-id-type="medline">21741407</pub-id>
          <pub-id pub-id-type="pii">S0165-0270(11)00358-X</pub-id>
          <pub-id pub-id-type="pmcid">PMC3402717</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref45">
        <label>45</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kupper</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Ramseyer</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Hoffmann</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Kalbermatten</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Tschacher</surname>
              <given-names>W</given-names>
            </name>
          </person-group>
          <article-title>Video-based quantification of body movement during social interaction indicates the severity of negative symptoms in patients with schizophrenia</article-title>
          <source>Schizophr Res</source>
          <year>2010</year>
          <month>08</month>
          <volume>121</volume>
          <issue>1-3</issue>
          <fpage>90</fpage>
          <lpage>100</lpage>
          <pub-id pub-id-type="doi">10.1016/j.schres.2010.03.032</pub-id>
          <pub-id pub-id-type="medline">20434313</pub-id>
          <pub-id pub-id-type="pii">S0920-9964(10)01203-X</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref46">
        <label>46</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sariyanidi</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Gunes</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Cavallaro</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Automatic analysis of facial affect: a survey of registration, representation, and recognition</article-title>
          <source>IEEE Trans Pattern Anal Mach Intell</source>
          <year>2015</year>
          <month>06</month>
          <volume>37</volume>
          <issue>6</issue>
          <fpage>1113</fpage>
          <lpage>1133</lpage>
          <pub-id pub-id-type="doi">10.1109/TPAMI.2014.2366127</pub-id>
          <pub-id pub-id-type="medline">26357337</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref47">
        <label>47</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gupta</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Haase</surname>
              <given-names>CM</given-names>
            </name>
            <name name-style="western">
              <surname>Strauss</surname>
              <given-names>GP</given-names>
            </name>
            <name name-style="western">
              <surname>Cohen</surname>
              <given-names>AS</given-names>
            </name>
            <name name-style="western">
              <surname>Mittal</surname>
              <given-names>VA</given-names>
            </name>
          </person-group>
          <article-title>Alterations in facial expressivity in youth at clinical high-risk for psychosis</article-title>
          <source>J Abnorm Psychol</source>
          <year>2019</year>
          <month>05</month>
          <volume>128</volume>
          <issue>4</issue>
          <fpage>341</fpage>
          <lpage>351</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/30869926"/>
          </comment>
          <pub-id pub-id-type="doi">10.1037/abn0000413</pub-id>
          <pub-id pub-id-type="medline">30869926</pub-id>
          <pub-id pub-id-type="pii">2019-13436-001</pub-id>
          <pub-id pub-id-type="pmcid">PMC6499690</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref48">
        <label>48</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Barrett</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Martin</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Milonova</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Gur</surname>
              <given-names>RE</given-names>
            </name>
            <name name-style="western">
              <surname>Gur</surname>
              <given-names>RC</given-names>
            </name>
            <name name-style="western">
              <surname>Kohler</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Verma</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Automated video-based facial expression analysis of neuropsychiatric disorders</article-title>
          <source>J Neurosci Methods</source>
          <year>2008</year>
          <month>02</month>
          <day>15</day>
          <volume>168</volume>
          <issue>1</issue>
          <fpage>224</fpage>
          <lpage>238</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/18045693"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jneumeth.2007.09.030</pub-id>
          <pub-id pub-id-type="medline">18045693</pub-id>
          <pub-id pub-id-type="pii">S0165-0270(07)00475-X</pub-id>
          <pub-id pub-id-type="pmcid">PMC2238802</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref49">
        <label>49</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Schneider</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Heimann</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Himer</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Huss</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Mattes</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Adam</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>Computer-based analysis of facial action in schizophrenic and depressed patients</article-title>
          <source>Eur Arch Psychiatry Clin Neurosci</source>
          <year>1990</year>
          <volume>240</volume>
          <issue>2</issue>
          <fpage>67</fpage>
          <lpage>76</lpage>
          <pub-id pub-id-type="doi">10.1007/BF02189974</pub-id>
          <pub-id pub-id-type="medline">2149651</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref50">
        <label>50</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pampouchidou</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Video-based depression detection using local Curvelet binary patterns in pairwise orthogonal planes</article-title>
          <year>2016</year>
          <conf-name>38th Annual International Conference of the IEEE Engineering in Medicine and Biology Society</conf-name>
          <conf-date>August 16-20</conf-date>
          <conf-loc>Orlando, Florida</conf-loc>
          <pub-id pub-id-type="doi">10.1109/embc.2016.7591564</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref51">
        <label>51</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Alghowinem</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Cross-cultural detection of depression from nonverbal behaviour</article-title>
          <year>2015</year>
          <conf-name>IEEE International Conference and Workshops on Automatic Face and Gesture Recognition</conf-name>
          <conf-date>May 4-8</conf-date>
          <conf-loc>Ljubljana, Slovenia</conf-loc>
          <pub-id pub-id-type="doi">10.1109/fg.2015.7163113</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref52">
        <label>52</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pearlson</surname>
              <given-names>GD</given-names>
            </name>
          </person-group>
          <article-title>Etiologic, phenomenologic, and endophenotypic overlap of schizophrenia and bipolar disorder</article-title>
          <source>Annu Rev Clin Psychol</source>
          <year>2015</year>
          <month>03</month>
          <day>28</day>
          <volume>11</volume>
          <issue>1</issue>
          <fpage>251</fpage>
          <lpage>281</lpage>
          <pub-id pub-id-type="doi">10.1146/annurev-clinpsy-032814-112915</pub-id>
          <pub-id pub-id-type="medline">25581236</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref53">
        <label>53</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yalincetin</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Bora</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Binbay</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Ulas</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Akdede</surname>
              <given-names>BB</given-names>
            </name>
            <name name-style="western">
              <surname>Alptekin</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Formal thought disorder in schizophrenia and bipolar disorder: a systematic review and meta-analysis</article-title>
          <source>Schizophr Res</source>
          <year>2017</year>
          <month>07</month>
          <volume>185</volume>
          <fpage>2</fpage>
          <lpage>8</lpage>
          <pub-id pub-id-type="doi">10.1016/j.schres.2016.12.015</pub-id>
          <pub-id pub-id-type="medline">28017494</pub-id>
          <pub-id pub-id-type="pii">S0920-9964(16)30589-8</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref54">
        <label>54</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Vijay</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Pennant</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Ongur</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Baker</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Morency</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Computational study of psychosis symptoms and facial expressions</article-title>
          <year>2016</year>
          <conf-name>Computer Human Interaction Workshops</conf-name>
          <conf-date>May 7-12</conf-date>
          <conf-loc>San Jose, California</conf-loc>
        </nlm-citation>
      </ref>
      <ref id="ref55">
        <label>55</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Shafer</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Meta-analysis of the brief psychiatric rating scale factor structure</article-title>
          <source>Psychol Assess</source>
          <year>2005</year>
          <month>09</month>
          <volume>17</volume>
          <issue>3</issue>
          <fpage>324</fpage>
          <lpage>35</lpage>
          <pub-id pub-id-type="doi">10.1037/1040-3590.17.3.324</pub-id>
          <pub-id pub-id-type="medline">16262458</pub-id>
          <pub-id pub-id-type="pii">2005-13213-008</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref56">
        <label>56</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Andreasen</surname>
              <given-names>NC</given-names>
            </name>
          </person-group>
          <article-title>The scale for the assessment of negative symptoms (SANS): conceptual and theoretical foundations</article-title>
          <source>Br J Psychiatry Suppl</source>
          <year>1989</year>
          <month>11</month>
          <issue>7</issue>
          <fpage>49</fpage>
          <lpage>58</lpage>
          <pub-id pub-id-type="doi">10.1192/S0007125000291496</pub-id>
          <pub-id pub-id-type="medline">2695141</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref57">
        <label>57</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hamilton</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>A rating scale for depression</article-title>
          <source>J Neurol Neurosurg Psychiatry</source>
          <year>1960</year>
          <month>02</month>
          <day>01</day>
          <volume>23</volume>
          <issue>1</issue>
          <fpage>56</fpage>
          <lpage>62</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://jnnp.bmj.com/lookup/pmidlookup?view=long&#38;pmid=14399272"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/jnnp.23.1.56</pub-id>
          <pub-id pub-id-type="medline">14399272</pub-id>
          <pub-id pub-id-type="pmcid">PMC495331</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref58">
        <label>58</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Young</surname>
              <given-names>RC</given-names>
            </name>
            <name name-style="western">
              <surname>Biggs</surname>
              <given-names>JT</given-names>
            </name>
            <name name-style="western">
              <surname>Ziegler</surname>
              <given-names>VE</given-names>
            </name>
            <name name-style="western">
              <surname>Meyer</surname>
              <given-names>DA</given-names>
            </name>
          </person-group>
          <article-title>A rating scale for mania: reliability, validity and sensitivity</article-title>
          <source>Br J Psychiatry</source>
          <year>1978</year>
          <month>11</month>
          <day>01</day>
          <volume>133</volume>
          <issue>5</issue>
          <fpage>429</fpage>
          <lpage>35</lpage>
          <pub-id pub-id-type="doi">10.1192/bjp.133.5.429</pub-id>
          <pub-id pub-id-type="medline">728692</pub-id>
          <pub-id pub-id-type="pii">S0007125000198551</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref59">
        <label>59</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Eyben</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Wöllmer</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Schuller</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>openSMILE: the Munich versatile and fast open-source audio feature extractor</article-title>
          <year>2010</year>
          <conf-name>International Conference on Multimedia</conf-name>
          <conf-date>October 25-29</conf-date>
          <conf-loc>Firenze, Italy</conf-loc>
          <fpage>1459</fpage>
          <lpage>62</lpage>
          <pub-id pub-id-type="doi">10.1145/1873951.1874246</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref60">
        <label>60</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Schuller</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>The INTERSPEECH computational paralinguistics challenge: social signals, conflict, emotion, autism</article-title>
          <year>2013</year>
          <conf-name>14th Annual Conference of the International Speech Communication Association</conf-name>
          <conf-date>August 25-29</conf-date>
          <conf-loc>Lyon, France</conf-loc>
        </nlm-citation>
      </ref>
      <ref id="ref61">
        <label>61</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Baltrusaitis</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Robinson</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Morency</surname>
              <given-names>LP</given-names>
            </name>
          </person-group>
          <article-title>OpenFace: an open source facial behavior analysis toolkit</article-title>
          <year>2016</year>
          <conf-name>2016 IEEE Winter Conference on Applications of Computer Vision</conf-name>
          <conf-date>March 7-10</conf-date>
          <conf-loc>Lake Placid, New York</conf-loc>
          <fpage>1</fpage>
          <lpage>10</lpage>
          <pub-id pub-id-type="doi">10.1109/wacv.2016.7477553</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref62">
        <label>62</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Friedman</surname>
              <given-names>JH</given-names>
            </name>
          </person-group>
          <article-title>Greedy function approximation: a gradient boosting machine</article-title>
          <source>Ann Statist</source>
          <year>2001</year>
          <month>10</month>
          <day>01</day>
          <volume>29</volume>
          <issue>5</issue>
          <fpage>1189</fpage>
          <lpage>1232</lpage>
          <pub-id pub-id-type="doi">10.1214/aos/1013203451</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref63">
        <label>63</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Varoquaux</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Buitinck</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Louppe</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Grisel</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Pedregosa</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Mueller</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Scikit-learn</article-title>
          <source>GetMobile</source>
          <year>2015</year>
          <month>06</month>
          <volume>19</volume>
          <issue>1</issue>
          <fpage>29</fpage>
          <lpage>33</lpage>
          <pub-id pub-id-type="doi">10.1145/2786984.2786995</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref64">
        <label>64</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Williamson</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Quatieri</surname>
              <given-names>TF</given-names>
            </name>
            <name name-style="western">
              <surname>Helfer</surname>
              <given-names>BS</given-names>
            </name>
            <name name-style="western">
              <surname>Ciccarelli</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Mehta</surname>
              <given-names>DD</given-names>
            </name>
          </person-group>
          <article-title>Vocal and facial biomarkers of depression based on motor incoordination and timing</article-title>
          <source>Proceedings of the 4th International Workshop on Audio/Visual Emotion Challenge</source>
          <year>2014</year>
          <conf-name>4th International Workshop on Audio/Visual Emotion Challenge</conf-name>
          <conf-date>November 7</conf-date>
          <conf-loc>Orlando, Florida</conf-loc>
          <fpage>65</fpage>
          <lpage>72</lpage>
          <pub-id pub-id-type="doi">10.1145/2661806.2661809</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref65">
        <label>65</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ray</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Kumar</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Reddy</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Mukherjee</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Garg</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Multilevel attention network using text, audio and video for depression prediction</article-title>
          <source>Proceedings of the 9th International on Audio/Visual Emotion Challenge and Workshop</source>
          <year>2019</year>
          <conf-name>9th International on Audio/Visual Emotion Challenge and Workshop</conf-name>
          <conf-date>October 21</conf-date>
          <conf-loc>Nice, France</conf-loc>
          <fpage>81</fpage>
          <lpage>88</lpage>
          <pub-id pub-id-type="doi">10.1145/3347320.3357697</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref66">
        <label>66</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Dibeklioglu</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Hammal</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Cohn</surname>
              <given-names>JF</given-names>
            </name>
          </person-group>
          <article-title>Dynamic multimodal measurement of depression severity using deep autoencoding</article-title>
          <source>IEEE J Biomed Health Inform</source>
          <year>2018</year>
          <month>03</month>
          <volume>22</volume>
          <issue>2</issue>
          <fpage>525</fpage>
          <lpage>536</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/28278485"/>
          </comment>
          <pub-id pub-id-type="doi">10.1109/JBHI.2017.2676878</pub-id>
          <pub-id pub-id-type="medline">28278485</pub-id>
          <pub-id pub-id-type="pmcid">PMC5581737</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref67">
        <label>67</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Abel</surname>
              <given-names>KM</given-names>
            </name>
            <name name-style="western">
              <surname>Drake</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Goldstein</surname>
              <given-names>JM</given-names>
            </name>
          </person-group>
          <article-title>Sex differences in schizophrenia</article-title>
          <source>Int Rev Psychiatry</source>
          <year>2010</year>
          <volume>22</volume>
          <issue>5</issue>
          <fpage>417</fpage>
          <lpage>28</lpage>
          <pub-id pub-id-type="doi">10.3109/09540261.2010.515205</pub-id>
          <pub-id pub-id-type="medline">21047156</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref68">
        <label>68</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mendrek</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Mancini-Marïe</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Sex/gender differences in the brain and cognition in schizophrenia</article-title>
          <source>Neurosci Biobehav Rev</source>
          <year>2016</year>
          <month>08</month>
          <volume>67</volume>
          <fpage>57</fpage>
          <lpage>78</lpage>
          <pub-id pub-id-type="doi">10.1016/j.neubiorev.2015.10.013</pub-id>
          <pub-id pub-id-type="medline">26743859</pub-id>
          <pub-id pub-id-type="pii">S0149-7634(15)30111-1</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref69">
        <label>69</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ragazan</surname>
              <given-names>DC</given-names>
            </name>
            <name name-style="western">
              <surname>Eberhard</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Berge</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Sex-specific associations between bipolar disorder pharmacological maintenance therapies and inpatient rehospitalizations: a 9-year Swedish national registry study</article-title>
          <source>Front Psychiatry</source>
          <year>2020</year>
          <volume>11</volume>
          <fpage>598946</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.3389/fpsyt.2020.598946"/>
          </comment>
          <pub-id pub-id-type="doi">10.3389/fpsyt.2020.598946</pub-id>
          <pub-id pub-id-type="medline">33262715</pub-id>
          <pub-id pub-id-type="pmcid">PMC7688467</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref70">
        <label>70</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mitchell</surname>
              <given-names>RHB</given-names>
            </name>
            <name name-style="western">
              <surname>Hower</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Birmaher</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Strober</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Merranko</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Rooks</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Goldstein</surname>
              <given-names>TR</given-names>
            </name>
            <name name-style="western">
              <surname>Hunt</surname>
              <given-names>JI</given-names>
            </name>
            <name name-style="western">
              <surname>Dickstein</surname>
              <given-names>DP</given-names>
            </name>
            <name name-style="western">
              <surname>Diler</surname>
              <given-names>RS</given-names>
            </name>
            <name name-style="western">
              <surname>Ryan</surname>
              <given-names>ND</given-names>
            </name>
            <name name-style="western">
              <surname>Gill</surname>
              <given-names>MK</given-names>
            </name>
            <name name-style="western">
              <surname>Axelson</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Keller</surname>
              <given-names>MB</given-names>
            </name>
            <name name-style="western">
              <surname>Yen</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Goldstein</surname>
              <given-names>BI</given-names>
            </name>
          </person-group>
          <article-title>Sex differences in the longitudinal course and outcome of bipolar disorder in youth</article-title>
          <source>J Clin Psychiatry</source>
          <year>2020</year>
          <month>10</month>
          <day>27</day>
          <volume>81</volume>
          <issue>6</issue>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/33113597"/>
          </comment>
          <pub-id pub-id-type="doi">10.4088/JCP.19m13159</pub-id>
          <pub-id pub-id-type="medline">33113597</pub-id>
          <pub-id pub-id-type="pmcid">PMC8597235</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref71">
        <label>71</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Vail</surname>
              <given-names>AK</given-names>
            </name>
          </person-group>
          <article-title>Visual attention in schizophrenia: eye contact and gaze aversion during clinical interactions</article-title>
          <year>2017</year>
          <conf-name>Seventh International Conference on Affective Computing and Intelligent Interaction</conf-name>
          <conf-date>October 23-26</conf-date>
          <conf-loc>San Antonio, Texas</conf-loc>
          <fpage>490</fpage>
          <lpage>497</lpage>
          <pub-id pub-id-type="doi">10.1109/acii.2017.8273644</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref72">
        <label>72</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Baker</surname>
              <given-names>JT</given-names>
            </name>
            <name name-style="western">
              <surname>Pennant</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Baltrušaitis</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Vijay</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Liebson</surname>
              <given-names>ES</given-names>
            </name>
            <name name-style="western">
              <surname>Ongur</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Morency</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Toward expert systems in mental health assessment: a computational approach to the face and voice in dyadic patient-doctor interactions</article-title>
          <source>iproc</source>
          <year>2016</year>
          <month>12</month>
          <day>30</day>
          <volume>2</volume>
          <issue>1</issue>
          <fpage>e44</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.iproc.org/2016/1/e44/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/iproc.6136</pub-id>
          <pub-id pub-id-type="pii">v2i1e44</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref73">
        <label>73</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Thombs</surname>
              <given-names>BD</given-names>
            </name>
            <name name-style="western">
              <surname>Roseman</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Kloda</surname>
              <given-names>LA</given-names>
            </name>
          </person-group>
          <article-title>Depression screening and mental health outcomes in children and adolescents: a systematic review protocol</article-title>
          <source>Syst Rev</source>
          <year>2012</year>
          <month>11</month>
          <day>24</day>
          <volume>1</volume>
          <issue>1</issue>
          <fpage>58</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://systematicreviewsjournal.biomedcentral.com/articles/10.1186/2046-4053-1-58"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/2046-4053-1-58</pub-id>
          <pub-id pub-id-type="medline">23176742</pub-id>
          <pub-id pub-id-type="pii">2046-4053-1-58</pub-id>
          <pub-id pub-id-type="pmcid">PMC3563607</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref74">
        <label>74</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Roseman</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Kloda</surname>
              <given-names>LA</given-names>
            </name>
            <name name-style="western">
              <surname>Saadat</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Riehm</surname>
              <given-names>KE</given-names>
            </name>
            <name name-style="western">
              <surname>Ickowicz</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Baltzer</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Katz</surname>
              <given-names>LY</given-names>
            </name>
            <name name-style="western">
              <surname>Patten</surname>
              <given-names>SB</given-names>
            </name>
            <name name-style="western">
              <surname>Rousseau</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Thombs</surname>
              <given-names>BD</given-names>
            </name>
          </person-group>
          <article-title>Accuracy of depression screening tools to detect major depression in children and adolescents: a systematic review</article-title>
          <source>Can J Psychiatry</source>
          <year>2016</year>
          <month>12</month>
          <day>09</day>
          <volume>61</volume>
          <issue>12</issue>
          <fpage>746</fpage>
          <lpage>757</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/27310247"/>
          </comment>
          <pub-id pub-id-type="doi">10.1177/0706743716651833</pub-id>
          <pub-id pub-id-type="medline">27310247</pub-id>
          <pub-id pub-id-type="pii">0706743716651833</pub-id>
          <pub-id pub-id-type="pmcid">PMC5564894</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref75">
        <label>75</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Addington</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Stowkowy</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Weiser</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Screening tools for clinical high risk for psychosis</article-title>
          <source>Early Interv Psychiatry</source>
          <year>2015</year>
          <month>10</month>
          <day>23</day>
          <volume>9</volume>
          <issue>5</issue>
          <fpage>345</fpage>
          <lpage>56</lpage>
          <pub-id pub-id-type="doi">10.1111/eip.12193</pub-id>
          <pub-id pub-id-type="medline">25345316</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref76">
        <label>76</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mulvaney-Day</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Marshall</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Downey Piscopo</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Korsen</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Lynch</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Karnell</surname>
              <given-names>LH</given-names>
            </name>
            <name name-style="western">
              <surname>Moran</surname>
              <given-names>GE</given-names>
            </name>
            <name name-style="western">
              <surname>Daniels</surname>
              <given-names>AS</given-names>
            </name>
            <name name-style="western">
              <surname>Ghose</surname>
              <given-names>SS</given-names>
            </name>
          </person-group>
          <article-title>Screening for behavioral health conditions in primary care settings: a systematic review of the literature</article-title>
          <source>J Gen Intern Med</source>
          <year>2018</year>
          <month>03</month>
          <day>25</day>
          <volume>33</volume>
          <issue>3</issue>
          <fpage>335</fpage>
          <lpage>346</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/28948432"/>
          </comment>
          <pub-id pub-id-type="doi">10.1007/s11606-017-4181-0</pub-id>
          <pub-id pub-id-type="medline">28948432</pub-id>
          <pub-id pub-id-type="pii">10.1007/s11606-017-4181-0</pub-id>
          <pub-id pub-id-type="pmcid">PMC5834951</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref77">
        <label>77</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gross</surname>
              <given-names>JJ</given-names>
            </name>
            <name name-style="western">
              <surname>Levenson</surname>
              <given-names>RW</given-names>
            </name>
          </person-group>
          <article-title>Emotion elicitation using films</article-title>
          <source>Cogn Emot</source>
          <year>1995</year>
          <month>01</month>
          <volume>9</volume>
          <issue>1</issue>
          <fpage>87</fpage>
          <lpage>108</lpage>
          <pub-id pub-id-type="doi">10.1080/02699939508408966</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref78">
        <label>78</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Vorperian</surname>
              <given-names>HK</given-names>
            </name>
            <name name-style="western">
              <surname>Kent</surname>
              <given-names>RD</given-names>
            </name>
          </person-group>
          <article-title>Vowel acoustic space development in children: a synthesis of acoustic and anatomic data</article-title>
          <source>J Speech Lang Hear Res</source>
          <year>2007</year>
          <month>12</month>
          <volume>50</volume>
          <issue>6</issue>
          <fpage>1510</fpage>
          <lpage>1545</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/18055771"/>
          </comment>
          <pub-id pub-id-type="doi">10.1044/1092-4388(2007/104)</pub-id>
          <pub-id pub-id-type="medline">18055771</pub-id>
          <pub-id pub-id-type="pii">50/6/1510</pub-id>
          <pub-id pub-id-type="pmcid">PMC2597712</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref79">
        <label>79</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>First</surname>
              <given-names>Michael B</given-names>
            </name>
          </person-group>
          <source>Structured Clinical Interview for the DSM-IV Axis I Disorders: SCID-I/P, Version 2.0</source>
          <year>1997</year>
          <publisher-loc>New York</publisher-loc>
          <publisher-name>Biometrics Research Dept., New York State Psychiatric Institute</publisher-name>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
