<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMH</journal-id>
      <journal-id journal-id-type="nlm-ta">JMIR Ment Health</journal-id>
      <journal-title>JMIR Mental Health</journal-title>
      <issn pub-type="epub">2368-7959</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v13i1e92197</article-id>
      <article-id pub-id-type="pmid">42133936</article-id>
      <article-id pub-id-type="doi">10.2196/92197</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Cross-Dataset Evaluation of an Automated Video-Based Model for Detecting Tardive Dyskinesia Using the Clinician’s Tardive Inventory: Validation Study</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Torous</surname>
            <given-names>John</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Aiken</surname>
            <given-names>Chris</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Trabassi</surname>
            <given-names>Dante</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Trosch</surname>
            <given-names>Richard</given-names>
          </name>
          <degrees>MD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0009-0006-5294-3782</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author" corresp="yes" equal-contrib="yes">
          <name name-style="western">
            <surname>Sterns</surname>
            <given-names>Anthony</given-names>
          </name>
          <degrees>BSE, MA, PhD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <address>
            <institution>Scripps Gerontology Center</institution>
            <institution>Miami University</institution>
            <addr-line>100 Bishop Circle</addr-line>
            <addr-line>Oxford, OH, 45056</addr-line>
            <country>United States</country>
            <phone>1 3306066675</phone>
            <email>sternsa3@miamioh.edu</email>
          </address>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-8609-9619</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Grimm</surname>
            <given-names>Bradley</given-names>
          </name>
          <degrees>MS</degrees>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-2896-5974</ext-link>
        </contrib>
        <contrib id="contrib4" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Larsen</surname>
            <given-names>Loren</given-names>
          </name>
          <degrees>MS</degrees>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-5818-6651</ext-link>
        </contrib>
        <contrib id="contrib5" contrib-type="author">
          <name name-style="western">
            <surname>Talbot</surname>
            <given-names>Bretton</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-3519-7638</ext-link>
        </contrib>
        <contrib id="contrib6" contrib-type="author">
          <name name-style="western">
            <surname>Ma</surname>
            <given-names>Fred</given-names>
          </name>
          <degrees>MD, PhD</degrees>
          <xref rid="aff4" ref-type="aff">4</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-0625-6560</ext-link>
        </contrib>
        <contrib id="contrib7" contrib-type="author">
          <name name-style="western">
            <surname>Ranjan</surname>
            <given-names>Rakesh</given-names>
          </name>
          <degrees>MD</degrees>
          <xref rid="aff5" ref-type="aff">5</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0009-0005-4005-9693</ext-link>
        </contrib>
        <contrib id="contrib8" contrib-type="author">
          <name name-style="western">
            <surname>MacMillan</surname>
            <given-names>Carlene</given-names>
          </name>
          <degrees>MD</degrees>
          <xref rid="aff6" ref-type="aff">6</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-3837-2443</ext-link>
        </contrib>
        <contrib id="contrib9" contrib-type="author">
          <name name-style="western">
            <surname>Hughes</surname>
            <given-names>Joel</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff7" ref-type="aff">7</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-6476-6588</ext-link>
        </contrib>
        <contrib id="contrib10" contrib-type="author">
          <name name-style="western">
            <surname>Friedman</surname>
            <given-names>Joseph</given-names>
          </name>
          <degrees>MD</degrees>
          <xref rid="aff8" ref-type="aff">8</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-2534-4160</ext-link>
        </contrib>
        <contrib id="contrib11" contrib-type="author">
          <name name-style="western">
            <surname>Muir</surname>
            <given-names>Owen</given-names>
          </name>
          <degrees>MD</degrees>
          <xref rid="aff4" ref-type="aff">4</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-4003-338X</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>William Beaumont School of Medicine</institution>
        <institution>Oakland University</institution>
        <addr-line>Farmington, MI</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff2">
        <label>2</label>
        <institution>Scripps Gerontology Center</institution>
        <institution>Miami University</institution>
        <addr-line>Oxford, OH</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff3">
        <label>3</label>
        <institution>Videra Health</institution>
        <addr-line>Orem, UT</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff4">
        <label>4</label>
        <institution>iRxReminder</institution>
        <addr-line>Cleveland, OH</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff5">
        <label>5</label>
        <institution>Charak Health and Wellness Center</institution>
        <addr-line>Cleveland, OH</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff6">
        <label>6</label>
        <institution>Radial Health</institution>
        <addr-line>Brooklyn, NY</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff7">
        <label>7</label>
        <institution>Department of Psychological Sciences</institution>
        <institution>Kent State University</institution>
        <addr-line>Kent, OH</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff8">
        <label>8</label>
        <institution>Butler Hospital</institution>
        <addr-line>Providence, RI</addr-line>
        <country>United States</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Anthony Sterns <email>sternsa3@miamioh.edu</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <year>2026</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>14</day>
        <month>5</month>
        <year>2026</year>
      </pub-date>
      <volume>13</volume>
      <elocation-id>e92197</elocation-id>
      <history>
        <date date-type="received">
          <day>26</day>
          <month>1</month>
          <year>2026</year>
        </date>
        <date date-type="rev-request">
          <day>20</day>
          <month>2</month>
          <year>2026</year>
        </date>
        <date date-type="rev-recd">
          <day>3</day>
          <month>4</month>
          <year>2026</year>
        </date>
        <date date-type="accepted">
          <day>4</day>
          <month>4</month>
          <year>2026</year>
        </date>
      </history>
      <copyright-statement>©Richard Trosch, Anthony Sterns, Bradley Grimm, Loren Larsen, Bretton Talbot, Fred Ma, Rakesh Ranjan, Carlene MacMillan, Joel Hughes, Joseph Friedman, Owen Muir. Originally published in JMIR Mental Health (https://mental.jmir.org), 14.05.2026.</copyright-statement>
      <copyright-year>2026</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Mental Health, is properly cited. The complete bibliographic information, a link to the original publication on https://mental.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://mental.jmir.org/2026/1/e92197" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>Tardive dyskinesia (TD) is a common, often underrecognized movement disorder resulting from long-term antipsychotic use, yet its detection in routine mental health care remains inconsistent despite the availability of structured rating scales.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>This study evaluated the performance of an artificial intelligence–powered, video-based model for detecting abnormal movements associated with TD using the Clinician’s Tardive Inventory (CTI) dataset. We compare automated assessments of videos from the CTI dataset with previously completed clinician-rated Abnormal Involuntary Movement Scale (AIMS) and CTI scores for the dataset’s videos to determine the model’s reliability and the accuracy of its assessment conclusions relative to expert raters.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>In total, 69 videos with corresponding AIMS and CTI ratings were analyzed using the visual transformer algorithm model called TDtect reported previously. The dataset included single-video assessments per participant, with varied instructions and movement types. The relationship between automated predictions and clinician ratings was assessed using Pearson correlation, and predictive accuracy was evaluated using area under the curve (AUC) metrics.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>The model showed a strong correlation with AIMS total scores (<italic>r</italic>=0.717) and high diagnostic accuracy (AUC 0.854), which improved further at an optimized threshold (AUC 0.900). Performance differed across anatomical regions, with the tongue, lips, and jaw displaying the highest predictive reliability. Functional CTI components had weaker correlations (<italic>r</italic>=0.27-0.63), as expected due to the subjective nature of these measures.</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>These findings provide preliminary evidence that an artificial intelligence–driven TD detection model can generalize across video protocols, suggesting potential for broader clinical applicability, although further validation is needed. Future refinements and fine-tuning are expected to enhance accuracy, particularly in predicting functional impact.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>mental health</kwd>
        <kwd>artificial intelligence</kwd>
        <kwd>AI</kwd>
        <kwd>medication adherence</kwd>
        <kwd>tardive dyskinesia</kwd>
        <kwd>remote patient monitoring</kwd>
        <kwd>movement disorders</kwd>
        <kwd>Clinician’s Tardive Inventory</kwd>
        <kwd>CTI</kwd>
        <kwd>Abnormal Involuntary Movement Scale</kwd>
        <kwd>AIMS</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <p>Tardive dyskinesia (TD) is a persistent neurological disorder caused by exposure to dopamine receptor–blocking agents, including antipsychotics and antiemetics [<xref ref-type="bibr" rid="ref1">1</xref>]. It is characterized by symptoms including stereotypy, akathisia, dystonia, chorea, myoclonus, vocalizations, and sensory issues [<xref ref-type="bibr" rid="ref2">2</xref>]. The prevalence of TD among those exposed is estimated to range from 15% to 40% in the United States, with risk factors such as age, drug class, treatment duration, and the presence of movement-related side effects during early treatment stages [<xref ref-type="bibr" rid="ref3">3</xref>-<xref ref-type="bibr" rid="ref6">6</xref>]. In addition to discomfort, TD is linked to increased morbidity, stigmatization, and reduced quality of life [<xref ref-type="bibr" rid="ref7">7</xref>].</p>
      <p>Despite available treatments, TD remains underdiagnosed [<xref ref-type="bibr" rid="ref8">8</xref>]. Early detection of TD facilitates prompt treatment with effective interventions to mitigate morbidity. The gap in the use of the 2 available Food and Drug Administration–designated breakthrough treatments, compared to the predicted prevalence of TD in the population, highlights the need for improved screening methods.</p>
      <p>Traditional TD screening and assessment rely on clinician-administered tools such as the Abnormal Involuntary Movement Scale (AIMS). However, the AIMS is a rating scale designed to quantify the severity of abnormal movements across 7 anatomical regions, and its use to screen for TD may be inappropriate according to expert consensus [<xref ref-type="bibr" rid="ref9">9</xref>]. Furthermore, the AIMS has notable limitations [<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref11">11</xref>]. It lacks specific movement descriptors, does not comprehensively address all TD movements, does not document the number of abnormal movements present, and does not provide independent measures of frequency and amplitude. As our understanding of TD phenomenology has expanded, there is a need for updated and objective diagnostic tools [<xref ref-type="bibr" rid="ref12">12</xref>]. The Clinician’s Tardive Inventory (CTI) is a validated tool developed to address these limitations, integrating both structured anatomical movement assessment and evaluation of functional impact into a single, repeatable inventory.</p>
      <p>Sterns et al [<xref ref-type="bibr" rid="ref13">13</xref>] described the TDtect visual transformer algorithm, a novel deep learning model designed to enhance the accuracy of TD detection using automated video analysis. Although traditional convolutional neural networks [<xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref14">14</xref>] excel at extracting local spatial features, TDtect leverages a transformer architecture to process video frames by dividing them into patches and using self-attention mechanisms to capture long-range temporal dependencies across movements. This approach enables more comprehensive feature extraction across the temporal dimension.</p>
      <p>The initial studies on TDtect demonstrated improved sensitivity and specificity in identifying TD-related motor disturbances compared to clinician-rated AIMS measures. By leveraging machine learning, TDtect may allow reduced dependence on prior clinical experience in routine TD screening. TDtect is designed to be deployed through a smartphone app, at a scale commensurate with the millions of individuals likely affected.</p>
      <p>The initial studies evaluating the TDtect algorithm demonstrated that visual transformer algorithms could be used to analyze facial, oral, and body movements in video recordings of AIMS assessments. However, the initial investigations only evaluated this algorithm on videos in which participants performed the steps of the AIMS assessment. This study evaluates the model’s performance against a different dataset. Here, we evaluate a video dataset collected to evaluate the clinician-rated CTI. This collection of 69 patient videos, with corresponding expert-completed ratings on both CTI and AIMS, was used as an additional independent dataset to evaluate the performance of the TDtect visual transformer model.</p>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Dataset and Participants</title>
        <p>The CTI dataset initially contained 73 video recordings of people, many of whom are living with TD. Of these, 70 had corresponding AIMS and CTI ratings. After matching videos with their appropriate ratings, we obtained 69 complete samples (video recordings with matched AIMS and CTI ratings) for our final analysis. Two movement disorders specialists independently confirmed the diagnosis of TD [<xref ref-type="bibr" rid="ref12">12</xref>]. Unlike structured National Institute of Health datasets, which use multiple reviewers and standardized movement instructions, this dataset included single-video assessments with adaptive participant instructions. The videos ranged from 1 to 6 minutes in length and included individuals sitting, standing, and performing targeted movements as shown in <xref ref-type="table" rid="table1">Table 1</xref>.</p>
        <table-wrap position="float" id="table1">
          <label>Table 1</label>
          <caption>
            <p>Description of the video data components for each study element.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="120"/>
            <col width="160"/>
            <col width="100"/>
            <col width="250"/>
            <col width="270"/>
            <col width="100"/>
            <thead>
              <tr valign="bottom">
                <td>Study element</td>
                <td>Participants, n (%)<sup>a</sup></td>
                <td>Videos, n</td>
                <td>Clip duration (seconds), mean (SD)</td>
                <td>Session duration (minutes), mean (SD)</td>
                <td>Assessment</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Study 1<sup>b</sup></td>
                <td>46 (100)</td>
                <td>18</td>
                <td>34 (19)</td>
                <td>11.40 (2.98)</td>
                <td>AIMS<sup>c,d</sup></td>
              </tr>
              <tr valign="top">
                <td>Study 2<sup>b</sup></td>
                <td>136 (100)</td>
                <td>22</td>
                <td>47 (31)</td>
                <td>13.50 (3.77)</td>
                <td>AIMS<sup>d</sup></td>
              </tr>
              <tr valign="top">
                <td>Study 3<sup>b</sup></td>
                <td>174 (100)</td>
                <td>4</td>
                <td>71 (50)</td>
                <td>3.43 (2.11)</td>
                <td>AIMS<sup>e</sup></td>
              </tr>
              <tr valign="top">
                <td>CTI<sup>f</sup> dataset</td>
                <td>69 (100)</td>
                <td>1</td>
                <td>170 (71)</td>
                <td>2.83 (1.19)</td>
                <td>AIMS+CTI<sup>g</sup></td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table1fn1">
              <p><sup>a</sup>Participant n values reflect independent study populations enrolled under separate protocols; aggregate percentages across studies are not reported as they would be misleading.</p>
            </fn>
            <fn id="table1fn2">
              <p><sup>b</sup>Studies 1 to 3 from the iRx-Videra National Institute of Health protocol (Sterns et al [<xref ref-type="bibr" rid="ref13">13</xref>]).</p>
            </fn>
            <fn id="table1fn3">
              <p><sup>c</sup>AIMS: Abnormal Involuntary Movement Scale.</p>
            </fn>
            <fn id="table1fn4">
              <p><sup>d</sup>Assessment was conducted using recorded videos in a controlled environment.</p>
            </fn>
            <fn id="table1fn5">
              <p><sup>e</sup>Assessment was performed by a clinician in a face-to-face clinical setting.</p>
            </fn>
            <fn id="table1fn6">
              <p><sup>f</sup>CTI: Clinician’s Tardive Inventory.</p>
            </fn>
            <fn id="table1fn7">
              <p><sup>g</sup>Assessments were performed by a clinician in a face-to-face clinical setting while being recorded.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
      <sec>
        <title>Video Processing and Analysis</title>
        <p>Video recordings from the CTI dataset were processed using a standardized pipeline. First, we used facial detection algorithms to isolate the face, which was analyzed separately from the body before combining the features later in our pipeline. Then, the model examined movement patterns at the per-second level using temporal feature extraction to identify potential dyskinetic movements. For each video, multiple regions of interest (facial and full body) were processed independently to ensure comprehensive movement detection. The final severity scores were derived from aggregated regional assessments, with automated quality control algorithms excluding segments with poor video quality or tracking failures. Regional movement frequencies and amplitudes were quantified using statistical features that capture temporal patterns characteristic of TD movements. This approach enabled assessment of both overall TD severity and anatomical distribution without requiring manual preprocessing or standardized instructions.</p>
      </sec>
      <sec>
        <title>The CTI Tool</title>
        <p>The CTI was developed as a structured assessment tool to document anatomical movement abnormalities and functional impairments associated with TD. The scale evaluates six core movement categories:</p>
        <list list-type="order">
          <list-item>
            <p>Eye, eyelid, and facial movements (eg, excessive blinking, forceful eyelid closure, and facial grimacing)</p>
          </list-item>
          <list-item>
            <p>Tongue and mouth movements (eg, tongue darting, lip smacking, and intraoral movements)</p>
          </list-item>
          <list-item>
            <p>Jaw movements (eg, chewing, grinding, and jaw displacement)</p>
          </list-item>
          <list-item>
            <p>Limb and trunk movements (eg, repetitive foot tapping, truncal rocking, and postural adjustments)</p>
          </list-item>
          <list-item>
            <p>Complex movements (eg, hand-wringing, self-caressing, and fidgety leg movements)</p>
          </list-item>
          <list-item>
            <p>Abnormal vocalizations (eg, irregular respiration, grunting, and moaning)</p>
          </list-item>
        </list>
        <p>Each movement category is rated on a 0 to 3 scale based on frequency, with scores ranging from absent (0) to constant (3). Functional impairments, including activities of daily living, social distress, and physical harm, are rated separately from 0 (unaware or unaffected) to 3 (severe impact) [<xref ref-type="bibr" rid="ref12">12</xref>].</p>
      </sec>
      <sec>
        <title>TDtect Algorithm</title>
        <p>The development of the TDtect algorithm has been described previously by Sterns et al [<xref ref-type="bibr" rid="ref13">13</xref>]. The current TDtect model incorporates refinements since the original publication, including enhanced capability to process unstructured video assessments of variable duration through temporal averaging of frame-level predictions. These improvements enable the model to maintain diagnostic accuracy across diverse clinical video protocols without requiring standardized assessment instructions. In brief, the TDtect training dataset consisted of 3979 video responses collected across 3 independent studies involving 356 participants. Study 1 (46/356, 13%) and study 2 (136/356, 38%) were video AIMS assessments conducted in a clinical setting and evaluated by 3 trained raters. Study 3 (174/356, 49%) consisted of patients with a traditional AIMS assessment evaluated by a single trained rater. The TDtect video assessment session has four segments: (1) the patient sitting still, (2) the patient with an open mouth and tongue inside, (3) the patients with an open mouth and the tongue extended, and (4) answering an open-ended question about daily activities. The assessments had an average duration of 2 minutes and 44 seconds.</p>
        <p>The TDtect algorithm architecture model uses a vision transformer framework, which enables precise tracking of subtle, involuntary movements. TDtect’s performance was previously benchmarked against clinician-rated AIMS with an area under the curve (AUC) of 0.89 in validation testing [<xref ref-type="bibr" rid="ref13">13</xref>].</p>
        <p>The TDtect model was not trained on any of the CTI dataset used to validate the CTI [<xref ref-type="bibr" rid="ref12">12</xref>]. However, given the shared clinical population of individuals with TD in the CTI dataset, it was deemed a valid use of the TDtect model. The TDtect model has continued to be refined since the algorithm was reported [<xref ref-type="bibr" rid="ref13">13</xref>]. This study used the most current iteration of the algorithm, trained through December 2024, which incorporates more participants and enhanced labeling methodologies. These enhancements improved the AUC from 0.89 to 0.906 [<xref ref-type="bibr" rid="ref13">13</xref>]. Performance metrics have improved on validation datasets compared to earlier versions. A key enhancement is its expanded capability for analyzing unstructured assessment sessions, allowing the model to evaluate TD movements regardless of specific instruction protocols. The model architecture has also been optimized to better handle the variability in real-world clinical assessments while maintaining high diagnostic accuracy. Detailed technical specifications and comparative performance metrics of this refined algorithm will be addressed in a separate technical publication.</p>
      </sec>
      <sec>
        <title>Statistical Analysis</title>
        <p>For this cross-dataset evaluation, we analyzed 69 paired samples of video recordings and corresponding clinical ratings from the CTI dataset. The statistical analysis plan designated two primary outcomes: (1) Pearson correlation coefficient between automated TDtect scores and clinician-rated AIMS total scores and (2) area under curve (AUC) or more formally area under the receiver operating characteristic curve, for TD diagnosis using the Schooler-Kane criteria [<xref ref-type="bibr" rid="ref15">15</xref>]. Correlation between TDtect regional subscores and CTI frequency ratings was examined as an exploratory secondary analysis to assess anatomical specificity.</p>
        <p>For the AUC analysis, we used 2 complementary approaches. First, we measured AUC using the Schooler-Kane methodology for TD diagnosis [<xref ref-type="bibr" rid="ref15">15</xref>] as the reference standard. However, due to the high prevalence of positive cases in our population, which created a significant class imbalance, we also evaluated AUC using a more stringent threshold to better differentiate between moderate and severe cases. This second approach allowed us to assess the model’s ability to identify pronounced TD cases, which may be more clinically relevant. Sensitivity and specificity were calculated for both ground-truth labeling schemes, with the optimal model output cut point for each determined using Youden J statistic [<xref ref-type="bibr" rid="ref16">16</xref>]. As the Youden-optimal cut point was identified on the same dataset used for evaluation, reported sensitivity and specificity values should be considered exploratory; AUC, which integrates performance across all thresholds, is the primary performance metric. This comprehensive approach enables assessment of both continuous score agreement and categorical diagnostic performance across different severity levels.</p>
      </sec>
      <sec>
        <title>Ethical Considerations</title>
        <p>The cited study by Sterns et al [<xref ref-type="bibr" rid="ref13">13</xref>], on which the algorithm is based, was approved and overseen by the Creative Action LLC Institutional Review Board, a National Institutes of Health–registered institutional review board (FWA #10005). All patients provided informed consent, which was documented and reviewed. Participants’ video data were only available to the expert reviewers. The participants received compensation in the form of a gift card.</p>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>Overall Model Performance</title>
        <p>The TDtect model, without any retraining or fine-tuning for assessment of the CTI dataset, demonstrated a strong correlation with clinician-rated AIMS total scores (<italic>r</italic>=0.717; 69/69, 100%). This correlation strength is particularly notable given the nonstandardized nature of the video protocol used in the CTI dataset compared to the structured protocol used in the model’s original training.</p>
        <p>Bland-Altman analysis was performed using isotonic regression calibration to assess score-level agreement, as the unstructured assessment version produces uncalibrated outputs that require alignment with clinician rating scales (<xref rid="figure1" ref-type="fig">Figure 1</xref>) [<xref ref-type="bibr" rid="ref17">17</xref>]. The analysis demonstrated negligible bias (mean difference approximately 0), with limits of agreement ranging from –6.32 to +6.32. A small but statistically significant proportional bias remained (slope=–0.26; <italic>P=</italic>.002), suggesting slight underestimation at higher severity levels.</p>
        <p>Diagnostic classification performance was evaluated using receiver operating characteristic curve analysis. Using the Schooler-Kane diagnostic criteria for TD identification, the model achieved an AUC of 0.854 in a dataset in which 80% of samples showed positive findings according to clinician rating [<xref ref-type="bibr" rid="ref15">15</xref>]. This performance is comparable to the AUC of 0.89 reported in our previous validation studies using standardized assessment protocols (<xref rid="figure2" ref-type="fig">Figure 2</xref>) [<xref ref-type="bibr" rid="ref13">13</xref>]. <xref ref-type="table" rid="table2">Table 2</xref> summarizes the key performance metrics of the model, including correlation with AIMS, diagnostic accuracy measures, and characteristics of the dataset used for validation. Calibration analysis yielded a Brier score of 0.137 (AIMS ≥12), and the calibration curve (<xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>) showed reasonable calibration across the mid- to high-probability range.</p>
        <fig id="figure1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>Bland-Altman graph. AIMS: Abnormal Involuntary Movement Scale.</p>
          </caption>
          <graphic xlink:href="mental_v13i1e92197_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <fig id="figure2" position="float">
          <label>Figure 2</label>
          <caption>
            <p>Receiver operating characteristic (ROC) curves for model performance, showing (A) discrimination for the Abnormal Involuntary Movement Scale (AIMS) diagnostic classification and (B) discrimination for AIMS total scores ≥12.</p>
          </caption>
          <graphic xlink:href="mental_v13i1e92197_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <table-wrap position="float" id="table2">
          <label>Table 2</label>
          <caption>
            <p>Model performance metrics for predicting Abnormal Involuntary Movement Scale (AIMS) scores (N=69).</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="470"/>
            <col width="500"/>
            <thead>
              <tr valign="top">
                <td colspan="2">Metric</td>
                <td>Values</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="2">Pearson correlation with AIMS (95% CI)</td>
                <td>0.717 (0.577-0.824)</td>
              </tr>
              <tr valign="top">
                <td colspan="2">Diagnostic AUC (95% CI)<sup>a,b</sup></td>
                <td>0.854 (0.754-0.934)</td>
              </tr>
              <tr valign="top">
                <td colspan="2">AUC (95% CI) (threshold ≥12)</td>
                <td>0.900 (0.822-0.958)</td>
              </tr>
              <tr valign="top">
                <td colspan="2">Sensitivity (95% CI)</td>
                <td>0.727 (0.566-0.875)</td>
              </tr>
              <tr valign="top">
                <td colspan="2">Specificity (95% CI)</td>
                <td>0.929 (0.818-1.000)</td>
              </tr>
              <tr valign="top">
                <td colspan="2">Brier score (Schooler-Kane criteria)<sup>c</sup></td>
                <td>0.128</td>
              </tr>
              <tr valign="top">
                <td colspan="2">Brier score (AIMS ≥12)<sup>c</sup></td>
                <td>0.137</td>
              </tr>
              <tr valign="top">
                <td colspan="2">Positive cases (%)</td>
                <td>80%</td>
              </tr>
              <tr valign="top">
                <td colspan="3">
                  <bold>Video duration (seconds)</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Range</td>
                <td>34-388</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Mean (SD)</td>
                <td>170 (71)</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table2fn1">
              <p><sup>a</sup>AUC: area under the curve.</p>
            </fn>
            <fn id="table2fn2">
              <p><sup>b</sup>Diagnostic classification was based on the Schooler-Kane criteria.</p>
            </fn>
            <fn id="table2fn3">
              <p><sup>c</sup>For reference, a naive classifier predicting the base rate for every sample would give a Brier score of approximately 0.16 (Schooler-Kane criteria) and approximately 0.23 (AIMS ≥12); therefore, the model outperformed that baseline.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <p>Using the Schooler-Kane criteria, TDtect achieved average precision scores of 0.964 (<xref rid="figure3" ref-type="fig">Figure 3</xref>A) and 0.822 for AIMS ≥12 (<xref rid="figure3" ref-type="fig">Figure 3</xref>B). The precision-recall curves show model performance across all decision thresholds, with precision representing positive predictive value and recall representing sensitivity. The baseline represents the proportion of positive cases in each classification scheme (79.7%, 55/69 and 36.2%, 25/69, respectively). These results complement the receiver operating characteristic analysis and provide additional insight into model performance for clinical screening applications where positive predictive value is particularly important.</p>
        <fig id="figure3" position="float">
          <label>Figure 3</label>
          <caption>
            <p>Precision-recall (PR) analysis for TDtect model performance, showing (A) discrimination for Abnormal Involuntary Movement Scale (AIMS) diagnostic classification and (B) discrimination for AIMS total scores ≥12. AP: average precision.</p>
          </caption>
          <graphic xlink:href="mental_v13i1e92197_fig3.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <p>When analyzing optimal threshold selection, we found that classification performance could be further improved to an AUC of 0.900 when using a more stringent threshold (AIMS total score≥12), which identified 36% of the sample as positive cases. This finding suggests that the model demonstrates particularly high accuracy in identifying more pronounced cases of TD, which has important clinical implications for identifying patients most in need of intervention [<xref ref-type="bibr" rid="ref18">18</xref>].</p>
      </sec>
      <sec>
        <title>Anatomical Region-Specific Performance</title>
        <p>The model’s detection capabilities varied across different anatomical regions, providing insights into its strengths and potential limitations in clinical application. <xref rid="figure2" ref-type="fig">Figure 2</xref> summarizes the AUC values across different body regions and severity thresholds.</p>
        <p>The orofacial region, particularly tongue movements, demonstrated the highest detection reliability (AUC range 0.87-0.95 across severity thresholds). This aligns with clinical expectations, as abnormal tongue movements represent one of the most visually distinctive and prevalent manifestations of TD. Lip and jaw movements also showed good detection performance (AUC 0.76-0.92), consistent with the orofacial predominance typically seen in TD.</p>
        <p>Upper extremity movements were detected with good reliability (AUC 0.69-0.98), with performance notably stronger at higher severity thresholds. Lower extremity and trunk movements showed moderate reliability (AUC 0.75-0.84). Detection of eye movements was more challenging (AUC 0.51-0.63), likely reflecting the subtlety of these movements and their potential confounding with normal blinking patterns.</p>
      </sec>
      <sec>
        <title>Correlation With CTI Components</title>
        <p>As a secondary exploratory analysis, we examined how well TDtect regional subscores aligned with CTI frequency ratings to assess anatomical specificity of model predictions. Analysis of correlations with CTI frequency ratings revealed moderate-to-strong associations across movement categories (<xref rid="figure4" ref-type="fig">Figure 4</xref>).</p>
        <fig id="figure4" position="float">
          <label>Figure 4</label>
          <caption>
            <p>Area under the curve (AUC) across movement categories and severities. AIMS: Abnormal Involuntary Movement Scale.</p>
          </caption>
          <graphic xlink:href="mental_v13i1e92197_fig4.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <p>Particularly noteworthy was the anatomical specificity observed in these correlations. The model’s region-specific subscores showed the strongest relationships with clinically rated movements in the corresponding body areas (<xref ref-type="table" rid="table3">Table 3</xref>). For example, the jaw subscore correlated most strongly with CTI jaw movement ratings (<italic>r</italic>=0.732), and the tongue subscore correlated most strongly with CTI tongue movement items (<italic>r</italic>=0.55). This anatomical consistency provides compelling evidence that the model is detecting clinically meaningful movement patterns rather than nonspecific indicators.</p>
        <table-wrap position="float" id="table3">
          <label>Table 3</label>
          <caption>
            <p>Correlations between Clinician’s Tardive Inventory frequency ratings and predicted Abnormal Involuntary Movement Scale subscores.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="300"/>
            <col width="300"/>
            <col width="400"/>
            <thead>
              <tr valign="top">
                <td>Frequency metric<sup>a</sup></td>
                <td>Frequency value (95% CI)</td>
                <td>Predicted subregion score<sup>b</sup></td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Eye</td>
                <td>0.499 (0.300-0.679)</td>
                <td>Face</td>
              </tr>
              <tr valign="top">
                <td>Tongue</td>
                <td>0.552 (0.419-0.719)</td>
                <td>Tongue</td>
              </tr>
              <tr valign="top">
                <td>Jaw</td>
                <td>0.732 (0.626-0.828)</td>
                <td>Jaw</td>
              </tr>
              <tr valign="top">
                <td>Complex</td>
                <td>0.572 (0.393-0.730)</td>
                <td>Upper extremity</td>
              </tr>
              <tr valign="top">
                <td>Limb</td>
                <td>0.261 (0.243-0.549)</td>
                <td>Trunk</td>
              </tr>
              <tr valign="top">
                <td>Vocal</td>
                <td>0.464 (0.248-0.718)</td>
                <td>Face</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table3fn1">
              <p><sup>a</sup>Frequency metrics were derived from the Clinician’s Tardive Inventory examination.</p>
            </fn>
            <fn id="table3fn2">
              <p><sup>b</sup>Subregion predicted by the model with the highest correlation.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Principal Findings</title>
        <p>The results of this study demonstrate that an artificial intelligence (AI)–powered video analysis model can provide reliable TD assessments, even in the absence of a standard video capture protocol. This cross-dataset evaluation suggests that automated screening may complement clinician assessments, supporting further investigation into its role in clinical workflows.</p>
        <p>The AUC of 0.854, using the Schooler-Kane criteria, highlights the difficulty of distinguishing TD from non-TD in a population in which about 80% of participants meet diagnostic criteria—a class imbalance that narrows the range of possible AUC values compared with a balanced population. When evaluated at a threshold that provides a more balanced class split (AIMS ≥12; 36% positive cases), the model achieves an AUC of 0.900, closely aligning with the 0.89 AUC reported in earlier validation studies conducted under structured AIMS protocols. The remaining performance difference at the Schooler-Kane threshold is expected, considering that the model was applied without any fine-tuning to an unstructured video protocol on which it was not trained; temporal averaging of frame-level predictions was the only adjustment. Fine-tuning on a larger unstructured dataset could potentially reduce this gap further.</p>
        <p>The moderate performance in functional impairment categories (<italic>r</italic>=0.27-0.63) is notable, given that the model was trained exclusively on motor movement data without functional impact labels, suggesting that the algorithm captures movement patterns that genuinely predict real-world consequences. Future iterations may improve these predictions by incorporating additional training datasets and refined subregion analysis.</p>
        <p>The observed pattern of anatomical specificity in our correlations has important implications. The higher reliability in orofacial regions (particularly tongue and jaw movements) aligns with the typical presentation of TD, in which these movements are often the earliest and most persistent manifestations. The comparatively lower correlations with limb movements (<italic>r</italic>=0.261) suggest that additional training may be needed to recognize the more variable presentation of TD in the extremities. Importantly, the strong agreement between the model and clinician ratings for jaw movements (<italic>r</italic>=0.732) is particularly promising, as these movements are often considered diagnostic hallmarks of TD and disabling for patients. The model’s ability to detect these movements with high accuracy, even in nonstandardized video recordings, suggests that it could serve as an effective screening tool in real-world clinical settings (eg, accessing a video collected during a routine telemedicine appointment) where structured assessments may not always be practical.</p>
      </sec>
      <sec>
        <title>Remote Monitoring and Specialist Integration</title>
        <p>These results support the exploration of TDtect’s integration into remote monitoring workflows. Implementing such an envisioned remote patient monitoring service could represent a paradigm shift in TD management. The AI-based detection model could be integrated into both traditional and telepsychiatry practice, allowing psychiatrists to monitor patients remotely. When TD is detected, the patient’s case could be escalated to a movement disorder specialist for confirmation; treatment recommendations; and, if needed, ongoing management. A structured referral system, as has proven successful in other disorders that require high degrees of expertise, might ensure that patients receive timely and expert intervention. Future work should evaluate whether AI-flagged cases can be effectively escalated to movement disorder specialists and whether such workflows improve early detection rates in real-world settings.</p>
        <p>TDtect is designed as a screening tool; its intended clinical role is to identify patients who may have TD and should be referred for formal evaluation, not to replace clinician-administered diagnostic instruments such as the AIMS or CTI. Performance metrics in this paper should be interpreted in this context: sensitivity at the detection threshold is the primary concern, proportional bias at higher severity levels is a secondary consideration relevant to future severity quantification work, and all claims about clinical deployment refer to screening workflows in which positive flags are followed by clinician confirmation.</p>
      </sec>
      <sec>
        <title>Limitations</title>
        <p>Although TDtect demonstrated high accuracy in detecting TD, several limitations must be acknowledged, suggesting areas for further investigation and clinical development. First, the current model does not yet provide automated assessment of frequency and severity across all movement zones defined by the CTI; future iterations should be trained to generate severity and frequency ratings across the full spectrum of clinically relevant abnormal movements. The robustness of diagnostic predictions remains constrained by the size and diversity of the training dataset, highlighting the need to incorporate broader and more representative real-world clinical data. Additionally, rigorous prospective trials remain necessary to clinically validate the TDtect algorithm, particularly through comparative studies evaluating its severity assessments against consensus ratings from multiple clinicians using established measures such as the AIMS and CTI. To enhance the model’s differential diagnostic capacity, future training sets should integrate video data from individuals presenting with a range of other movement disorders. Personalized dynamic monitoring systems that can adapt to individual patient profiles warrant further integration, allowing for the development of actionable, patient-specific alerts and more responsive longitudinal tracking.</p>
        <p>Small validation samples are a known limitation in biomedical reliability research. Guidelines usually recommend larger cohorts than what a single-site specialty population can realistically provide for stable agreement estimates [<xref ref-type="bibr" rid="ref19">19</xref>,<xref ref-type="bibr" rid="ref20">20</xref>]. Our evaluation sample (N=69) was sufficient to demonstrate cross-protocol generalization, but it limits the precision of regional performance estimates, as seen in the wide bootstrap CIs for several anatomical regions, and does not permit formal demographic subgroup analysis. Data balancing and generative augmentation have shown promise in similar small, imbalanced clinical datasets [<xref ref-type="bibr" rid="ref21">21</xref>], though augmenting the evaluation set alone would not fix the fundamental constraint here. Collecting larger unstructured video datasets prospectively remains the most direct way to refine the temporal aggregation process and achieve more accurate generalizability estimates.</p>
        <p>Interpretation of TDtect’s performance is also limited by inherent differences in protocol across the CTI dataset, which may pose challenges for direct comparison with standardized rating instruments. Furthermore, the absence of model fine-tuning with this dataset suggests that further targeted training may yield higher accuracy. Ultimately, by addressing these limitations—including refining sensitivity thresholds, expanding the training corpus, and advancing model personalization—the algorithm may evolve into a more comprehensive AI-driven diagnostic and monitoring platform, bridging the gap between automated detection and specialist intervention [<xref ref-type="bibr" rid="ref12">12</xref>,<xref ref-type="bibr" rid="ref13">13</xref>].</p>
        <p>The dataset’s high TD prevalence (approximately 80% positive under the Schooler-Kane criteria) reflects the specialty movement disorder population from which it was drawn, but limits generalizability to screening contexts where prevalence is lower. AUC values should be interpreted in light of this class distribution; positive and negative predictive values would differ substantially in a general psychiatric population. The AIMS ≥12 threshold result (AUC 0.900; 36% positive for likelihood of having TD vs 64% negative for likelihood not having TD; the CTI dataset is 80% positive for TD) provides a complementary estimate under more balanced conditions.</p>
        <p>This analysis does not include a formal evaluation of algorithmic bias across demographic subgroups. Although the training dataset included participants across racial and ethnic groups (Sterns et al [<xref ref-type="bibr" rid="ref13">13</xref>]), the CTI sample (N=69) does not provide sufficient statistical power for subgroup performance analysis. Future studies should incorporate larger, demographically stratified samples to evaluate potential differential performance. Additionally, although the CTI dataset’s variable recording conditions represent a step toward real-world robustness, systematic evaluation across telehealth platforms, mobile devices, and diverse environmental conditions is needed before deployment at scale.</p>
      </sec>
      <sec>
        <title>Future Research</title>
        <p>Future research should emphasize a longitudinal approach in which individuals are monitored monthly or quarterly alongside medication tracking to fully evaluate the potential of smartphone-based monitoring of TD. Another avenue for future research is to explore the integration of this AI-based diagnostic tool into routine telemedicine sessions. This could enhance ongoing care for individuals receiving antipsychotic medications by providing continuous, remote monitoring for early signs of TD, allowing for timely intervention.</p>
        <p>Future research should also focus on integrating medication adherence monitoring with TD diagnostics. Understanding patients’ adherence patterns will provide critical insights into how treatment strategies can be adjusted to prevent the progression of TD and reduce the risk of irreversible symptoms.</p>
      </sec>
      <sec>
        <title>Conclusions</title>
        <p>The TDtect model demonstrates promising cross-dataset generalization in detecting TD movements when evaluated on the independent CTI dataset, with particularly robust performance in identifying anatomically specific movement patterns. Notably, the model maintained high accuracy even without standardized video capture protocols. These findings support the feasibility of automated, AI-driven movement disorder assessment in real-world clinical settings. If confirmed in prospective studies, this technology could contribute to earlier detection of TD and support more timely clinical decision-making.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group>
      <supplementary-material id="app1">
        <label>Multimedia Appendix 1</label>
        <p>Calibration curve for Abnormal Involuntary Movement Scale total score ≥12.</p>
        <media xlink:href="mental_v13i1e92197_app1.png" xlink:title="PNG File , 185 KB"/>
      </supplementary-material>
    </app-group>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">AI</term>
          <def>
            <p>artificial intelligence</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">AIMS</term>
          <def>
            <p>Abnormal Involuntary Movement Scale</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">AUC</term>
          <def>
            <p>area under the curve</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">CTI</term>
          <def>
            <p>Clinician’s Tardive Inventory</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">TD</term>
          <def>
            <p>tardive dyskinesia</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>Artificial intelligence (AI) tools developed by the authors for the assessment of the presence or absence of tardive dyskinesia were used in the analyses carried out in this manuscript. The development of these tools is detailed in the referenced manuscripts, in particular, the study by Sterns et al [<xref ref-type="bibr" rid="ref13">13</xref>] in the <italic>Journal of Clinical Psychiatry</italic>, and their use for the analysis of the video materials assembled for the study by Trosch et al [<xref ref-type="bibr" rid="ref12">12</xref>] is detailed in this study. Grammarly AI Writing Assistant (web-based, version current as of November 2025) was used to improve grammar and sentence clarity in the preparation of this manuscript. Grammarly is a proprietary, AI-powered tool developed and maintained by Grammarly Inc. No researcher-driven modifications or additional data were introduced to the tool. Grammarly may use submitted text for model improvement under its standard Terms of Service. All edits were reviewed by the authors for accuracy and appropriateness. The authors declare no financial conflict of interest related to the use of Grammarly. The tool’s feedback may reflect biases present in its training data, and human editorial review remains essential.</p>
    </ack>
    <notes>
      <sec>
        <title>Funding</title>
        <p>Financial support for the development of the Clinician’s Tardive Inventory was provided in the form of an investigator-initiated study grant received from Neurocrine Biosciences, Inc. Funding for this research was partly provided by the National Institute of Mental Health (grant 2R44MH114763). Data included and described as study 3 were obtained through appropriate institutional review board consent as part of the real-world IMPACT-TD Registry sponsored by Teva Branded Pharmaceutical Products, R&#38;D, Inc. Teva had no further contributions (financial or otherwise) to the work described herein, aside from a courtesy medical review of the manuscript before submission.</p>
      </sec>
    </notes>
    <notes>
      <sec>
        <title>Data Availability</title>
        <p>The datasets generated or analyzed during this study are not publicly available due fact that the video data underlying this study cannot be shared publicly due to participant privacy and institutional review board constraints, but an anonymized dataset of model predictions and clinician ratings are available from the corresponding author on request.</p>
      </sec>
    </notes>
    <fn-group>
      <fn fn-type="con">
        <p>RT, AAS, JWH, BG, LL, BT, FM, RR, CM, JF, and OSM contributed to the writing and editing of the manuscript. RT participated in the creation of the Clinician’s Tardive Inventory data collection. AAS, JWH, OM, and CM participated in the expert assessments of the visual data for the TDtect study. AAS, BG, LL, and BT contributed to the methodology for the visual artificial intelligence analyses used in the study. FM, RR, JF, RT, and OM contributed to the research methods and interpretation of results.</p>
      </fn>
      <fn fn-type="conflict">
        <p>RT has received consulting fees in the last 24 months from EPI-Q, Amneal, Ipsen, Supernus, and Neurocrine Biosciences; has received speaker fees from Amneal, Ipsen, Supernus, and Neurocrine Biosciences; and has received funds from Neurocrine Biosciences. AAS is the CEO of iRxReminder, a company that provides telehealth solutions. He holds equity in the company and serves on its board. JWH is a professor at Kent State University and has received research funding from iRxReminder for this study. BG is an employee of Videra Health, which provides artificial intelligence–based health care solutions. He holds equity in the company. LL is the CTO of Videra Health and holds equity in the company. FM is the COO of iRxReminder, a company that provides telehealth solutions. He holds equity in the company and serves on its board. RR is the owner of Charak Health and Wellness Clinics and has received research support from iRxReminder. He has received research funding from various pharmaceutical companies and serves on advisory boards, but none are directly related to this study. CM is the Chief Product Officer of Radial Health and has received consultancy fees from iRxReminder. She holds equity in Osmind, Emobot, and Radial Health. BT is the Chief Clinical Officer of Videra Health and holds equity in the company. JF has received research funding from various pharmaceutical companies and serves on advisory boards, but none are directly related to this study. OM is the CMO of iRxReminder, a company that provides telehealth solutions, CMO of Radial Health, a mental health care provider, and CMO of Neurolief, a medical device company. He is the Co-Founder of Radial and Breakthrough 6, and serves on several advisory and editorial boards. He holds equity in Radial, Ampa Health, Acacia Clinics, Brainsway, Brainify, First Tracks PBC, iRxReminder, Outro Health, Videra Health, MindMed, and receives funding from Brainsway, Magnus Medical, NIH, NIMH, and consulting revenue from Magnus, Soneira Bio, Beckley Clinical, PeakLogic, Spring Health, and MDisrupt. CM and OM are married. All other authors declare no other conflicts of interest.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="web">
          <article-title>Tardive dyskinesia</article-title>
          <source>MedlinePlus</source>
          <access-date>2025-10-30</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://www.nlm.nih.gov/medlineplus/ency/article/000685.htm">http://www.nlm.nih.gov/medlineplus/ency/article/000685.htm</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Simpson</surname>
              <given-names>GM</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>JH</given-names>
            </name>
            <name name-style="western">
              <surname>Zoubok</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Gardos</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>A rating scale for tardive dyskinesia</article-title>
          <source>Psychopharmacology</source>
          <year>1979</year>
          <volume>64</volume>
          <fpage>171</fpage>
          <lpage>9</lpage>
          <pub-id pub-id-type="doi">10.1007/BF00496058</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Caroff</surname>
              <given-names>SN</given-names>
            </name>
            <name name-style="western">
              <surname>Ungvari</surname>
              <given-names>GS</given-names>
            </name>
            <name name-style="western">
              <surname>Cunningham Owens</surname>
              <given-names>DG</given-names>
            </name>
          </person-group>
          <article-title>Historical perspectives on tardive dyskinesia</article-title>
          <source>J Neurol Sci</source>
          <year>2018</year>
          <month>06</month>
          <day>15</day>
          <volume>389</volume>
          <fpage>4</fpage>
          <lpage>9</lpage>
          <pub-id pub-id-type="doi">10.1016/j.jns.2018.02.015</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Woods</surname>
              <given-names>SW</given-names>
            </name>
            <name name-style="western">
              <surname>Morgenstern</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Saksa</surname>
              <given-names>JR</given-names>
            </name>
            <name name-style="western">
              <surname>Walsh</surname>
              <given-names>BC</given-names>
            </name>
            <name name-style="western">
              <surname>Sullivan</surname>
              <given-names>MC</given-names>
            </name>
            <name name-style="western">
              <surname>Money</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Hawkins</surname>
              <given-names>KA</given-names>
            </name>
            <name name-style="western">
              <surname>Gueorguieva</surname>
              <given-names>RV</given-names>
            </name>
            <name name-style="western">
              <surname>Glazer</surname>
              <given-names>WM</given-names>
            </name>
          </person-group>
          <article-title>Incidence of tardive dyskinesia with atypical versus conventional antipsychotic medications: a prospective cohort study</article-title>
          <source>J Clin Psychiatry</source>
          <year>2010</year>
          <month>04</month>
          <volume>71</volume>
          <issue>04</issue>
          <fpage>463</fpage>
          <lpage>74</lpage>
          <pub-id pub-id-type="doi">10.4088/JCP.07m03890yel</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Carbon</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Hsieh</surname>
              <given-names>CH</given-names>
            </name>
            <name name-style="western">
              <surname>Kane</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Correll</surname>
              <given-names>CU</given-names>
            </name>
          </person-group>
          <article-title>Tardive dyskinesia prevalence in the period of second-generation antipsychotic use: a meta-analysis</article-title>
          <source>J Clin Psychiatry</source>
          <year>2017</year>
          <month>03</month>
          <volume>78</volume>
          <issue>3</issue>
          <fpage>e264</fpage>
          <lpage>78</lpage>
          <pub-id pub-id-type="doi">10.4088/jcp.16r10832</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Woerner</surname>
              <given-names>MG</given-names>
            </name>
            <name name-style="western">
              <surname>Alvir</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Saltz</surname>
              <given-names>BL</given-names>
            </name>
            <name name-style="western">
              <surname>Lieberman</surname>
              <given-names>JA</given-names>
            </name>
            <name name-style="western">
              <surname>Kane</surname>
              <given-names>JM</given-names>
            </name>
          </person-group>
          <article-title>Prospective study of tardive dyskinesia in the elderly: rates and risk factors</article-title>
          <source>Am J Psychiatry</source>
          <year>1998</year>
          <month>11</month>
          <day>01</day>
          <volume>155</volume>
          <issue>11</issue>
          <fpage>1521</fpage>
          <lpage>8</lpage>
          <pub-id pub-id-type="doi">10.1176/ajp.155.11.1521</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Vrijens</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Vincze</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Kristanto</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Urquhart</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Burnier</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Adherence to prescribed antihypertensive drug treatments: longitudinal study of electronically compiled dosing histories</article-title>
          <source>BMJ</source>
          <year>2008</year>
          <month>05</month>
          <day>17</day>
          <volume>336</volume>
          <issue>7653</issue>
          <fpage>1114</fpage>
          <lpage>7</lpage>
          <pub-id pub-id-type="doi">10.1136/bmj.39553.670231.25</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gandhi</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Patel</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Ayyagari</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Assessment of underdiagnosis of tardive dyskinesia by geographic region, social determinants, and other patient characteristics</article-title>
          <source>CNS Spectr</source>
          <year>2025</year>
          <month>01</month>
          <day>10</day>
          <volume>29</volume>
          <issue>5</issue>
          <fpage>509</fpage>
          <lpage>10</lpage>
          <pub-id pub-id-type="doi">10.1017/s1092852924001809</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kane</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Correll</surname>
              <given-names>CU</given-names>
            </name>
            <name name-style="western">
              <surname>Nierenberg</surname>
              <given-names>AA</given-names>
            </name>
            <name name-style="western">
              <surname>Caroff</surname>
              <given-names>SN</given-names>
            </name>
            <name name-style="western">
              <surname>Sajatovic</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Revisiting the Abnormal Involuntary Movement Scale: proceedings from the tardive dyskinesia assessment workshop</article-title>
          <source>J Clin Psychiatry</source>
          <year>2018</year>
          <volume>79</volume>
          <issue>3</issue>
          <fpage>17cs11959</fpage>
          <pub-id pub-id-type="doi">10.4088/jcp.17cs11959</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Guy</surname>
              <given-names>W</given-names>
            </name>
          </person-group>
          <source>ECDEU Assessment Manual for Psychopharmacology</source>
          <year>1976</year>
          <publisher-loc>Rockville, MD</publisher-loc>
          <publisher-name>U.S. Department of Health, Education, and Welfare, Public Health Service, Alcohol, Drug Abuse, and Mental Health Administration, National Institute of Mental Health, Psychopharmacology Research Branch, Division of Extramural Research Programs</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lane</surname>
              <given-names>RD</given-names>
            </name>
            <name name-style="western">
              <surname>Glazer</surname>
              <given-names>WM</given-names>
            </name>
            <name name-style="western">
              <surname>Hansen</surname>
              <given-names>TE</given-names>
            </name>
            <name name-style="western">
              <surname>Berman</surname>
              <given-names>WH</given-names>
            </name>
            <name name-style="western">
              <surname>Kramer</surname>
              <given-names>SI</given-names>
            </name>
          </person-group>
          <article-title>Assessment of tardive dyskinesia using the Abnormal Involuntary Movement Scale</article-title>
          <source>J Nerv Ment Dis</source>
          <year>1985</year>
          <month>06</month>
          <volume>173</volume>
          <issue>6</issue>
          <fpage>353</fpage>
          <lpage>7</lpage>
          <pub-id pub-id-type="doi">10.1097/00005053-198506000-00005</pub-id>
          <pub-id pub-id-type="medline">3998720</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Trosch</surname>
              <given-names>RM</given-names>
            </name>
            <name name-style="western">
              <surname>Comella</surname>
              <given-names>CL</given-names>
            </name>
            <name name-style="western">
              <surname>Caroff</surname>
              <given-names>SN</given-names>
            </name>
            <name name-style="western">
              <surname>Ondo</surname>
              <given-names>WG</given-names>
            </name>
            <name name-style="western">
              <surname>Shillington</surname>
              <given-names>AC</given-names>
            </name>
            <name name-style="western">
              <surname>LaChappelle</surname>
              <given-names>BJ</given-names>
            </name>
            <name name-style="western">
              <surname>Hauser</surname>
              <given-names>RA</given-names>
            </name>
            <name name-style="western">
              <surname>Correll</surname>
              <given-names>CU</given-names>
            </name>
            <name name-style="western">
              <surname>Friedman</surname>
              <given-names>JH</given-names>
            </name>
          </person-group>
          <article-title>The Clinician's Tardive Inventory (CTI): a new clinical tool for documenting and rating tardive dyskinesia</article-title>
          <source>J Clin Psychiatry</source>
          <year>2024</year>
          <month>01</month>
          <day>24</day>
          <volume>85</volume>
          <issue>1</issue>
          <fpage>23m14886</fpage>
          <pub-id pub-id-type="doi">10.4088/JCP.23m14886</pub-id>
          <pub-id pub-id-type="medline">38270545</pub-id>
          <pub-id pub-id-type="pii">23m14886</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sterns</surname>
              <given-names>AA</given-names>
            </name>
            <name name-style="western">
              <surname>Hughes</surname>
              <given-names>JW</given-names>
            </name>
            <name name-style="western">
              <surname>Grimm</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Larsen</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Ma</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Ranjan</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>MacMillan</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Talbot</surname>
              <given-names>BH</given-names>
            </name>
            <name name-style="western">
              <surname>Friedman</surname>
              <given-names>JH</given-names>
            </name>
            <name name-style="western">
              <surname>Muir</surname>
              <given-names>OS</given-names>
            </name>
          </person-group>
          <article-title>Detecting tardive dyskinesia using video-based artificial intelligence</article-title>
          <source>J Clin Psychiatry</source>
          <year>2025</year>
          <month>05</month>
          <day>28</day>
          <volume>86</volume>
          <issue>3</issue>
          <fpage>25m15792</fpage>
          <pub-id pub-id-type="doi">10.4088/jcp.25m15792</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sterns</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Larsen</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Grimm</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Muir</surname>
              <given-names>OS</given-names>
            </name>
          </person-group>
          <article-title>Remote monitoring and AI for detecting tardive dyskinesia and improving patient outcomes</article-title>
          <source>Gerontechnology</source>
          <year>2022</year>
          <volume>21</volume>
          <issue>s</issue>
          <fpage>1</fpage>
          <pub-id pub-id-type="doi">10.4017/gt.2022.21.s.706.opp3</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Schooler</surname>
              <given-names>NR</given-names>
            </name>
            <name name-style="western">
              <surname>Kane</surname>
              <given-names>JM</given-names>
            </name>
          </person-group>
          <article-title>Research diagnoses for tardive dyskinesia</article-title>
          <source>Arch Gen Psychiatry</source>
          <year>1982</year>
          <month>04</month>
          <volume>39</volume>
          <issue>4</issue>
          <fpage>486</fpage>
          <lpage>7</lpage>
          <pub-id pub-id-type="doi">10.1001/archpsyc.1982.04290040080014</pub-id>
          <pub-id pub-id-type="medline">6121550</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Youden</surname>
              <given-names>WJ</given-names>
            </name>
          </person-group>
          <article-title>Index for rating diagnostic tests</article-title>
          <source>Cancer</source>
          <year>1950</year>
          <month>01</month>
          <volume>3</volume>
          <issue>1</issue>
          <fpage>32</fpage>
          <lpage>5</lpage>
          <pub-id pub-id-type="doi">10.1002/1097-0142(1950)3:1&#60;32::aid-cncr2820030106&#62;3.0.co;2-3</pub-id>
          <pub-id pub-id-type="medline">15405679</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bland</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Altman</surname>
              <given-names>DG</given-names>
            </name>
          </person-group>
          <article-title>Statistical methods for assessing agreement between two methods of clinical measurement</article-title>
          <source>Lancet</source>
          <year>1986</year>
          <month>02</month>
          <day>08</day>
          <volume>1</volume>
          <issue>8476</issue>
          <fpage>307</fpage>
          <lpage>10</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/s41746-023-00751-9"/>
          </comment>
          <pub-id pub-id-type="medline">2868172</pub-id>
          <pub-id pub-id-type="pii">S0140-6736(86)90837-8</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Joyce</surname>
              <given-names>DW</given-names>
            </name>
            <name name-style="western">
              <surname>Kormilitzin</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Smith</surname>
              <given-names>KA</given-names>
            </name>
            <name name-style="western">
              <surname>Cipriani</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Explainable artificial intelligence for mental health through transparency and interpretability for understandability</article-title>
          <source>NPJ Digit Med</source>
          <year>2023</year>
          <month>01</month>
          <day>18</day>
          <volume>6</volume>
          <issue>1</issue>
          <fpage>6</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/s41746-023-00751-9"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41746-023-00751-9</pub-id>
          <pub-id pub-id-type="medline">36653524</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41746-023-00751-9</pub-id>
          <pub-id pub-id-type="pmcid">PMC9849399</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Shoukri</surname>
              <given-names>MM</given-names>
            </name>
            <name name-style="western">
              <surname>Asyali</surname>
              <given-names>MH</given-names>
            </name>
            <name name-style="western">
              <surname>Donner</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Sample size requirements for the design of reliability study: review and new results</article-title>
          <source>Stat Methods Med Res</source>
          <year>2004</year>
          <month>08</month>
          <volume>13</volume>
          <issue>4</issue>
          <fpage>251</fpage>
          <lpage>71</lpage>
          <pub-id pub-id-type="doi">10.1191/0962280204sm365ra</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hobart</surname>
              <given-names>JC</given-names>
            </name>
            <name name-style="western">
              <surname>Cano</surname>
              <given-names>SJ</given-names>
            </name>
            <name name-style="western">
              <surname>Warner</surname>
              <given-names>TT</given-names>
            </name>
            <name name-style="western">
              <surname>Thompson</surname>
              <given-names>AJ</given-names>
            </name>
          </person-group>
          <article-title>What sample sizes for reliability and validity studies in neurology?</article-title>
          <source>J Neurol</source>
          <year>2012</year>
          <month>12</month>
          <volume>259</volume>
          <issue>12</issue>
          <fpage>2681</fpage>
          <lpage>94</lpage>
          <pub-id pub-id-type="doi">10.1007/s00415-012-6570-y</pub-id>
          <pub-id pub-id-type="medline">22729386</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Trabassi</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Castiglia</surname>
              <given-names>SF</given-names>
            </name>
            <name name-style="western">
              <surname>Bini</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Marinozzi</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Ajoudani</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Lorenzini</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Chini</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Varrecchia</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Ranavolo</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>De Icco</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Casali</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Serrao</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Optimizing rare disease gait classification through data balancing and generative AI: insights from hereditary cerebellar ataxia</article-title>
          <source>Sensors (Basel)</source>
          <year>2024</year>
          <month>06</month>
          <day>03</day>
          <volume>24</volume>
          <issue>11</issue>
          <fpage>3613</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.mdpi.com/resolver?pii=s24113613"/>
          </comment>
          <pub-id pub-id-type="doi">10.3390/s24113613</pub-id>
          <pub-id pub-id-type="medline">38894404</pub-id>
          <pub-id pub-id-type="pii">s24113613</pub-id>
          <pub-id pub-id-type="pmcid">PMC11175240</pub-id>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
