<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMH</journal-id>
      <journal-id journal-id-type="nlm-ta">JMIR Ment Health</journal-id>
      <journal-title>JMIR Mental Health</journal-title>
      <issn pub-type="epub">2368-7959</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v7i1e16790</article-id>
      <article-id pub-id-type="pmid"/>
      <article-id pub-id-type="doi">10.2196/16790</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Atypical Repetition in Daily Conversation on Different Days for Detecting Alzheimer Disease: Evaluation of Phone-Call Data From a Regular Monitoring Service</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Eysenbach</surname>
            <given-names>Gunther</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Parsey</surname>
            <given-names>Carolyn</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Kanno</surname>
            <given-names>Keynes</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Sinclair</surname>
            <given-names>Craig</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author" corresp="yes">
          <name name-style="western">
            <surname>Yamada</surname>
            <given-names>Yasunori</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <address>
            <institution>IBM Research</institution>
            <addr-line>19-21, Nihonbashi, Hakozaki-cho, Chuo-ku</addr-line>
            <addr-line>Tokyo, </addr-line>
            <country>Japan</country>
            <phone>81 80 6706 9381</phone>
            <email>ysnr@jp.ibm.com</email>
          </address>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-3333-4368</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author">
          <name name-style="western">
            <surname>Shinkawa</surname>
            <given-names>Kaoru</given-names>
          </name>
          <degrees>ME</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-3869-1922</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author">
          <name name-style="western">
            <surname>Shimmei</surname>
            <given-names>Keita</given-names>
          </name>
          <degrees>MS</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-9897-6671</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>IBM Research</institution>
        <addr-line>Tokyo</addr-line>
        <country>Japan</country>
      </aff>
      <aff id="aff2">
        <label>2</label>
        <institution>Poverty and Equity Global Practice</institution>
        <institution>The World Bank</institution>
        <addr-line>Washington, DC</addr-line>
        <country>United States</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Yasunori Yamada <email>ysnr@jp.ibm.com</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <month>1</month>
        <year>2020</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>14</day>
        <month>1</month>
        <year>2020</year>
      </pub-date>
      <volume>7</volume>
      <issue>1</issue>
      <elocation-id>e16790</elocation-id>
      <history>
        <date date-type="received">
          <day>25</day>
          <month>10</month>
          <year>2019</year>
        </date>
        <date date-type="rev-request">
          <day>19</day>
          <month>11</month>
          <year>2019</year>
        </date>
        <date date-type="rev-recd">
          <day>4</day>
          <month>12</month>
          <year>2019</year>
        </date>
        <date date-type="accepted">
          <day>16</day>
          <month>12</month>
          <year>2019</year>
        </date>
      </history>
      <copyright-statement>©Yasunori Yamada, Kaoru Shinkawa, Keita Shimmei. Originally published in JMIR Mental Health (http://mental.jmir.org), 14.01.2020.</copyright-statement>
      <copyright-year>2020</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Mental Health, is properly cited. The complete bibliographic information, a link to the original publication on http://mental.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="http://mental.jmir.org/2020/1/e16790/" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>Identifying signs of Alzheimer disease (AD) through longitudinal and passive monitoring techniques has become increasingly important. Previous studies have succeeded in quantifying language dysfunctions and identifying AD from speech data collected during neuropsychological tests. However, whether and how we can quantify language dysfunction in daily conversation remains unexplored.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>The objective of this study was to explore the linguistic features that can be used for differentiating AD patients from daily conversations.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>We analyzed daily conversational data of seniors with and without AD obtained from longitudinal follow-up in a regular monitoring service (from n=15 individuals including 2 AD patients at an average follow-up period of 16.1 months; 1032 conversational data items obtained during phone calls and approximately 221 person-hours). In addition to the standard linguistic features used in previous studies on connected speech data during neuropsychological tests, we extracted novel features related to atypical repetition of words and topics reported by previous observational and descriptive studies as one of the prominent characteristics in everyday conversations of AD patients.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>When we compared the discriminative power of AD, we found that atypical repetition in two conversations on different days outperformed other linguistic features used in previous studies on speech data during neuropsychological tests. It was also a better indicator than atypical repetition in single conversations as well as that in two conversations separated by a specific number of conversations.</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>Our results show how linguistic features related to atypical repetition across days could be used for detecting AD from daily conversations in a passive manner by taking advantage of longitudinal data.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>dementia</kwd>
        <kwd>Alzheimer disease</kwd>
        <kwd>speech analysis</kwd>
        <kwd>screening</kwd>
        <kwd>monitoring</kwd>
        <kwd>behavioral marker</kwd>
        <kwd>daily conversation</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <p>As the world’s elderly population increases, the number of people living with dementia is rising rapidly, making dementia an increasingly serious health and social problem. As of 2018, approximately 50 million people globally were living with dementia, corresponding to about 7.3% of the world’s over 65-year-olds [<xref ref-type="bibr" rid="ref1">1</xref>]. The total worldwide cost of dementia has risen significantly, being estimated to reach over US $1 trillion in 2018 [<xref ref-type="bibr" rid="ref1">1</xref>]. At the same time, diagnostic coverage worldwide remains so low that only 40% to 50% of people with dementia have been diagnosed, even in high-income countries [<xref ref-type="bibr" rid="ref2">2</xref>]. The low-diagnosis coverage makes it more difficult for many patients and their families to receive appropriate support and care. Taking this into consideration, health monitoring technology and services are expected to help increase the diagnosis coverage by detecting signs of cognitive decline resulting from dementia in everyday situations [<xref ref-type="bibr" rid="ref3">3</xref>,<xref ref-type="bibr" rid="ref4">4</xref>].</p>
      <p>One of the clues for detecting cognitive decline resulting from Alzheimer disease (AD) in everyday situations can be obtained by identifying the evolution of a patient’s language as their AD progresses. While the most typical symptom of dementia is memory impairment due to the medial temporal lobe shrinking [<xref ref-type="bibr" rid="ref5">5</xref>,<xref ref-type="bibr" rid="ref6">6</xref>], both retrospective analysis and prospective cohort studies have shown that language dysfunctions prevail even from the presymptomatic period [<xref ref-type="bibr" rid="ref7">7</xref>,<xref ref-type="bibr" rid="ref8">8</xref>]. Moreover, studies on pathologically proven AD patients showed that they exhibited syntactic simplification and impairment in lexical-semantic processing [<xref ref-type="bibr" rid="ref9">9</xref>,<xref ref-type="bibr" rid="ref10">10</xref>]. A growing body of studies on probable AD patients has also shown that many aspects of speech and language, including grammatical and informational content as well as acoustic characteristics such as the pitch contour, show deficits as AD progresses [<xref ref-type="bibr" rid="ref4">4</xref>].</p>
      <p>Previous computational studies attempted to measure these language dysfunctions in AD patients on the basis of such findings by using acoustic, prosodic, and linguistic features [<xref ref-type="bibr" rid="ref10">10</xref>-<xref ref-type="bibr" rid="ref34">34</xref>]. For example, the short-term memory loss attributed to dementia often makes normal conversation difficult due to language dysfunctions such as difficulties with word-finding and word-retrieving [<xref ref-type="bibr" rid="ref35">35</xref>,<xref ref-type="bibr" rid="ref36">36</xref>]. These language dysfunctions have been measured by tallying pronoun frequency and fillers, including nonwords and short phrases (eg, “umm” or “uh”) [<xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref37">37</xref>,<xref ref-type="bibr" rid="ref38">38</xref>]. The reduction in speech expressiveness is another language dysfunction typically observed in AD patients. This reduction is measured by the decrease in adjectives and indicators related to vocabulary richness [<xref ref-type="bibr" rid="ref11">11</xref>,<xref ref-type="bibr" rid="ref39">39</xref>]. Using a combination of these features, previous studies have succeeded in differentiating healthy controls and AD patients [<xref ref-type="bibr" rid="ref22">22</xref>,<xref ref-type="bibr" rid="ref37">37</xref>]. However, they mainly investigated speech data obtained while participants took part in neuropsychological tests such as verbal fluency, story recall, and picture description tasks [<xref ref-type="bibr" rid="ref40">40</xref>]. Whether and how we can measure language dysfunctions resulting from AD during daily conversations remains largely uninvestigated. Because the conversational content and cognitive workload vary in daily conversations where people do not engage in specific tasks, we need to reinvestigate what kinds of speech features could be useful for identifying AD patients. In terms of the language dysfunctions of dementia patients in everyday conversations, previous observational and descriptive studies reported atypical repetition of words and topics as a prominent characteristic [<xref ref-type="bibr" rid="ref41">41</xref>]. While this repetition has been typically reported to occur in the same conversation, it also appears in separate conversations that may be held on different days. Because it has not been objectively measured, investigating how word and topic repetition differs in AD patients is a promising first step.</p>
      <p>In this study, we analyzed the conversational data of seniors with and without AD obtained from longitudinal follow-up in a regular monitoring service. We used natural language processing techniques to automatically measure atypical word and topic repetitions and then investigated whether and how characteristics in topic repetition differed between seniors with and without AD. The results indicated that both linguistic features related to word and topic repetition in paired conversations on different days had better discriminative powers compared with other linguistic features used in previous studies on connected speech data during neuropsychological tests. We also found that they peaked at a specific interval day (around seven days), not at a specific number of conversations. On the basis of these results, we demonstrate how quantifying atypical repetition in continuous and passive monitoring of daily conversations can help automatically detect AD.</p>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Data and Participants</title>
        <p>We used conversational data obtained during phone calls with a regular monitoring service for seniors provided by Cocolomi Co, Ltd (<xref rid="figure1" ref-type="fig">Figure 1</xref>A). In this service, communicators call and talk with older individuals once or twice a week, typically for 10 to 20 minutes of free conversation. All communicators received training and communicated with participants in accordance with the company guidelines for encouraging participants to speak. In this service, one communicator is typically assigned to a participant, and that participant talks with the same communicator. They manually transcribe the conversations in a spoken-word format by omitting incomplete words and fillers and forward the texts to family members such as their children. They used either home phones or smartphones. All conversations were conducted in Japanese. We analyzed these transcribed text data. All participants agreed to having their conversational data used for research purposes. This study was conducted under the approval of the ethical committee of Shizuoka University and performed in accordance with the Ethical Guidelines for Medical and Health Research Involving Human Subjects.</p>
        <p>The data were obtained from 15 Japanese people (12 females and 3 males aged 61 to 91 years; mean 76.8 [SD 9.4] years). Of these, 2 females had received the diagnosis of AD. The morbidity information for other diseases was not available. The communicators knew the diagnosis status of the participants, but they communicated with them in accordance with the company guidelines and did not change conversation methods on the basis of the diagnosis status. The follow-up period ranged from 1 to 33 months (mean period 16.1 months). We analyzed data from 1032 phone calls in total, and the number of phone calls for each participant ranged from 4 to 226 (mean 68.8 phone calls). The average duration of a single phone call for each participant ranged from 6.8 to 22.2 minutes (mean time between participants 12.1 [SD 4.1] minutes). The total call time of our dataset was around 221 hours. Transcribed text data consists of only text spoken by participants, not communicators. The text data contained 1098 characters on average, and we analyzed 1,132,935 characters in total. <xref ref-type="table" rid="table1">Table 1</xref> provides the overview of our dataset.</p>
        <fig id="figure1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>Atypical repetition in conversational data from regular monitoring service. A. Overview of regular monitoring service. The manually transcribed text of the conversation was analyzed in this study. B. Schematic illustrating the paired samples of conversations separated by t days and n phone calls to extract repetition features across different conversations. C. Repetition features of seniors with and without AD. Violin plot is used to visualize the distribution of the data and its probability density. On each side of the violin is a kernel density estimation to show the distribution shape of the data. The wider portion of the violin indicates the higher density and the narrow region represents relatively lower density. The grey box with the whiskers in the violin is the boxplot. The box denotes the 25th (Q1) and 75th (Q3) percentiles. The whiskers denote the upper and lower adjacent values that are the most extreme within Q3+1.5(Q3-Q1) and Q1-1.5(Q3-Q1), respectively. The white dot in the box represents median value. Significant differences are denoted with asterisks (*<italic>P</italic>&lt;.001). D. AUC-ROC score of topic repetition feature with different T days.</p>
          </caption>
          <graphic xlink:href="mental_v7i1e16790_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <table-wrap position="float" id="table1">
          <label>Table 1</label>
          <caption>
            <p>Demographics of conversational data participants.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="120"/>
            <col width="140"/>
            <col width="140"/>
            <col width="100"/>
            <col width="230"/>
            <col width="240"/>
            <thead>
              <tr valign="top">
                <td colspan="2">Status and gender</td>
                <td>Age (years)</td>
                <td>Duration (months)</td>
                <td>Calls, n</td>
                <td>Call time (min), mean (SD)</td>
                <td>Number of characters, mean (SD)</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="2">
                  <bold>Control</bold>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>F</td>
                <td>61-62</td>
                <td>11</td>
                <td>31</td>
                <td>7.8 (2.0)</td>
                <td>422.7 (121.4)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>F</td>
                <td>63-64</td>
                <td>14</td>
                <td>32</td>
                <td>14.0 (5.1)</td>
                <td>1078.3 (369.8)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>F</td>
                <td>75-77</td>
                <td>25</td>
                <td>75</td>
                <td>11.3 (8.5)</td>
                <td>744.8 (215.5)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>F</td>
                <td>75-75</td>
                <td>1</td>
                <td>4</td>
                <td>12.8 (3.1)</td>
                <td>1365.0 (130.6)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>F</td>
                <td>78-78</td>
                <td>9</td>
                <td>64</td>
                <td>10.3 (2.0)</td>
                <td>815.2 (173.8)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>F</td>
                <td>79-80</td>
                <td>6</td>
                <td>23</td>
                <td>11.7 (3.2)</td>
                <td>1507.5 (457.4)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>F</td>
                <td>80-83</td>
                <td>33</td>
                <td>109</td>
                <td>16.6 (4.7)</td>
                <td>1499.7 (391.7)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>F</td>
                <td>82-83</td>
                <td>19</td>
                <td>72</td>
                <td>6.8 (3.0)</td>
                <td>811.2 (367.9)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>F</td>
                <td>88-89</td>
                <td>17</td>
                <td>104</td>
                <td>11.2 (4.4)</td>
                <td>944.5 (314.2)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>F</td>
                <td>91-91</td>
                <td>9</td>
                <td>35</td>
                <td>22.2 (3.7)</td>
                <td>2405.8 (433.2)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>M</td>
                <td>63-65</td>
                <td>16</td>
                <td>72</td>
                <td>11.9 (3.1)</td>
                <td>1146.8 (242.9)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>M</td>
                <td>67-70</td>
                <td>33</td>
                <td>132</td>
                <td>10.6 (2.3)</td>
                <td>999.4 (236.5)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>M</td>
                <td>82-85</td>
                <td>30</td>
                <td>226</td>
                <td>17.7 (6.3)</td>
                <td>1207.0 (497.7)</td>
              </tr>
              <tr valign="top">
                <td colspan="2">
                  <bold>Alzheimer disease</bold>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>F</td>
                <td>83-84</td>
                <td>14</td>
                <td>40</td>
                <td>9.5 (2.8)</td>
                <td>923.9 (409.2)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>F</td>
                <td>85-85</td>
                <td>5</td>
                <td>13</td>
                <td>7.8 (1.8)</td>
                <td>662.0 (199.1)</td>
              </tr>
              <tr valign="top">
                <td colspan="2">Mean (SD)</td>
                <td>76.8 (9.4)</td>
                <td>16.1 (10.2)</td>
                <td>68.8 (57.2)</td>
                <td>12.1 (4.1)</td>
                <td>1098.0 (500.3)</td>
              </tr>
              <tr valign="top">
                <td colspan="2">
                  Total
                </td>
                <td>—</td>
                <td>—</td>
                <td>1032</td>
                <td>13,230 (221 hours)</td>
                <td>1,132,935</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
      </sec>
      <sec>
        <title>Extraction of Linguistic Features</title>
        <p>From each item of phone call data, we extracted linguistic features related to word and topic repetition within single conversations, as well as the standard linguistic features used in previous studies to build models for AD screening from connected speech data during neuropsychological tests (for the list of features, please see the Standard Linguistic Features section) [<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref14">14</xref>-<xref ref-type="bibr" rid="ref34">34</xref>]. In addition, we extracted features related to word and topic repetition across different conversations from the text data of two phone calls separated by <italic>t</italic> days and <italic>n</italic> phone calls interval, respectively (<xref rid="figure1" ref-type="fig">Figure 1</xref>B). Specifically, we used all possible pairs of two phone call data items separated by <italic>t</italic> days (<italic>T</italic>–<italic>M</italic>&lt;<italic>t</italic>≤<italic>T</italic>+<italic>M</italic>) for specific days interval and <italic>n</italic> phone calls (<italic>N</italic>–<italic>M</italic>&lt;<italic>n</italic>≤<italic>N</italic>+<italic>M</italic>) for specific phone calls interval. Optimal parameters for <italic>T</italic> (4,5,…,13) and <italic>N</italic> (3,4,…,12) were selected by performing a grid search for each feature. In this study, we used <italic>M</italic>=3, <italic>T</italic>=10, and <italic>N</italic>=7 for word repetition, and <italic>T</italic>=7 and <italic>N</italic>=9 for topic repetition.</p>
        <p>For preprocessing, we used the Japanese morphological analyzer MeCab [<xref ref-type="bibr" rid="ref42">42</xref>] to perform word segmentation, part-of-speech tagging, and word lemmatization on the transcribed texts. Words tagged as numerals or symbols were excluded from the analysis. Predefined stop words were also eliminated.</p>
      </sec>
      <sec>
        <title>Word and Topic Repetition Features</title>
        <p>We measured word repetition by using the feature focusing on the number of distinct words being used in a target document. Specifically, the feature was calculated by the inverse number of Honoré’s statistic (HS) [<xref ref-type="bibr" rid="ref43">43</xref>], defined as HS=100log<italic>V</italic>/(1–<italic>V</italic><sub>uni</sub>/<italic>U</italic>), where <italic>V</italic> is the total number of words, <italic>U</italic> is the total number of distinct word types, and <italic>V</italic><sub>uni</sub> is the number of total distinct word types used only once. For the feature related to word repetition across two text data of different conversations, we combined the data of both texts and then extracted the feature from it.</p>
        <p>For the features related to topic repetition, we used a biterm topic model (BTM) [<xref ref-type="bibr" rid="ref44">44</xref>]. While conventional topic models such as latent Dirichlet allocation have typically been used for estimating the latent topics of conversations [<xref ref-type="bibr" rid="ref45">45</xref>], BTM was designed to extract latent topics from a limited amount of context, such as that found in tweets and news headlines [<xref ref-type="bibr" rid="ref44">44</xref>]. Accordingly, we used BTM for estimating the topic in sentences and then extracted features related to topic repetition within conversations. Specifically, we first divided a text document into sentences by using punctuation marks. We then applied a BTM to a set of all the sentences, extracted word probability vectors for each <italic>K</italic> topic and obtained topic proportions allocated to each <italic>l</italic> sentence. For example, when a text document consisted of <italic>L</italic> sentences, we obtained <italic>L</italic>–<italic>l</italic>+1 vectors for topic proportions. We calculated pair-wise similarities with Euclidean distance and used the inverse number of the mean value as topic similarity features within single conversations. For the topic similarity features across two different items of text data <italic>D<sub>i</sub></italic> and <italic>D<sub>j</sub></italic>, we calculated pair-wise similarities between topic proportions in <italic>D<sub>i</sub></italic> and <italic>D<sub>j</sub></italic> and used the inverse number of the mean value. The parameters <italic>K</italic>=200 and <italic>l</italic>=3 were used.</p>
        <p>We briefly describe how BTM works. In contrast to conventional topic models such as latent Dirichlet allocation [<xref ref-type="bibr" rid="ref45">45</xref>], BTM directly models the generation of word co-occurrence patterns in the whole corpus to estimate topics from a small amount of context in a document [<xref ref-type="bibr" rid="ref44">44</xref>]. The key concept is that if two words co-occur more frequently, they are more likely to belong to the same topic. The term <italic>biterm</italic> denotes an unordered word pair occurring in a short text. For example, a document with three distinct words generates three biterms:</p>
        <disp-formula>(<italic>w</italic><sub>1</sub>, <italic>w</italic><sub>2</sub>, <italic>w</italic><sub>3</sub>)⟹{(<italic>w</italic><sub>1</sub>, <italic>w</italic><sub>2</sub>), (<italic>w</italic><sub>2</sub>, <italic>w</italic><sub>3</sub>), (<italic>w</italic><sub>1</sub>, <italic>w</italic><sub>3</sub>)}.</disp-formula>
        <p>In general, a document containing <italic>n</italic> distinct words generates <italic>n</italic>C<sub>2</sub> biterms. The biterms are typically extracted from each sentence, and by combining them we get a corpus <italic>B</italic> for the target document as a set consisting of ‖<italic>B</italic>‖ biterms. With the BTM, it is assumed that each topic is a multinomial distribution over the biterm (<italic>ϕ</italic>), and the whole corpus is a mixture of these topics (<italic>θ</italic>). The process of extracting biterms can be conducted as follows:</p>
        <list list-type="order">
          <list-item>
            <p>Draw a topic distribution θ ~ Dirichlet (α) for the whole corpus.</p>
          </list-item>
          <list-item>
            <p>Draw a topic-specific word distribution ϕk Dirichlet (β) for each topic k.</p>
          </list-item>
          <list-item>
            <p>For each biterm bi in the whole biterm set:
        
            Draw a topic assignment z ~ multinomial (θ).
            Draw two words wi,1, wi,2 ~ multinomial (ϕZi).
        
    </p>
          </list-item>
        </list>
        <p>Following the above procedure, the probability of biterm <italic>b<sub>i</sub></italic>=(<italic>w<sub>i</sub></italic>,<sub>1</sub>, <italic>w<sub>i</sub></italic>,<sub>2</sub>) conditioned on the model parameters <italic>θ</italic> and <italic>α</italic> can be written as seen in <xref rid="figure2" ref-type="fig">Figure 2</xref>. For more details, we refer the reader to the original paper [<xref ref-type="bibr" rid="ref44">44</xref>].</p>
        <fig id="figure2" position="float">
          <label>Figure 2</label>
          <caption>
            <p>The equation of the probability of biterm bi.</p>
          </caption>
          <graphic xlink:href="mental_v7i1e16790_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Standard Linguistic Features</title>
        <p>On the basis of related work on connected speech data during neuropsychological tests, we extracted 29 linguistic features categorized into 4 types of linguistic features that would be useful for inferring AD: parts of speech, vocabulary richness, syntactic complexity, and perseveration [<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref14">14</xref>-<xref ref-type="bibr" rid="ref34">34</xref>]. Here, neuropsychological tests in previous studies include a picture description task using a picture of the Cookie Theft, comprehensive aphasia test, and the Wechsler Logical Memory tests [<xref ref-type="bibr" rid="ref46">46</xref>-<xref ref-type="bibr" rid="ref48">48</xref>].</p>
        <p>The first feature set, related to parts of speech, consists of 14 features: frequency and the ratio of part-of-speech tags. We extracted the part-of-speech information by using Mecab [<xref ref-type="bibr" rid="ref42">42</xref>] and then computed the frequency of occurrence of different parts of speech (nouns, verbs, adjectives, auxiliary verbs, and conjunctions). We also computed ratios, namely, each part of speech normalized by the total number of word tokens in the document. Analyzed part-of-speech tags included nouns, verbs, adjectives, pronouns, adverbs, auxiliary verbs, and conjunctions. We also calculated the ratio of noun to verb and the ratio of pronoun to noun.</p>
        <p>The second feature set, related to vocabulary richness, consists of 3 features: type-token ratio (TTR), Brunét’s index (BI), and HS [<xref ref-type="bibr" rid="ref11">11</xref>,<xref ref-type="bibr" rid="ref43">43</xref>]. This feature set measures lexical diversity, which tends to decrease in AD cases [<xref ref-type="bibr" rid="ref11">11</xref>,<xref ref-type="bibr" rid="ref13">13</xref>]. TTR compares the total distinct word types (<italic>U</italic>) to the total word count (<italic>V</italic>) as TTR=<italic>U</italic>/<italic>V</italic>. Using the same <italic>U</italic> and <italic>V</italic>, BI is defined as BI=<italic>V<sup>U</sup></italic><sup>–0.165</sup>. Unlike other measures related to vocabulary richness, for this measure, the lexical richness becomes greater as BI becomes smaller. HS gives particular importance to unique vocabulary items used only once, also known as hapax legomena <italic>V<sub>uni</sub></italic>. HS is defined as HS=100log<italic>V</italic>/(1–<italic>V<sub>uni</sub></italic>/<italic>U</italic>).</p>
        <p>The third feature set, related to syntactic complexity, consists of 7 features related to length metrics as well as dependency relations. For features related to length metrics, we calculated 4 measures consisting of mean length of sentences, total number of sentences in a document, total number of words in a document, and total number of characters in a document. For features related to dependency relations, we calculated total number of dependencies in a document, the average dependencies per sentence, and total dependency distance in a document. As for the dependency structures, we used CaboCha [<xref ref-type="bibr" rid="ref49">49</xref>]. Dependency distance was calculated by the sum of all the linear distances between 2 syntactically related words in a sentence. This dependency distance has been considered an important index of memory burden and an indicator of syntactic difficulty [<xref ref-type="bibr" rid="ref50">50</xref>].</p>
        <p>The final feature set, related to perseveration, consists of 5 features. First, sentences were converted into term frequency–inverse document frequency (TF-IDF) vectors by using a bag-of-words model [<xref ref-type="bibr" rid="ref51">51</xref>]. TF-IDF is a numerical statistic intended to reflect how important a word is to a document. By using TF-IDF vectors, we then calculated the cosine similarity between sentences [<xref ref-type="bibr" rid="ref51">51</xref>]. We then calculated the proportion of sentence pairs equal to 0 and below 2 thresholds (0.3, 0.5) as well as the minimum and average cosine distances across all pairs of sentences.</p>
      </sec>
      <sec>
        <title>Statistical Analysis</title>
        <p>All statistical analyses were done in the R environment (R Foundation for Statistical Computing). A 2-tailed Student <italic>t</italic> test was applied for each feature to determine significant differences of enrichment between the two populations, and the resulting <italic>P</italic> values were adjusted with Bonferroni multiple testing correction. Adjusted <italic>P</italic> values below .01 were considered significantly different.</p>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <p>We first investigated whether and how each of the 6 types of features for measuring repetition differed between seniors with and without AD: 2 repetition types (word and topic) × 3 data sources (single conversations, 2 different conversations separated by <italic>t</italic> days, and 2 different conversations separated by <italic>n</italic> phone calls). The discriminative power was measured by using both effect size (Cohen <italic>d</italic>) [<xref ref-type="bibr" rid="ref52">52</xref>] and AUC-ROC. For Cohen <italic>d</italic>, an effect size of 0.80 is considered large, 0.50 is medium, and 0.20 is small [<xref ref-type="bibr" rid="ref52">52</xref>]. ROC is a graphical plot that illustrates the diagnostic ability of a binary classifier system that ranges from 0 to 1.</p>
      <p>Results showed that all 6 features had significant increased repetition in the AD group with large effect size (<italic>P</italic>&lt;.001, 2-sided <italic>t</italic> test with Bonferroni multiple testing correction; Cohen <italic>d</italic> &gt;0.80; <xref rid="figure1" ref-type="fig">Figure 1</xref>C). When we compared the discriminative power among them, the feature related to topic repetition across 2 conversations on different days showed the highest AUC scores and largest effect size (AUC=0.91); effect size of –1.76, 95% CI –2.15 to –1.36; <xref ref-type="table" rid="table2">Table 2</xref>). In addition, the features for word and topic repetition across different conversations separated by specific days interval and phone calls interval had larger effect size and higher AUC scores compared with those in single conversations (<xref ref-type="table" rid="table2">Table 2</xref>). We also found that the features extracted from conversational data at <italic>t</italic> days interval had better discriminative power than those at <italic>n</italic> phone calls interval (<xref ref-type="table" rid="table2">Table 2</xref>).</p>
      <p>To deepen our understanding of the nature of repetition features across different days, we investigated the relationship between the discriminative power of the repetition features and interval days of paired conversations. Results showed that after they increased in the beginning, they peaked at around <italic>T</italic>=7 days and then had a tendency to decline (<xref rid="figure1" ref-type="fig">Figure 1</xref>D). This suggests that the difference of topic repetition between seniors with and without AD might change with a certain tendency, rather than randomly, with intervening days for two different conversations, and be the largest in the medium interval.</p>
      <p>We next compared the repetition features with the standard linguistic features that were typically used in previous studies on connected speech data during neuropsychological tests [<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref14">14</xref>-<xref ref-type="bibr" rid="ref34">34</xref>]. Specifically, we extracted a total of 29 features used in previous studies: 14 features related to part-of-speech distribution, 3 features related to vocabulary richness, 7 features related to syntactic complexity, and 5 features related to perseveration. We found that 13 of the 29 features showed a significant difference between healthy control and AD groups in our dataset of daily conversations (<italic>P</italic>&lt;.01, 2-sided <italic>t</italic> test with Bonferroni multiple testing correction; 11 out of 14 features relating to part-of-speech distribution, 1 out of 3 features relating to vocabulary richness, 1 out of 7 features relating to syntactic complexity, 0 out of 5 features related to perseveration; for exact <italic>P</italic> values see <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). Through a comparison of discriminative power, we found that both topic and word repetition features across two conversations on different days outperformed all 29 features used in previous studies in terms of AUC-ROC scores (<xref ref-type="table" rid="table2">Table 2</xref> and <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>), followed by conjunction ratio (AUC=0.89; effect size of –2.03, 95% CI –2.33 to –1.73) and pronoun to noun ratio (AUC=0.87; effect size of –1.94, 95% CI –2.24 to –1.64). These results indicate that topic and word repetition across daily conversations on different days might be a better indicator for differentiating AD than linguistic features used for inferring AD in neuropsychological test settings.</p>
      <p>Finally, we investigated how changes in the language function of AD patients measured by linguistic features are different during neuropsychological tests and daily conversations. First, we summarized the linguistic features reported to be significant in distinguishing AD from healthy controls in previous studies on connected speech data during neuropsychological tests [<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref14">14</xref>-<xref ref-type="bibr" rid="ref34">34</xref>]. For the selection of the previous studies, we referred to the review article [<xref ref-type="bibr" rid="ref40">40</xref>] as the baseline and added studies. Specifically, we considered only studies based on a group comparison with a group of healthy controls. Only studies focusing on connected speech through neuropsychological tests including picture descriptions have been considered. Semistructured or unstructured interviews including open-ended questions were not included. The features reported as significant in at least half of the studies were considered as the significant features. We then compared them with the results of statistical analysis on our dataset of free daily conversations.</p>
      <p>This comparison showed that 19 out of 24 features showed a statistically consistent tendency with the results of the previous studies on connected speech data during neuropsychological tests (<xref ref-type="table" rid="table3">Table 3</xref> and <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). The other 5 features related to part-of-speech distribution (verb frequency, adjective ratio, and noun to verb ratio) and perseveration (average cosine distance and proportion of sentence pairs whose cosine distance is less than threshold 0.50) showed a statistically different tendency.</p>
      <table-wrap position="float" id="table2">
        <label>Table 2</label>
        <caption>
          <p>Top 15 features of high discriminative power among linguistic features used in previous studies and repetition features. The table contains area under the receiver operating characteristic curve (AUC-ROC) score, effect size (Cohen d) with 95% CI, and <italic>P</italic> value of 2-sided t test with Bonferroni multiple testing correction.</p>
        </caption>
        <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
          <col width="480"/>
          <col width="110"/>
          <col width="280"/>
          <col width="130"/>
          <thead>
            <tr valign="top">
              <td>Feature type</td>
              <td>AUC-ROC<sup>a</sup></td>
              <td>Effect size (95% CI)</td>
              <td>Adjusted <italic>P</italic> value</td>
            </tr>
          </thead>
          <tbody>
            <tr valign="top">
              <td>Topic repetition in two different conversations separated by <italic>t</italic> days interval (<italic>T</italic>=7)<sup>b</sup></td>
              <td>0.91</td>
              <td>–1.76 (–2.15 to –1.36)</td>
              <td>4.17E–17</td>
            </tr>
            <tr valign="top">
              <td>Word repetition in two different conversations separated by <italic>t</italic> days interval (<italic>T</italic>=10)<sup>b</sup></td>
              <td>0.90</td>
              <td>–1.67 (–2.06 to –1.29)</td>
              <td>4.44E–17</td>
            </tr>
            <tr valign="top">
              <td>Conjunction ratio</td>
              <td>0.89</td>
              <td>–2.03 (–2.33 to –1.73)</td>
              <td>2.04E–41</td>
            </tr>
            <tr valign="top">
              <td>Pronoun to noun ratio</td>
              <td>0.87</td>
              <td>–1.94 (–2.24 to –1.64)</td>
              <td>3.17E–38</td>
            </tr>
            <tr valign="top">
              <td>Topic repetition in two different conversations separated by <italic>n</italic> phone calls (<italic>N</italic>=9)<sup>b</sup></td>
              <td>0.86</td>
              <td>–1.35 (–1.51 to –1.20)</td>
              <td>2.75E–67</td>
            </tr>
            <tr valign="top">
              <td>Noun ratio</td>
              <td>0.86</td>
              <td>1.38 (1.09 to 1.67)</td>
              <td>4.28E–20</td>
            </tr>
            <tr valign="top">
              <td>Word repetition in two different conversations separated by <italic>n</italic> phone calls (<italic>N</italic>=7)<sup>b</sup></td>
              <td>0.84</td>
              <td>–1.22 (–1.36 to –1.08)</td>
              <td>9.35E–66</td>
            </tr>
            <tr valign="top">
              <td>Pronoun ratio</td>
              <td>0.82</td>
              <td>–1.50 (–1.79 to –1.21)</td>
              <td>1.30E–23</td>
            </tr>
            <tr valign="top">
              <td>Noun to verb ratio</td>
              <td>0.81</td>
              <td>0.63 (0.35 to 0.91)</td>
              <td>2.73E–04</td>
            </tr>
            <tr valign="top">
              <td>Honoré’s statistic</td>
              <td>0.80</td>
              <td>1.03 (0.75 to 1.32)</td>
              <td>1.61E–11</td>
            </tr>
            <tr valign="top">
              <td>Word repetition in single conversations<sup>b</sup></td>
              <td>0.79</td>
              <td>–1.08 (–1.36 to –0.79)</td>
              <td>1.57E–12</td>
            </tr>
            <tr valign="top">
              <td>Topic repetition in single conversations<sup>b</sup></td>
              <td>0.78</td>
              <td>–0.80 (–1.09 to –0.52)</td>
              <td>7.62E–07</td>
            </tr>
            <tr valign="top">
              <td>Conjunction frequency</td>
              <td>0.77</td>
              <td>–1.27 (–1.55 to –0.98)</td>
              <td>4.22E–17</td>
            </tr>
            <tr valign="top">
              <td>Noun frequency</td>
              <td>0.75</td>
              <td>0.71 (0.43 to 0.99)</td>
              <td>1.66E–05</td>
            </tr>
            <tr valign="top">
              <td>Adjective ratio</td>
              <td>0.75</td>
              <td>–1.06 (–1.34 to –0.77)</td>
              <td>5.12E–12</td>
            </tr>
          </tbody>
        </table>
        <table-wrap-foot>
          <fn id="table2fn1">
            <p><sup>a</sup>AUC-ROC: area under the receiver operating characteristic curve.</p>
          </fn>
          <fn id="table2fn2">
            <p><sup>b</sup>Topic and word repetition features proposed by the authors.</p>
          </fn>
        </table-wrap-foot>
      </table-wrap>
      <table-wrap position="float" id="table3">
        <label>Table 3</label>
        <caption>
          <p>Comparison of the results of statistical analysis for the linguistic features between our study and previous studies. Our study analyzes speech data during daily conversations, while the previous studies analyzed connected speech data during neuropsychological tests. Sig and nonsig refer to significant and nonsignificant. For example, sig-nonsig in the inconsistent column indicates a feature that showed significant difference in the previous studies but not in our study. Cells contain the name of the corresponding features. Features whose statistical test results were not reported in the previous studies are excluded from this summary table. Information including <italic>P</italic> values of the statistical analysis in our study and the list of the previous studies is provided in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>.</p>
        </caption>
        <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
          <col width="200"/>
          <col width="250"/>
          <col width="250"/>
          <col width="150"/>
          <col width="150"/>
          <thead>
            <tr valign="top">
              <td>Feature category</td>
              <td colspan="2">Consistent (our study–previous studies)</td>
              <td colspan="2">Inconsistent (our study–previous study)</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Sig-sig</td>
              <td>Nonsig-nonsig</td>
              <td>Sig-nonsig</td>
              <td>Nonsig-sig</td>
            </tr>
          </thead>
          <tbody>
            <tr valign="top">
              <td>Part of speech (12)</td>
              <td>
                <list list-type="bullet">
                  <list-item>
                    <p>Noun frequency</p>
                  </list-item>
                  <list-item>
                    <p>Auxiliary verb frequency</p>
                  </list-item>
                  <list-item>
                    <p>Noun ratio</p>
                  </list-item>
                  <list-item>
                    <p>Verb ratio</p>
                  </list-item>
                  <list-item>
                    <p>Pronoun ratio</p>
                  </list-item>
                  <list-item>
                    <p>Auxiliary verb ratio</p>
                  </list-item>
                  <list-item>
                    <p>Conjunction ratio</p>
                  </list-item>
                  <list-item>
                    <p>Pronoun to noun ratio</p>
                  </list-item>
                </list>
              </td>
              <td>
                <list list-type="bullet">
                  <list-item>
                    <p>Adverb ratio</p>
                  </list-item>
                </list>
              </td>
              <td>
                <list list-type="bullet">
                  <list-item>
                    <p>Adjective ratio</p>
                  </list-item>
                  <list-item>
                    <p>Noun to verb ratio</p>
                  </list-item>
                </list>
              </td>
              <td>
                <list list-type="bullet">
                  <list-item>
                    <p>Verb frequency</p>
                  </list-item>
                </list>
              </td>
            </tr>
            <tr valign="top">
              <td>Vocabulary richness (3)</td>
              <td>
                <list list-type="bullet">
                  <list-item>
                    <p>Honoré’s statistic</p>
                  </list-item>
                </list>
              </td>
              <td>
                <list list-type="bullet">
                  <list-item>
                    <p>Type-token ratio</p>
                  </list-item>
                  <list-item>
                    <p>Brunét’s index</p>
                  </list-item>
                </list>
              </td>
              <td>—</td>
              <td>—</td>
            </tr>
            <tr valign="top">
              <td>Syntactic complexity (7)</td>
              <td>
                <list list-type="bullet">
                  <list-item>
                    <p>Mean length of sentence (utterance)</p>
                  </list-item>
                </list>
              </td>
              <td>
                <list list-type="bullet">
                  <list-item>
                    <p>Total no of words</p>
                  </list-item>
                  <list-item>
                    <p>No of sentences (utterances)</p>
                  </list-item>
                  <list-item>
                    <p>No of characters</p>
                  </list-item>
                  <list-item>
                    <p>Total dependency distance in a document</p>
                  </list-item>
                  <list-item>
                    <p>Avg dependency distance per sentence</p>
                  </list-item>
                  <list-item>
                    <p>Total no of distance in a document</p>
                  </list-item>
                </list>
              </td>
              <td>—</td>
              <td>—</td>
            </tr>
            <tr valign="top">
              <td>Perseveration (2)</td>
              <td>—</td>
              <td>—</td>
              <td>—</td>
              <td>
                <list list-type="bullet">
                  <list-item>
                    <p>Avg cosine distance</p>
                  </list-item>
                  <list-item>
                    <p>Cosine cutoff: 0.50</p>
                  </list-item>
                </list>
              </td>
            </tr>
          </tbody>
        </table>
      </table-wrap>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Principal Findings</title>
        <p>In response to the increasing demand for detecting dementia in everyday situations, we aimed to quantify language dysfunctions observed in AD from daily conversational data when the target is not performing neuropsychological or cognitive tasks. Although previous studies have succeeded in quantifying many aspects of language dysfunction, including grammatical and informational content as well as speech characteristics resulting from AD, they mainly investigated connected speech data collected while targets were engaged in neuropsychological and cognitive tasks; how language dysfunction in daily conversations can be quantified has not been sufficiently investigated. In this study, we focused on atypical repetition of words and topics reported by previous observational and descriptive studies as one of the prominent characteristics in everyday conversations of AD patients. Using conversational data of seniors with and without AD obtained from longitudinal follow-up in a regular monitoring service (from n=15 individuals including 2 AD patients at an average follow-up period of 16.1 months; 1032 conversational data items obtained during phone calls and approximately 221 person-hours), we investigated whether and how linguistic features related to word and topic repetition can be used for differentiating AD patients.</p>
        <p>The results indicated that atypical repetition across different conversations could have a better discriminative power for AD compared to that within single conversations. We assume this atypical repetition across different conversations results from memory impairment that prevents speakers from remembering recent conversations. If so, the results suggest that the difference of memory performance between AD and healthy older adults might be larger after the lapse of some time than immediately, and linguistic features relating to atypical repetition could capture such difference even in daily conversations. In fact, deficits in episodic memory are one of the earliest detectable cognitive impairments in AD [<xref ref-type="bibr" rid="ref53">53</xref>], and some experimental studies on episodic memory tasks such as word-list learning have reported that the forgetting rate passing from immediate to delayed recall in AD was significantly larger than that in age-matched controls [<xref ref-type="bibr" rid="ref54">54</xref>]. These experimental studies seem to support our results. In addition, our results suggest that interval days between two conversations might be a more important parameter than the number of phone calls in terms of a discriminating power. These results might also be reasonable if the linguistic features relating to repetition can capture memory impairments resulting from pathological changes underlying AD. Furthermore, recent studies have reported accelerated long-term forgetting even in presymptomatic AD, which has garnered increased attention to detecting presymptomatic changes in AD [<xref ref-type="bibr" rid="ref55">55</xref>]. From this perspective, our approach, which focuses on atypical repetition in daily conversations on different days, holds promise for detecting early signs of AD in everyday situations.</p>
        <p>On the basis of comparisons with the standard linguistic features used in previous studies on connected speech data during neuropsychological tests, we found that features relating to atypical repetition in two conversations on different days had better AUC-ROC scores for differentiating AD than these linguistic features on speech data of daily conversations. The results suggest that repetition features across daily conversations on different days might be better indicators for detecting AD in everyday situations. We also compared the results of statistical analysis for each linguistic feature between previous studies on connected speech data during neuropsychological tests and our studies on daily conversations and found that about 80% of features (19 out of 24) showed a statistically consistent tendency. These results indicate that these linguistic features could be useful for inferring AD from speech data not only during neuropsychological tests but also during daily conversations. Features showing a statistically different tendency included those related to part-of-speech distributions and perseveration. In terms of the features of part-of-speech distribution, adjective ratio and noun to verb ratio showed significant difference between AD and controls in our study, while they were reported to have no significant difference in previous studies on connected speech data during neuropsychological tests [<xref ref-type="bibr" rid="ref15">15</xref>,<xref ref-type="bibr" rid="ref18">18</xref>,<xref ref-type="bibr" rid="ref22">22</xref>,<xref ref-type="bibr" rid="ref24">24</xref>]. In contrast, previous studies on speech data during semistructured interviews have reported that these two features were significant different [<xref ref-type="bibr" rid="ref11">11</xref>,<xref ref-type="bibr" rid="ref56">56</xref>]. Thus, language dysfunction in AD measured by these two features might be discriminative, especially in conversations in which the contents are less predetermined. As for the features related to perseveration, we found no significant difference in our dataset, while previous work reported the statistical significance of these features [<xref ref-type="bibr" rid="ref22">22</xref>]. For example, one study used these features for measuring semantic similarity using a bag-of-words model in speech data during a picture description task and reported a significant difference between AD and controls [<xref ref-type="bibr" rid="ref22">22</xref>,<xref ref-type="bibr" rid="ref57">57</xref>]. Considering our results on the statistical analysis for these features, when we analyze unstructured and free conversational data such as daily conversations, language dysfunction in AD related to perseveration might need to be measured by combining a model for estimating the semantic topics (eg, BTM). In fact, the semantic similarity when using the BTM revealed a significant difference between AD and controls in our dataset.</p>
        <p>In this study, we analyzed daily conversational data and showed that linguistic features, especially those related to repetition, can potentially be used for automatically detecting AD in a longitudinal and passive manner. Indeed, speech data collected in daily lives has gained increasing interest for clinical applications due to the improvement in audio quality recorded by portable devices and the expansion of voice-based interaction systems such as smartphones and smart speakers [<xref ref-type="bibr" rid="ref4">4</xref>,<xref ref-type="bibr" rid="ref58">58</xref>]. In particular, several studies that administrated cognitive and neuropsychological assessments over the phone have reported that speech features could be reliably extracted from phone recordings and used to build models for AD screening [<xref ref-type="bibr" rid="ref59">59</xref>]. However, there are still relatively few studies on changes in speech features in daily conversations resulting from AD. Being capable of inferring AD from daily conversations would help with timely detection by frequent assessments with relatively short intervals, which might be difficult to do when using neuropsychological tests due to learning effects. From this perspective, we believe that the results of our study will help promote future efforts toward early detection of AD in everyday situations.</p>
      </sec>
      <sec>
        <title>Limitations</title>
        <p>Our work has several limitations. First, the number of participants was small, especially for AD patients, although the follow-up periods and number of conversations for each participant were relatively long and large. The results of a post hoc power analysis revealed that we would need at least two additional AD patients to obtain more than 0.80 of the power. A second limitation is the lack of information about AD severity and stage. We analyzed conversational data collected from the users of a regular monitoring service, and as such, were not able to obtain information related to clinical assessments, such as Mini-Mental State Exam scores and biomarkers (aside from AD diagnosis provided by medical doctors). Third, the age and gender of the control and AD groups were not matched. These three limitations stem from the fact that our dataset was collected from real users of an actual monitoring service. To clarify the relevance of our results obtained from the datasets with these limitations, we comprehensively compared the statistical results of each of the 24 linguistic features between our study and more than 20 previous studies and confirmed that our dataset showed a statistically consistent tendency with the previous studies. In addition to this perspective, because our dataset represents invaluable data collected from a real service and consists of 1032 conversational data items at an average follow-up period of 16.1 months, we believe our results can provide useful information for future studies toward the early detection of AD in the real world. The fourth limitation is the use of transcribed conversation data after omitting information related to incomplete words and fillers. While previous studies on connected speech during neuropsychological tests reported that these features did not significantly differ between controls and AD patients [<xref ref-type="bibr" rid="ref40">40</xref>], we feel that further investigation is required, especially on speech data in daily conversations. The fifth limitation was the specific type of conversational data used. In this study, we analyzed free conversation between older adults and communicators mainly about the lives of the older individuals, but we need further research to confirm our results and extend the scope into various types of daily conversation, such as phone call conversations with their friends and face-to-face family conversations.</p>
      </sec>
      <sec>
        <title>Conclusions</title>
        <p>In summary, we investigated the daily conversational data of seniors with and without AD obtained from longitudinal follow-up in a regular monitoring service. We demonstrated that, while the linguistic features used in previous studies on connected speech data during neuropsychological tests can be used for detecting AD from daily conversations, the novel features related to repetition across conversations on different days could be a better indicator. We believe that our results can help to promote future efforts toward early detection of AD in everyday situations by taking advantage of speech data that can be collected in a passive, longitudinal manner.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group>
      <supplementary-material id="app1">
        <label>Multimedia Appendix 1</label>
        <p>Results of statistical analysis for the linguistic features in our dataset of daily conversations and the summary of the statistical analysis of these features in previous studies on speech data during neuropsychological tests.</p>
        <media xlink:href="mental_v7i1e16790_app1.docx" xlink:title="DOCX File , 38 KB"/>
      </supplementary-material>
    </app-group>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">AD</term>
          <def>
            <p>Alzheimer disease</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">AUC-ROC</term>
          <def>
            <p>area under the receiver operating characteristic curve</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">BI</term>
          <def>
            <p>Brunét’s index</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">BTM</term>
          <def>
            <p>biterm topic model</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">HS</term>
          <def>
            <p>Honoré’s statistic</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb6">TF-IDF</term>
          <def>
            <p>term frequency–inverse document frequency</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb7">TTR</term>
          <def>
            <p>type-token ratio</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>We thank M Nishimura for valuable comments and suggestions on the data analysis. We also thank A Kamiyama, Y Masuda, J Hayakawa, and K Cho at Cocolomi Co, Ltd, for providing all of the data used in this study.</p>
    </ack>
    <fn-group>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="web">
          <source>Alzheimer's Disease International</source>
          <year>2018</year>
          <access-date>2019-12-22</access-date>
          <comment>World Alzheimer Report 2018: the state of the art of dementia research: new frontiers <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.alz.co.uk/research/WorldAlzheimerReport2018.pdf">https://www.alz.co.uk/research/WorldAlzheimerReport2018.pdf</ext-link>
                                                </comment>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Prince</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Comas-Herrera</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Knapp</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Guerchet</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Karagiannidou</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <source>Alzheimer's Disease International</source>
          <year>2016</year>
          <access-date>2019-12-22</access-date>
          <comment>World Alzheimer Report 2016: improving healthcare for people living with dementia: coverage, quality and costs now and in the future <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.alz.co.uk/research/WorldAlzheimerReport2016.pdf">https://www.alz.co.uk/research/WorldAlzheimerReport2016.pdf</ext-link>
                                                </comment>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Teipel</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>König</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Hoey</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Kaye</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Krüger</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Robillard</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Kirste</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Babiloni</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Use of nonintrusive sensor-based information and communication technology for real-world evidence for clinical trials in dementia</article-title>
          <source>Alzheimers Dement</source>
          <year>2018</year>
          <month>09</month>
          <volume>14</volume>
          <issue>9</issue>
          <fpage>1216</fpage>
          <lpage>1231</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1552-5260(18)30156-0"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jalz.2018.05.003</pub-id>
          <pub-id pub-id-type="medline">29936147</pub-id>
          <pub-id pub-id-type="pii">S1552-5260(18)30156-0</pub-id>
          <pub-id pub-id-type="pmcid">PMC6179371</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kourtis</surname>
              <given-names>LC</given-names>
            </name>
            <name name-style="western">
              <surname>Regele</surname>
              <given-names>OB</given-names>
            </name>
            <name name-style="western">
              <surname>Wright</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Jones</surname>
              <given-names>GB</given-names>
            </name>
          </person-group>
          <article-title>Digital biomarkers for Alzheimer's disease: the mobile/ wearable devices opportunity</article-title>
          <source>NPJ Digit Med</source>
          <year>2019</year>
          <volume>2</volume>
          <fpage>9</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/31119198"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41746-019-0084-2</pub-id>
          <pub-id pub-id-type="medline">31119198</pub-id>
          <pub-id pub-id-type="pmcid">PMC6526279</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kirshner</surname>
              <given-names>HS</given-names>
            </name>
          </person-group>
          <article-title>Primary progressive aphasia and Alzheimer's disease: brief history, recent evidence</article-title>
          <source>Curr Neurol Neurosci Rep</source>
          <year>2012</year>
          <month>12</month>
          <volume>12</volume>
          <issue>6</issue>
          <fpage>709</fpage>
          <lpage>714</lpage>
          <pub-id pub-id-type="doi">10.1007/s11910-012-0307-2</pub-id>
          <pub-id pub-id-type="medline">22932755</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>MacKay</surname>
              <given-names>DG</given-names>
            </name>
            <name name-style="western">
              <surname>James</surname>
              <given-names>LE</given-names>
            </name>
            <name name-style="western">
              <surname>Hadley</surname>
              <given-names>CB</given-names>
            </name>
          </person-group>
          <article-title>Amnesic H.M.'s performance on the language competence test: parallel deficits in memory and sentence production</article-title>
          <source>J Clin Exp Neuropsychol</source>
          <year>2008</year>
          <month>04</month>
          <volume>30</volume>
          <issue>3</issue>
          <fpage>280</fpage>
          <lpage>300</lpage>
          <pub-id pub-id-type="doi">10.1080/13803390701380609</pub-id>
          <pub-id pub-id-type="medline">17852614</pub-id>
          <pub-id pub-id-type="pii">780567613</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>van Velzen</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Garrard</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>From hindsight to insight—retrospective analysis of language written by a renowned Alzheimer's patient</article-title>
          <source>Interdiscip Sci Rev</source>
          <year>2013</year>
          <month>07</month>
          <day>18</day>
          <volume>33</volume>
          <issue>4</issue>
          <fpage>278</fpage>
          <lpage>286</lpage>
          <pub-id pub-id-type="doi">10.1179/174327908x392852</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Oulhaj</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Wilcock</surname>
              <given-names>GK</given-names>
            </name>
            <name name-style="western">
              <surname>Smith</surname>
              <given-names>AD</given-names>
            </name>
            <name name-style="western">
              <surname>de Jager</surname>
              <given-names>CA</given-names>
            </name>
          </person-group>
          <article-title>Predicting the time of conversion to MCI in the elderly: role of verbal expression and learning</article-title>
          <source>Neurology</source>
          <year>2009</year>
          <month>11</month>
          <day>03</day>
          <volume>73</volume>
          <issue>18</issue>
          <fpage>1436</fpage>
          <lpage>1442</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/19794124"/>
          </comment>
          <pub-id pub-id-type="doi">10.1212/WNL.0b013e3181c0665f</pub-id>
          <pub-id pub-id-type="medline">19794124</pub-id>
          <pub-id pub-id-type="pii">WNL.0b013e3181c0665f</pub-id>
          <pub-id pub-id-type="pmcid">PMC2882176</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ahmed</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>de Jager</surname>
              <given-names>CA</given-names>
            </name>
            <name name-style="western">
              <surname>Haigh</surname>
              <given-names>AF</given-names>
            </name>
            <name name-style="western">
              <surname>Garrard</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Logopenic aphasia in Alzheimer's disease: clinical variant or clinical feature?</article-title>
          <source>J Neurol Neurosurg Psychiatry</source>
          <year>2012</year>
          <month>11</month>
          <volume>83</volume>
          <issue>11</issue>
          <fpage>1056</fpage>
          <lpage>1062</lpage>
          <pub-id pub-id-type="doi">10.1136/jnnp-2012-302798</pub-id>
          <pub-id pub-id-type="medline">22842206</pub-id>
          <pub-id pub-id-type="pii">jnnp-2012-302798</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ahmed</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>de Jager</surname>
              <given-names>CA</given-names>
            </name>
            <name name-style="western">
              <surname>Haigh</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Garrard</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Semantic processing in connected speech at a uniformly early stage of autopsy-confirmed Alzheimer's disease</article-title>
          <source>Neuropsychology</source>
          <year>2013</year>
          <month>01</month>
          <volume>27</volume>
          <issue>1</issue>
          <fpage>79</fpage>
          <lpage>85</lpage>
          <pub-id pub-id-type="doi">10.1037/a0031288</pub-id>
          <pub-id pub-id-type="medline">23356598</pub-id>
          <pub-id pub-id-type="pii">2013-01868-007</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bucks</surname>
              <given-names>RS</given-names>
            </name>
            <name name-style="western">
              <surname>Singh</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Cuerden</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Wilcock</surname>
              <given-names>GK</given-names>
            </name>
          </person-group>
          <article-title>Analysis of spontaneous, conversational speech in dementia of Alzheimer type: evaluation of an objective technique for analysing lexical performance</article-title>
          <source>Aphasiology</source>
          <year>2000</year>
          <month>01</month>
          <volume>14</volume>
          <issue>1</issue>
          <fpage>71</fpage>
          <lpage>91</lpage>
          <pub-id pub-id-type="doi">10.1080/026870300401603</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hoffmann</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Nemeth</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Dye</surname>
              <given-names>CD</given-names>
            </name>
            <name name-style="western">
              <surname>Pákáski</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Irinyi</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Kálmán</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Temporal parameters of spontaneous speech in Alzheimer's disease</article-title>
          <source>Int J Speech Lang Pathol</source>
          <year>2010</year>
          <month>02</month>
          <volume>12</volume>
          <issue>1</issue>
          <fpage>29</fpage>
          <lpage>34</lpage>
          <pub-id pub-id-type="medline">20380247</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Guinn</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Habash</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <source>AAAI Fall Symposium: Artificial Intelligence for Gerontechnology</source>
          <year>2012</year>
          <access-date>2019-12-22</access-date>
          <comment>Language analysis of speakers with dementia of the Alzheimer's type <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.aaai.org/ocs/index.php/FSS/FSS12/paper/download/5574/5783">https://www.aaai.org/ocs/index.php/FSS/FSS12/paper/download/5574/5783</ext-link>
                                                </comment>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ahmed</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Haigh</surname>
              <given-names>AF</given-names>
            </name>
            <name name-style="western">
              <surname>de Jager</surname>
              <given-names>CA</given-names>
            </name>
            <name name-style="western">
              <surname>Garrard</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Connected speech as a marker of disease progression in autopsy-proven Alzheimer's disease</article-title>
          <source>Brain</source>
          <year>2013</year>
          <month>12</month>
          <volume>136</volume>
          <issue>Pt 12</issue>
          <fpage>3727</fpage>
          <lpage>3737</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/24142144"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/brain/awt269</pub-id>
          <pub-id pub-id-type="medline">24142144</pub-id>
          <pub-id pub-id-type="pii">awt269</pub-id>
          <pub-id pub-id-type="pmcid">PMC3859216</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Beltrami</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Gagliardi</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Rossini Favretti</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Ghidoni</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Tamburini</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Calzà</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Speech analysis by natural language processing techniques: a possible tool for very early detection of cognitive decline?</article-title>
          <source>Front Aging Neurosci</source>
          <year>2018</year>
          <volume>10</volume>
          <fpage>369</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.3389/fnagi.2018.00369"/>
          </comment>
          <pub-id pub-id-type="doi">10.3389/fnagi.2018.00369</pub-id>
          <pub-id pub-id-type="medline">30483116</pub-id>
          <pub-id pub-id-type="pmcid">PMC6243042</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bschor</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Kühl</surname>
              <given-names>KP</given-names>
            </name>
            <name name-style="western">
              <surname>Reischies</surname>
              <given-names>FM</given-names>
            </name>
          </person-group>
          <article-title>Spontaneous speech of patients with dementia of the Alzheimer type and mild cognitive impairment</article-title>
          <source>Int Psychogeriatr</source>
          <year>2001</year>
          <month>09</month>
          <volume>13</volume>
          <issue>3</issue>
          <fpage>289</fpage>
          <lpage>298</lpage>
          <pub-id pub-id-type="medline">11768376</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Carlomagno</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Santoro</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Menditti</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Pandolfi</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Marini</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Referential communication in Alzheimer's type dementia</article-title>
          <source>Cortex</source>
          <year>2005</year>
          <month>08</month>
          <volume>41</volume>
          <issue>4</issue>
          <fpage>520</fpage>
          <lpage>534</lpage>
          <pub-id pub-id-type="doi">10.1016/s0010-9452(08)70192-8</pub-id>
          <pub-id pub-id-type="medline">16042028</pub-id>
          <pub-id pub-id-type="pii">S0010-9452(08)70192-8</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Croisile</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Ska</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Brabant</surname>
              <given-names>MJ</given-names>
            </name>
            <name name-style="western">
              <surname>Duchene</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Lepage</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Aimard</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Trillet</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Comparative study of oral and written picture description in patients with Alzheimer's disease</article-title>
          <source>Brain Lang</source>
          <year>1996</year>
          <month>04</month>
          <volume>53</volume>
          <issue>1</issue>
          <fpage>1</fpage>
          <lpage>19</lpage>
          <pub-id pub-id-type="doi">10.1006/brln.1996.0033</pub-id>
          <pub-id pub-id-type="medline">8722896</pub-id>
          <pub-id pub-id-type="pii">S0093-934X(96)90033-4</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Cuetos</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Arango-Lasprilla</surname>
              <given-names>JC</given-names>
            </name>
            <name name-style="western">
              <surname>Uribe</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Valencia</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Lopera</surname>
              <given-names>F</given-names>
            </name>
          </person-group>
          <article-title>Linguistic changes in verbal expression: a preclinical marker of Alzheimer's disease</article-title>
          <source>J Int Neuropsychol Soc</source>
          <year>2007</year>
          <month>05</month>
          <volume>13</volume>
          <issue>3</issue>
          <fpage>433</fpage>
          <lpage>439</lpage>
          <pub-id pub-id-type="doi">10.1017/S1355617707070609</pub-id>
          <pub-id pub-id-type="medline">17445292</pub-id>
          <pub-id pub-id-type="pii">S1355617707070609</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Feyereisen</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Berrewaerts</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Hupet</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Pragmatic skills in the early stages of Alzheimer's disease: an analysis by means of a referential communication task</article-title>
          <source>Int J Lang Commun Disord</source>
          <year>2007</year>
          <volume>42</volume>
          <issue>1</issue>
          <fpage>1</fpage>
          <lpage>17</lpage>
          <pub-id pub-id-type="doi">10.1080/13682820600624216</pub-id>
          <pub-id pub-id-type="medline">17365083</pub-id>
          <pub-id pub-id-type="pii">769953694</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Forbes-McKay</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Shanks</surname>
              <given-names>MF</given-names>
            </name>
            <name name-style="western">
              <surname>Venneri</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Profiling spontaneous speech decline in Alzheimer's disease: a longitudinal study</article-title>
          <source>Acta Neuropsychiatr</source>
          <year>2013</year>
          <month>12</month>
          <volume>25</volume>
          <issue>6</issue>
          <fpage>320</fpage>
          <lpage>327</lpage>
          <pub-id pub-id-type="doi">10.1017/neu.2013.16</pub-id>
          <pub-id pub-id-type="medline">25287871</pub-id>
          <pub-id pub-id-type="pii">S0924270813000161</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Fraser</surname>
              <given-names>KC</given-names>
            </name>
            <name name-style="western">
              <surname>Meltzer</surname>
              <given-names>JA</given-names>
            </name>
            <name name-style="western">
              <surname>Rudzicz</surname>
              <given-names>F</given-names>
            </name>
          </person-group>
          <article-title>Linguistic features identify Alzheimer's disease in narrative speech</article-title>
          <source>J Alzheimers Dis</source>
          <year>2016</year>
          <volume>49</volume>
          <issue>2</issue>
          <fpage>407</fpage>
          <lpage>422</lpage>
          <pub-id pub-id-type="doi">10.3233/JAD-150520</pub-id>
          <pub-id pub-id-type="medline">26484921</pub-id>
          <pub-id pub-id-type="pii">JAD150520</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hernández-Domínguez</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Ratté</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Sierra-Martínez</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Roche-Bergua</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Computer-based evaluation of Alzheimer's disease and mild cognitive impairment patients during a picture description task</article-title>
          <source>Alzheimers Dement (Amst)</source>
          <year>2018</year>
          <volume>10</volume>
          <fpage>260</fpage>
          <lpage>268</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S2352-8729(18)30012-5"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.dadm.2018.02.004</pub-id>
          <pub-id pub-id-type="medline">29780871</pub-id>
          <pub-id pub-id-type="pii">S2352-8729(18)30012-5</pub-id>
          <pub-id pub-id-type="pmcid">PMC5956933</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kavé</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Levy</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Morphology in picture descriptions provided by persons with Alzheimer's disease</article-title>
          <source>J Speech Lang Hear Res</source>
          <year>2003</year>
          <month>04</month>
          <volume>46</volume>
          <issue>2</issue>
          <fpage>341</fpage>
          <lpage>352</lpage>
          <pub-id pub-id-type="medline">14700376</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kavé</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Goral</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Word retrieval in picture descriptions produced by individuals with Alzheimer's disease</article-title>
          <source>J Clin Exp Neuropsychol</source>
          <year>2016</year>
          <month>11</month>
          <volume>38</volume>
          <issue>9</issue>
          <fpage>958</fpage>
          <lpage>966</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/27171756"/>
          </comment>
          <pub-id pub-id-type="doi">10.1080/13803395.2016.1179266</pub-id>
          <pub-id pub-id-type="medline">27171756</pub-id>
          <pub-id pub-id-type="pmcid">PMC4983450</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>March</surname>
              <given-names>EG</given-names>
            </name>
            <name name-style="western">
              <surname>Wales</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Pattison</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>The uses of nouns and deixis in discourse production in Alzheimer's disease</article-title>
          <source>J Neurolinguistics</source>
          <year>2006</year>
          <month>7</month>
          <volume>19</volume>
          <issue>4</issue>
          <fpage>311</fpage>
          <lpage>340</lpage>
          <pub-id pub-id-type="doi">10.1016/j.jneuroling.2006.01.001</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mueller</surname>
              <given-names>KD</given-names>
            </name>
            <name name-style="western">
              <surname>Koscik</surname>
              <given-names>RL</given-names>
            </name>
            <name name-style="western">
              <surname>Hermann</surname>
              <given-names>BP</given-names>
            </name>
            <name name-style="western">
              <surname>Johnson</surname>
              <given-names>SC</given-names>
            </name>
            <name name-style="western">
              <surname>Turkstra</surname>
              <given-names>LS</given-names>
            </name>
          </person-group>
          <article-title>Declines in connected language are associated with very early mild cognitive impairment: results from the Wisconsin Registry for Alzheimer's Prevention</article-title>
          <source>Front Aging Neurosci</source>
          <year>2018</year>
          <volume>9</volume>
          <fpage>437</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.3389/fnagi.2017.00437"/>
          </comment>
          <pub-id pub-id-type="doi">10.3389/fnagi.2017.00437</pub-id>
          <pub-id pub-id-type="medline">29375365</pub-id>
          <pub-id pub-id-type="pmcid">PMC5767238</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Nicholas</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Obler</surname>
              <given-names>LK</given-names>
            </name>
            <name name-style="western">
              <surname>Albert</surname>
              <given-names>ML</given-names>
            </name>
            <name name-style="western">
              <surname>Helm-Estabrooks</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>Empty speech in Alzheimer's disease and fluent aphasia</article-title>
          <source>J Speech Hear Res</source>
          <year>1985</year>
          <month>09</month>
          <volume>28</volume>
          <issue>3</issue>
          <fpage>405</fpage>
          <lpage>410</lpage>
          <pub-id pub-id-type="doi">10.1044/jshr.2803.405</pub-id>
          <pub-id pub-id-type="medline">4046581</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Orimaye</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Wong</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Golden</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Learning predictive linguistic features for Alzheimer's disease and related dementias using verbal utterances</article-title>
          <year>2014</year>
          <conf-name>Proceedings of the Workshop on Computational Linguistics and Clinical Psychology</conf-name>
          <conf-date>2014</conf-date>
          <conf-loc>Baltimore</conf-loc>
          <fpage>78</fpage>
          <lpage>87</lpage>
          <pub-id pub-id-type="doi">10.3115/v1/w14-3210</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Orimaye</surname>
              <given-names>SO</given-names>
            </name>
            <name name-style="western">
              <surname>Wong</surname>
              <given-names>JS</given-names>
            </name>
            <name name-style="western">
              <surname>Golden</surname>
              <given-names>KJ</given-names>
            </name>
            <name name-style="western">
              <surname>Wong</surname>
              <given-names>CP</given-names>
            </name>
            <name name-style="western">
              <surname>Soyiri</surname>
              <given-names>IN</given-names>
            </name>
          </person-group>
          <article-title>Predicting probable Alzheimer's disease using linguistic deficits and biomarkers</article-title>
          <source>BMC Bioinformatics</source>
          <year>2017</year>
          <month>01</month>
          <day>14</day>
          <volume>18</volume>
          <issue>1</issue>
          <fpage>1</fpage>
          <lpage>13</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcbioinformatics.biomedcentral.com/articles/10.1186/s12859-016-1456-0"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12859-016-1456-0</pub-id>
          <pub-id pub-id-type="medline">28088191</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12859-016-1456-0</pub-id>
          <pub-id pub-id-type="pmcid">PMC5237556</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Roark</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Mitchell</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Hosom</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Hollingshead</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Kaye</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Spoken language derived measures for detecting mild cognitive impairment</article-title>
          <source>IEEE Trans Audio Speech Lang Process</source>
          <year>2011</year>
          <month>09</month>
          <day>01</day>
          <volume>19</volume>
          <issue>7</issue>
          <fpage>2081</fpage>
          <lpage>2090</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/22199464"/>
          </comment>
          <pub-id pub-id-type="doi">10.1109/TASL.2011.2112351</pub-id>
          <pub-id pub-id-type="medline">22199464</pub-id>
          <pub-id pub-id-type="pmcid">PMC3244269</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sajjadi</surname>
              <given-names>SA</given-names>
            </name>
            <name name-style="western">
              <surname>Patterson</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Nestor</surname>
              <given-names>PJ</given-names>
            </name>
          </person-group>
          <article-title>Logopenic, mixed, or Alzheimer-related aphasia?</article-title>
          <source>Neurology</source>
          <year>2014</year>
          <month>04</month>
          <day>01</day>
          <volume>82</volume>
          <issue>13</issue>
          <fpage>1127</fpage>
          <lpage>1131</lpage>
          <pub-id pub-id-type="doi">10.1212/WNL.0000000000000271</pub-id>
          <pub-id pub-id-type="medline">24574548</pub-id>
          <pub-id pub-id-type="pii">WNL.0000000000000271</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Shimada</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Meguro</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Yamazaki</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Horikawa</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Hayasaka</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Yamaguchi</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Yamaguchi</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Katsuyama</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Nakano</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Yamadori</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Impaired verbal description ability assessed by the Picture Description Task in Alzheimer's disease</article-title>
          <source>Arch Gerontol Geriatr</source>
          <year>1998</year>
          <volume>27</volume>
          <issue>1</issue>
          <fpage>57</fpage>
          <lpage>65</lpage>
          <pub-id pub-id-type="medline">18653151</pub-id>
          <pub-id pub-id-type="pii">S0167-4943(98)00099-5</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref34">
        <label>34</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yancheva</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Fraser</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Rudzicz</surname>
              <given-names>F</given-names>
            </name>
          </person-group>
          <article-title>Using linguistic features longitudinally to predict clinical scores for Alzheimer's disease and related dementias</article-title>
          <year>2015</year>
          <conf-name>Proceedings of SLPAT 6th Workshop on Speech and Language Processing for Assistive Technologies</conf-name>
          <conf-date>2015</conf-date>
          <conf-loc>Dresden</conf-loc>
          <fpage>134</fpage>
          <lpage>139</lpage>
          <pub-id pub-id-type="doi">10.18653/v1/w15-5123</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref35">
        <label>35</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Henry</surname>
              <given-names>JD</given-names>
            </name>
            <name name-style="western">
              <surname>Crawford</surname>
              <given-names>JR</given-names>
            </name>
            <name name-style="western">
              <surname>Phillips</surname>
              <given-names>LH</given-names>
            </name>
          </person-group>
          <article-title>Verbal fluency performance in dementia of the Alzheimer's type: a meta-analysis</article-title>
          <source>Neuropsychologia</source>
          <year>2004</year>
          <volume>42</volume>
          <issue>9</issue>
          <fpage>1212</fpage>
          <lpage>1222</lpage>
          <pub-id pub-id-type="doi">10.1016/j.neuropsychologia.2004.02.001</pub-id>
          <pub-id pub-id-type="medline">15178173</pub-id>
          <pub-id pub-id-type="pii">S0028393204000296</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref36">
        <label>36</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kavé</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Goral</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Word retrieval in connected speech in Alzheimer's disease: a review with meta-analyses</article-title>
          <source>Aphasiology</source>
          <year>2018</year>
          <volume>32</volume>
          <fpage>4</fpage>
          <lpage>26</lpage>
          <pub-id pub-id-type="doi">10.1080/02687038.2017.1338663</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref37">
        <label>37</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>König</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Satt</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Sorin</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Hoory</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Toledo-Ronen</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Derreumaux</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Manera</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Verhey</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Aalten</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Robert</surname>
              <given-names>PH</given-names>
            </name>
            <name name-style="western">
              <surname>David</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Automatic speech analysis for the assessment of patients with predementia and Alzheimer's disease</article-title>
          <source>Alzheimers Dement (Amst)</source>
          <year>2015</year>
          <month>03</month>
          <volume>1</volume>
          <issue>1</issue>
          <fpage>112</fpage>
          <lpage>124</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://linkinghub.elsevier.com/retrieve/pii/S2352-8729(15)00016-0"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.dadm.2014.11.012</pub-id>
          <pub-id pub-id-type="medline">27239498</pub-id>
          <pub-id pub-id-type="pii">S2352-8729(15)00016-0</pub-id>
          <pub-id pub-id-type="pmcid">PMC4876915</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref38">
        <label>38</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lunsford</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Heeman</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Using linguistic indicators of difficulty to identify mild cognitive impairment</article-title>
          <year>2015</year>
          <conf-name>INTERSPEECH 2015</conf-name>
          <conf-date>2015</conf-date>
          <conf-loc>Dresden</conf-loc>
          <fpage>658</fpage>
          <lpage>662</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref39">
        <label>39</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chinaei</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Currie</surname>
              <given-names>LC</given-names>
            </name>
            <name name-style="western">
              <surname>Danks</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Lin</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Mehta</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Rudzicz</surname>
              <given-names>F</given-names>
            </name>
          </person-group>
          <article-title>Identifying and avoiding confusion in dialogue with people with Alzheimer's disease</article-title>
          <source>Computational Linguistics</source>
          <year>2017</year>
          <month>06</month>
          <volume>43</volume>
          <issue>2</issue>
          <fpage>377</fpage>
          <lpage>406</lpage>
          <pub-id pub-id-type="doi">10.1162/coli_a_00290</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref40">
        <label>40</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Boschi</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Catricalà</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Consonni</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Chesi</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Moro</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Cappa</surname>
              <given-names>SF</given-names>
            </name>
          </person-group>
          <article-title>Connected speech in neurodegenerative language disorders: a review</article-title>
          <source>Front Psychol</source>
          <year>2017</year>
          <volume>8</volume>
          <fpage>269</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.3389/fpsyg.2017.00269"/>
          </comment>
          <pub-id pub-id-type="doi">10.3389/fpsyg.2017.00269</pub-id>
          <pub-id pub-id-type="medline">28321196</pub-id>
          <pub-id pub-id-type="pmcid">PMC5337522</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref41">
        <label>41</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Cook</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Fay</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Rockwood</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Verbal repetition in people with mild-to-moderate Alzheimer Disease: a descriptive analysis from the VISTA clinical trial</article-title>
          <source>Alzheimer Dis Assoc Disord</source>
          <year>2009</year>
          <volume>23</volume>
          <issue>2</issue>
          <fpage>146</fpage>
          <lpage>151</lpage>
          <pub-id pub-id-type="doi">10.1097/WAD.0b013e318193cbef</pub-id>
          <pub-id pub-id-type="medline">19474572</pub-id>
          <pub-id pub-id-type="pii">00002093-200904000-00008</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref42">
        <label>42</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kudo</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <source>Mecab: yet another part-of-speech and morphological analyzer</source>
          <year>2005</year>
          <access-date>2019-12-22</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.semanticscholar.org/paper/MeCab-%3A-Yet-Another-Part-of-Speech-and-Analyzer-Kudo/70b849773678010942a0975f2887e527c17cda76#paper-header">https://www.semanticscholar.org/paper/MeCab-%3A-Yet-Another-Part-of-Speech-and-Analyzer-Kudo/70b849773678010942a0975f2887e527c17cda76#paper-header</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref43">
        <label>43</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Honoré</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <source>Some simple measures of richness of vocabulary</source>
          <year>1979</year>
          <access-date>2019-12-22</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.semanticscholar.org/paper/Some-Simple-Measures-of-Richness-of-Vocabulary-Honor%C3%A9/68d636546e452d9ec1dc5b3f5d2977cc53b182cb">https://www.semanticscholar.org/paper/Some-Simple-Measures-of-Richness-of-Vocabulary-Honor%C3%A9/68d636546e452d9ec1dc5b3f5d2977cc53b182cb</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref44">
        <label>44</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yan</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Guo</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Lan</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Cheng</surname>
              <given-names>X</given-names>
            </name>
          </person-group>
          <article-title>BTM: topic modeling over short texts</article-title>
          <source>IEEE Transact Knowl Data Engineer</source>
          <year>2014</year>
          <volume>26</volume>
          <issue>12</issue>
          <fpage>2928</fpage>
          <lpage>2941</lpage>
          <pub-id pub-id-type="doi">10.1109/tkde.2014.2313872</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref45">
        <label>45</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Blei</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Ng</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Jordan</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Latent dirichlet allocation</article-title>
          <source>J Mach Learn Res</source>
          <year>2003</year>
          <volume>3</volume>
          <fpage>993</fpage>
          <lpage>1022</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref46">
        <label>46</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Goodglass</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Kaplan</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <source>The Boston Diagnostic Aphasia Examination</source>
          <year>1983</year>
          <publisher-loc>Philadelphia</publisher-loc>
          <publisher-name>Lea &amp; Febinger</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref47">
        <label>47</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Swinburn</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Porter</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Howard</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <source>Comprehensive Aphasia Test</source>
          <year>2004</year>
          <publisher-loc>Hove</publisher-loc>
          <publisher-name>Psychology Press</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref48">
        <label>48</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wechsler</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <source>Wechsler Memory Scale. Third Edition Manual</source>
          <year>1997</year>
          <publisher-loc>San Antonio</publisher-loc>
          <publisher-name>The Psychological Corp</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref49">
        <label>49</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kudo</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <source>Cabocha: yet another Japanese dependency structure analyzer</source>
          <access-date>2019-12-22</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://taku910.github.io/cabocha/">https://taku910.github.io/cabocha/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref50">
        <label>50</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Liang</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Dependency distance: a new perspective on syntactic patterns in natural languages</article-title>
          <source>Phys Life Rev</source>
          <year>2017</year>
          <month>07</month>
          <volume>21</volume>
          <fpage>171</fpage>
          <lpage>193</lpage>
          <pub-id pub-id-type="doi">10.1016/j.plrev.2017.03.002</pub-id>
          <pub-id pub-id-type="medline">28624589</pub-id>
          <pub-id pub-id-type="pii">S1571-0645(17)30053-2</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref51">
        <label>51</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Masrani</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Murray</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Field</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Carenini</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Detecting dementia through retrospective analysis of routine blog posts by bloggers with dementia</article-title>
          <source>BioNLP</source>
          <year>2017</year>
          <fpage>232</fpage>
          <lpage>237</lpage>
          <pub-id pub-id-type="doi">10.18653/v1/w17-2329</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref52">
        <label>52</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Nakagawa</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Cuthill</surname>
              <given-names>IC</given-names>
            </name>
          </person-group>
          <article-title>Effect size, confidence interval and statistical significance: a practical guide for biologists</article-title>
          <source>Biol Rev Camb Philos Soc</source>
          <year>2007</year>
          <month>11</month>
          <volume>82</volume>
          <issue>4</issue>
          <fpage>591</fpage>
          <lpage>605</lpage>
          <pub-id pub-id-type="doi">10.1111/j.1469-185X.2007.00027.x</pub-id>
          <pub-id pub-id-type="medline">17944619</pub-id>
          <pub-id pub-id-type="pii">BRV27</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref53">
        <label>53</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Greene</surname>
              <given-names>JD</given-names>
            </name>
            <name name-style="western">
              <surname>Baddeley</surname>
              <given-names>AD</given-names>
            </name>
            <name name-style="western">
              <surname>Hodges</surname>
              <given-names>JR</given-names>
            </name>
          </person-group>
          <article-title>Analysis of the episodic memory deficit in early Alzheimer's disease: evidence from the doors and people test</article-title>
          <source>Neuropsychologia</source>
          <year>1996</year>
          <month>06</month>
          <volume>34</volume>
          <issue>6</issue>
          <fpage>537</fpage>
          <lpage>551</lpage>
          <pub-id pub-id-type="doi">10.1016/0028-3932(95)00151-4</pub-id>
          <pub-id pub-id-type="medline">8736567</pub-id>
          <pub-id pub-id-type="pii">0028-3932(95)00151-4</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref54">
        <label>54</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Carlesimo</surname>
              <given-names>GA</given-names>
            </name>
            <name name-style="western">
              <surname>Mauri</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Graceffa</surname>
              <given-names>AM</given-names>
            </name>
            <name name-style="western">
              <surname>Fadda</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Loasses</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Lorusso</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Caltagirone</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Memory performances in young, elderly, and very old healthy individuals versus patients with Alzheimer's disease: evidence for discontinuity between normal and pathological aging</article-title>
          <source>J Clin Exp Neuropsychol</source>
          <year>1998</year>
          <month>02</month>
          <volume>20</volume>
          <issue>1</issue>
          <fpage>14</fpage>
          <lpage>29</lpage>
          <pub-id pub-id-type="doi">10.1076/jcen.20.1.14.1482</pub-id>
          <pub-id pub-id-type="medline">9672816</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref55">
        <label>55</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Weston</surname>
              <given-names>PSJ</given-names>
            </name>
            <name name-style="western">
              <surname>Nicholas</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Henley</surname>
              <given-names>SMD</given-names>
            </name>
            <name name-style="western">
              <surname>Liang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Macpherson</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Donnachie</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Schott</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Rossor</surname>
              <given-names>MN</given-names>
            </name>
            <name name-style="western">
              <surname>Crutch</surname>
              <given-names>SJ</given-names>
            </name>
            <name name-style="western">
              <surname>Butler</surname>
              <given-names>CR</given-names>
            </name>
            <name name-style="western">
              <surname>Zeman</surname>
              <given-names>AZ</given-names>
            </name>
            <name name-style="western">
              <surname>Fox</surname>
              <given-names>NC</given-names>
            </name>
          </person-group>
          <article-title>Accelerated long-term forgetting in presymptomatic autosomal dominant Alzheimer's disease: a cross-sectional study</article-title>
          <source>Lancet Neurol</source>
          <year>2018</year>
          <month>02</month>
          <volume>17</volume>
          <issue>2</issue>
          <fpage>123</fpage>
          <lpage>132</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1474-4422(17)30434-9"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/S1474-4422(17)30434-9</pub-id>
          <pub-id pub-id-type="medline">29413314</pub-id>
          <pub-id pub-id-type="pii">S1474-4422(17)30434-9</pub-id>
          <pub-id pub-id-type="pmcid">PMC5958413</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref56">
        <label>56</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Jarrold</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Peintner</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Wilkins</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Aided diagnosis of dementia type through computer-based analysis of spontaneous speech</article-title>
          <year>2014</year>
          <conf-name>Proceedings of the Workshop on Computational Linguistics and Clinical Psychology</conf-name>
          <conf-date>2014</conf-date>
          <conf-loc>Baltimore</conf-loc>
          <fpage>27</fpage>
          <lpage>37</lpage>
          <pub-id pub-id-type="doi">10.3115/v1/w14-3204</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref57">
        <label>57</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Fraser</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <source>Automatic Text and Speech Processing for the Detection of Dementia [Thesis]</source>
          <year>2016</year>
          <publisher-loc>Toronto</publisher-loc>
          <publisher-name>University of Toronto</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref58">
        <label>58</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Manfredi</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Lebacq</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Cantarella</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Schoentgen</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Orlandi</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Bandini</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>DeJonckere</surname>
              <given-names>PH</given-names>
            </name>
          </person-group>
          <article-title>Smartphones Offer New Opportunities in Clinical Voice Research</article-title>
          <source>J Voice</source>
          <year>2017</year>
          <month>01</month>
          <volume>31</volume>
          <issue>1</issue>
          <fpage>111.e1</fpage>
          <lpage>111.e7</lpage>
          <pub-id pub-id-type="doi">10.1016/j.jvoice.2015.12.020</pub-id>
          <pub-id pub-id-type="medline">27068549</pub-id>
          <pub-id pub-id-type="pii">S0892-1997(16)00005-9</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref59">
        <label>59</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Van Mierlo</surname>
              <given-names>LD</given-names>
            </name>
            <name name-style="western">
              <surname>Wouters</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Sikkes</surname>
              <given-names>SA</given-names>
            </name>
            <name name-style="western">
              <surname>Van der Flier</surname>
              <given-names>WM</given-names>
            </name>
            <name name-style="western">
              <surname>Prins</surname>
              <given-names>ND</given-names>
            </name>
            <name name-style="western">
              <surname>Bremer</surname>
              <given-names>JA</given-names>
            </name>
            <name name-style="western">
              <surname>Koene</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Van Hout</surname>
              <given-names>HPJ</given-names>
            </name>
          </person-group>
          <article-title>Screening for mild cognitive impairment and dementia with automated, anonymous online and telephone cognitive self-tests</article-title>
          <source>J Alzheimers Dis</source>
          <year>2017</year>
          <volume>56</volume>
          <issue>1</issue>
          <fpage>249</fpage>
          <lpage>259</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/27911296"/>
          </comment>
          <pub-id pub-id-type="doi">10.3233/JAD-160566</pub-id>
          <pub-id pub-id-type="medline">27911296</pub-id>
          <pub-id pub-id-type="pii">JAD160566</pub-id>
          <pub-id pub-id-type="pmcid">PMC5389042</pub-id>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
