<?xml version="1.0" encoding="utf-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMH</journal-id>
      <journal-id journal-id-type="nlm-ta">JMIR Ment Health</journal-id>
      <journal-title>JMIR Mental Health</journal-title>
      <issn pub-type="epub">2368-7959</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
    <article-id pub-id-type="publisher-id">v4i1e7</article-id>
    <article-id pub-id-type="pmid">28223264</article-id>
    <article-id pub-id-type="doi">10.2196/mental.6545</article-id>
    <article-categories>
      <subj-group subj-group-type="heading">
        <subject>Original Paper</subject>
      </subj-group>
      <subj-group subj-group-type="article-type">
        <subject>Original Paper</subject>
      </subj-group>
    </article-categories>
    <title-group>
      <article-title>Applying Computerized Adaptive Testing to the Four-Dimensional Symptom Questionnaire (4DSQ): A Simulation Study</article-title>
    </title-group>
    <contrib-group>
      <contrib contrib-type="editor">
        <name>
          <surname>Eysenbach</surname>
          <given-names>Gunther</given-names>
        </name>
      </contrib>
    </contrib-group>
    <contrib-group>
      <contrib contrib-type="reviewer">
        <name>
          <surname>Gardner</surname>
          <given-names>William</given-names>
        </name>
      </contrib>
      <contrib contrib-type="reviewer">
        <name>
          <surname>Geraghty</surname>
          <given-names>Adam</given-names>
        </name>
      </contrib>
    </contrib-group>
    <contrib-group>
      <contrib contrib-type="author" id="contrib1" corresp="yes">
      <name name-style="western">
        <surname>Magnée</surname>
        <given-names>Tessa</given-names>
      </name>
      <degrees>MSc (Psych)</degrees>
      <xref rid="aff1" ref-type="aff">1</xref>
      <address>
        <institution>Netherlands Institute for Health Services Research (NIVEL)</institution>
        <addr-line>Otterstraat 118-114</addr-line>
        <addr-line>Utrecht, 3500BN</addr-line>
        <country>Netherlands</country>
        <phone>31 302729854</phone>
        <fax>31 302729729</fax>
        <email>t.magnee@nivel.nl</email>
      </address>  
      <ext-link ext-link-type="orcid">http://orcid.org/0000-0002-6029-0906</ext-link></contrib>
      <contrib contrib-type="author" id="contrib2">
        <name name-style="western">
          <surname>de Beurs</surname>
          <given-names>Derek P</given-names>
        </name>
        <degrees>PhD</degrees>
        <xref rid="aff1" ref-type="aff">1</xref>
        <ext-link ext-link-type="orcid">http://orcid.org/0000-0002-0166-6897</ext-link>
      </contrib>
      <contrib contrib-type="author" id="contrib3">
        <name name-style="western">
          <surname>Terluin</surname>
          <given-names>Berend</given-names>
        </name>
        <degrees>MD, PhD</degrees>
        <xref rid="aff2" ref-type="aff">2</xref>
        <ext-link ext-link-type="orcid">http://orcid.org/0000-0002-8944-5238</ext-link>
      </contrib>
      <contrib contrib-type="author" id="contrib4">
        <name name-style="western">
          <surname>Verhaak</surname>
          <given-names>Peter F</given-names>
        </name>
        <degrees>PhD</degrees>
        <xref rid="aff1" ref-type="aff">1</xref>
        <xref rid="aff3" ref-type="aff">3</xref>
        <ext-link ext-link-type="orcid">http://orcid.org/0000-0001-5764-3451</ext-link>
      </contrib>
    </contrib-group>
    <aff id="aff1">
      <sup>1</sup>
      <institution>Netherlands Institute for Health Services Research (NIVEL)</institution>
      <addr-line>Utrecht</addr-line>
      <country>Netherlands</country>
    </aff>
    <aff id="aff2">
    <sup>2</sup>
    <institution>EMGO Institute for Health and Care Research</institution>
    <institution>Department of General Practice and Elderly Care Medicine</institution>  
    <institution>VU University Medical Center</institution>  
    <addr-line>Amsterdam</addr-line>
    <country>Netherlands</country></aff>
    <aff id="aff3">
    <sup>3</sup>
    <institution>Groningen University</institution>
    <institution>University Medical Center Groningen</institution>  
    <institution>Department of General Practice</institution>  
    <addr-line>Groningen</addr-line>
    <country>Netherlands</country></aff>
    <author-notes>
      <corresp>Corresponding Author: Tessa Magnée 
      <email>t.magnee@nivel.nl</email></corresp>
    </author-notes>
    <pub-date pub-type="collection"><season>Jan-Mar</season><year>2017</year></pub-date>
    <pub-date pub-type="epub">
      <day>21</day>
      <month>02</month>
      <year>2017</year>
    </pub-date>
    <volume>4</volume>
    <issue>1</issue>
    <elocation-id>e7</elocation-id>
    <!--history from ojs - api-xml-->
    <history>
      <date date-type="received">
        <day>26</day>
        <month>8</month>
        <year>2016</year>
      </date>
      <date date-type="rev-request">
        <day>5</day>
        <month>12</month>
        <year>2016</year>
      </date>
      <date date-type="rev-recd">
        <day>22</day>
        <month>12</month>
        <year>2016</year>
      </date>
      <date date-type="accepted">
        <day>30</day>
        <month>1</month>
        <year>2017</year>
      </date>
    </history>
    <!--(c) the authors - correct author names and publication date here if necessary. Date in form ', dd.mm.yyyy' after jmir.org-->
    <copyright-statement>©Tessa Magnée, Derek P de Beurs, Berend Terluin, Peter F Verhaak. Originally published in JMIR Mental Health (http://mental.jmir.org), 21.02.2017.</copyright-statement>
    <copyright-year>2017</copyright-year>
    <license license-type="open-access" xlink:href="http://creativecommons.org/licenses/by/2.0/">
      <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (http://creativecommons.org/licenses/by/2.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Mental Health, is properly cited. The complete bibliographic information, a link to the original publication on http://mental.jmir.org/, as well as this copyright and license information must be included.</p>
    </license>  
    <self-uri xlink:href="http://mental.jmir.org/2017/1/e7/" xlink:type="simple"/>
    <abstract>
      <sec sec-type="background">
        <title>Background</title>
        <p>Efficient screening questionnaires are useful in general practice. Computerized adaptive testing (CAT) is a method to improve the efficiency of questionnaires, as only the items that are particularly informative for a certain responder are dynamically selected.</p>
      </sec>
      <sec sec-type="objective">
        <title>Objective</title>
        <p>The objective of this study was to test whether CAT could improve the efficiency of the Four-Dimensional Symptom Questionnaire (4DSQ), a frequently used self-report questionnaire designed to assess common psychosocial problems in general practice.</p>
      </sec>
      <sec sec-type="methods">
        <title>Methods</title>
        <p>A simulation study was conducted using a sample of Dutch patients visiting a general practitioner (GP) with psychological problems (n=379). Responders completed a paper-and-pencil version of the 50-item 4DSQ and a psychometric evaluation was performed to check if the data agreed with item response theory (IRT) assumptions. Next, a CAT simulation was performed for each of the four 4DSQ scales (distress, depression, anxiety, and somatization), based on the given responses as if they had been collected through CAT. The following two stopping rules were applied for the administration of items: (1) stop if measurement precision is below a predefined level, or (2) stop if more than half of the items of the subscale are administered.</p>
      </sec>
      <sec sec-type="results">
        <title>Results</title>
        <p>In general, the items of each of the four scales agreed with IRT assumptions. Application of the first stopping rule reduced the length of the questionnaire by 38% (from 50 to 31 items on average). When the second stopping rule was also applied, the total number of items could be reduced by 56% (from 50 to 22 items on average).</p>
      </sec>
      <sec sec-type="conclusions">
        <title>Conclusions</title>
        <p>CAT seems useful for improving the efficiency of the 4DSQ by 56% without losing a considerable amount of measurement precision. The CAT version of the 4DSQ may be useful as part of an online assessment to investigate the severity of mental health problems of patients visiting a GP. This simulation study is the first step needed for the development of a CAT version of the 4DSQ. A CAT version of the 4DSQ could be of high value for Dutch GPs since increasing numbers of patients with mental health problems are visiting the general practice. In further research, the results of a real-time CAT should be compared with the results of the administration of the full scale.</p>
      </sec>
    </abstract>
    <kwd-group>
      <kwd>item response theory</kwd>
      <kwd>Four-Dimensional Symptom Questionnaire</kwd>
      <kwd>computerized adaptive testing</kwd>
      <kwd>mental health</kwd>
      <kwd>general practice</kwd>
    </kwd-group></article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <p>General practitioners (GPs) are often the first point of contact for persons with mental health problems, and they make important decisions about treatment and referrals. However, GPs vary in their ability to detect mental problems in patients during consultations [<xref ref-type="bibr" rid="ref1">1</xref>] and may have difficulties distinguishing between “normal” psychological distress and psychopathology [<xref ref-type="bibr" rid="ref2">2</xref>]. Moreover, time pressure in general practice is increasing.</p>
      <p>Using a short, good quality screener to distinguish between mild psychological symptoms and severe disorders has become of particular importance for Dutch GPs, as they have been restricted to refer only patients with a Diagnostic and Statistical Manual of Mental Disorders 4th edition (DSM-IV) disorder [<xref ref-type="bibr" rid="ref3">3</xref>] to mental health care professionals.</p>
      <p>The Four-Dimensional Symptom Questionnaire (4DSQ; <xref ref-type="app" rid="app1">Multimedia Appendix 1</xref>) is a frequently used self-report questionnaire designed to assess common psychosocial problems in general practice [<xref ref-type="bibr" rid="ref4">4</xref>]. It consists of four subscales measuring distress, depression, anxiety, and somatization. The 4DSQ is available in Dutch, English, and several other languages and has been widely used and validated in clinical practice. The full version of the 4DSQ comprises 50 items. It has been found that most responders need 7 minutes to complete the full version and 75% of all responders complete the 4DSQ within 10 minutes [<xref ref-type="bibr" rid="ref4">4</xref>]. Responses to the questionnaire can be used to distinguish between patients with “normal” psychological distress and patients with psychopathology [<xref ref-type="bibr" rid="ref5">5</xref>-<xref ref-type="bibr" rid="ref7">7</xref>]. This is of increasing importance for GPs who have to make crucial decisions about the triage of patients with mental health problems.</p>
      <p>Computerized adaptive testing (CAT) is a method to reduce patient burden of traditional questionnaires, by letting a computer dynamically select only the items that give new information about the patient. Based on a patient’s answer to a single first item, a responder’s underlying trait (eg, level of depression) is estimated. In addition, an automated algorithm selects the next item that is most appropriate or informative for this responder. The benefit of using CAT is the reduction in items without a loss in reliability or precision in measurement [<xref ref-type="bibr" rid="ref8">8</xref>].</p>
      <p>CAT relies on item response theory (IRT) [<xref ref-type="bibr" rid="ref9">9</xref>]. A CAT version of the Center for Epidemiologic Studies-Depression (CES-D) scale, one of the most widely used depression screeners, provided only marginally different outcomes with a decreased number of items compared to the full version [<xref ref-type="bibr" rid="ref10">10</xref>]. CAT has also been applied successfully to other mental health questionnaires, such as the Beck Depression Inventory [<xref ref-type="bibr" rid="ref11">11</xref>], the Beck Scale for Suicide Ideation [<xref ref-type="bibr" rid="ref12">12</xref>], and the 90-item Mood and Anxiety Symptom Questionnaire [<xref ref-type="bibr" rid="ref13">13</xref>] and seems more accurate than a simple short-form version of an assessment [<xref ref-type="bibr" rid="ref14">14</xref>]. It is not clear yet if the efficiency of screening for common mental health problems in general practice can be increased by developing an adaptive version of the 4DSQ.</p>
      <p>The aims of this simulation study were (1) to investigate if responses of a clinical sample to a paper-and-pencil version of the 4DSQ meet the psychometric requirements needed for IRT; and (2) to determine if a simulated adaptive version of the 4DSQ would yield inferences similar to those based on the full version of the 4DSQ. This simulation study is the first step necessary for the development of a CAT version of the 4DSQ.</p>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Participants</title>
        <p>We used data collected in the baseline measurement of a study evaluating triage decisions in general practice. All patients with mental health problems visiting a GP working in a primary care center in the northern part of the Netherlands between January 1 and December 31, 2014 were included in the study (N=408). All included participants provided informed consent. Participants filled in the Dutch paper-and-pen version of the 4DSQ and only patients with complete data were included in the analyses (92.9%, 379/408). As a result, our final sample consisted of 379 participants with a mean age of 44.8 years (SD 16.5, range 16 to 87). Of the participants, 66.8% (253/379) were female. No significant differences in age (<italic>P</italic>=.715) or sex (<italic>P</italic>=.205) were found between responders with and without complete data.</p>
      </sec>
      <sec>
        <title>Psychometric Evaluation</title>
        <p>Since all four of the 4DSQ scales are used and interpreted separately, we performed the psychometric evaluation and our analyses for each of the four scales separately. We followed the five steps described in the analysis plan used for the PROMIS study, which was aimed at improving patient-reported outcome instruments [<xref ref-type="bibr" rid="ref8">8</xref>].</p>
        <sec>
          <title>Step 1: Descriptive Statistics</title>
          <p>Descriptive statistics were calculated for each single item (<xref ref-type="app" rid="app2">Multimedia Appendix 2</xref>). The 4DSQ consists of questions about complaints and symptoms that occurred during the previous week, such as “During the past week, did you feel tense?” Responders indicated how often they experienced these symptoms by answering “no,” “sometimes,” “regularly,” “often,” or “very often or constantly.” According to the scoring protocol, responses were coded as 0 (no), 1 (sometimes), 2 (regularly, often, or very often/constantly). The four 4DSQ scales vary in the total number of items: 16 items for distress, 6 for depression, 12 for anxiety, and 16 for somatization. A total score was calculated for each scale by adding up all item scores. To examine internal consistency, Cronbach alpha was calculated for each scale, with .8 as the acceptable minimum. We analyzed whether removing any of the items changed the internal consistency of a scale.</p>
        </sec>
        <sec>
          <title>Step 2: Evaluate Item Response Theory Assumptions</title>
          <p>Within IRT, data have to agree with three basic assumptions: unidimensionality, local independency, and monotonicity [<xref ref-type="bibr" rid="ref8">8</xref>].</p>
          <p>Unidimensionality means that a person’s response to an item is accounted for by his or her level on the underlying trait and not by any other factor. A confirmatory factor analysis (CFA) with ordinal data was performed to study unidimensionality for each scale. The model’s fit was assessed using four frequently used fit indices: comparative fit index (CFI) greater than 0.95 for good fit, root mean square error of approximation (RMSEA) less than 0.06 for good fit, Tucker Lewis index (TLI) greater than 0.95 for good fit, and standardized root mean residuals (SRMR) less than 0.08 for good fit.</p>
          <p>Local independence means that there should be no significant association among item responses, except for the association controlled for by the underlying trait. This assumption was checked by inspecting residual correlations between item pairs within the CFA. Items with high residual correlations (greater than 0.2) were considered as possibly locally dependent.</p>
          <p>The assumption of monotonicity means that the probability of an item response related to a higher level of the trait should increase with the level of the trait. This assumption was studied by plotting trace lines. In addition, we studied scalability coefficients of IRT probability curves (greater than 0.3 indicates monotonicity).</p>
        </sec>
        <sec>
          <title>Step 3: Graded Response Model Fit</title>
          <p>Within IRT, several models are commonly used; however, because of the ordered-response categories of the 4DSQ, a graded response model (GRM) was preferred for our data [<xref ref-type="bibr" rid="ref15">15</xref>]. This model estimates at which levels of an underlying trait (θ), such as depression, a person is likely to choose one of the response options of an item. For each single item, several GRM parameters are estimated. The discrimination parameter (α) represents the extent to which an item discriminates between different trait levels. An item with a high alpha is strongly associated with the measured construct. Two difficulty or threshold parameters (ß<sub>1</sub> and ß<sub>2</sub>) were also estimated. A category response curve (CRC), based on the estimated parameters, was plotted for each item to evaluate the fit of the model to the data.</p>
        </sec>
        <sec>
          <title>Step 4: Differential Item Functioning</title>
          <p>An item displays differential item functioning (DIF) if persons with different characteristics (eg, males and females) respond differently to an item, despite equivalent levels of the underlying trait [<xref ref-type="bibr" rid="ref8">8</xref>]. Items showing DIF may bias CAT outcomes. To check for DIF (uniform and non-uniform), GRM estimates of each item were compared between subgroups varying in gender (male or female) and age (R<sup>2</sup> less than .03 indicating no DIF).</p>
        </sec>
        <sec>
          <title>Step 5: Simulated Computerized Adaptive Testing</title>
          <p>The GRM parameter estimates from Step 3 were used for a CAT simulation. As no information on a subject is available before the first item is administered, θ is initially set at 0. After the first item is answered, the choice for the next item is based on the GRM parameters of all potential next items in relation to the response to the item that was answered first. All optimal next items are selected based on the maximum Fisher estimation method. The CAT selects new items until a pre-defined stopping rule is reached. A stopping rule is based on either a maximum number of items administered or on a pre-specified level of measurement precision [<xref ref-type="bibr" rid="ref10">10</xref>-<xref ref-type="bibr" rid="ref13">13</xref>].</p>
          <p>We combined the two following stopping rules: (1) stop when the standard error of the trait is similar to the standard error of the full-length scale, or (2) stop when half of the items of the full scale have been administered. We compared CAT outcomes with the first stopping rule only and with both stopping rules. Regarding the first stopping rule, we inspected varying levels of standard error (from 0.2 to 0.8). The pre-defined standard error of theta that corresponded with the standard error of the full scale was used as a reference point. Correlations were calculated between trait levels based on CAT and on the scores from the full version of the 4DSQ. We added a second stopping rule because questionnaires in mental health often are most informative for patients with relatively high levels of clinical outcomes [<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref16">16</xref>,<xref ref-type="bibr" rid="ref17">17</xref>]. For patients with a low level of the assessed outcome (eg, patients with low levels of depression), many items provide little (additional) information. Ironically, as the CAT algorithm finds it difficult to estimate the standard error when items offer little information, patients with a low trait level often have to answer all items, even though they provide no new information.</p>
        </sec>
      </sec>
      <sec>
        <title>Software</title>
        <p>The descriptive statistics and the estimation of the GRM parameters were done in STATA 14.0. The CFA model was estimated using the lavaan package in R [<xref ref-type="bibr" rid="ref18">18</xref>,<xref ref-type="bibr" rid="ref19">19</xref>]. Monotonicity was checked using the R mokken package [<xref ref-type="bibr" rid="ref20">20</xref>] and DIF with the R lordif package [<xref ref-type="bibr" rid="ref21">21</xref>]. The CAT simulation was done with the CatIRT package in R [<xref ref-type="bibr" rid="ref22">22</xref>].</p>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>Step 1: Descriptive Statistics</title>
        <p>The sample’s mean total score on the 4DSQ distress scale was 18.6 (SE 0.43, range 0-32, median 20), with an overall Cronbach alpha of .92. The mean depression score was 3.4 (SE 0.20, range 0-12, median 2), with a Cronbach alpha of .90. The mean score for anxiety was 5.5 (SE 0.27, range 0-23, median 4), with a Cronbach alpha of .87. Finally, for the somatization scale, the sample scored 11.6 on average (SE 0.35, range 0-32, median 11), with a Cronbach alpha of .85. These results were comparable to other studies [<xref ref-type="bibr" rid="ref4">4</xref>,<xref ref-type="bibr" rid="ref7">7</xref>]. The descriptive statistics of the single items on the four scales are shown in <xref ref-type="app" rid="app2">Multimedia Appendix 2</xref>. Removing any one of the items did not change the internal consistency of any of the four scales.</p>
      </sec>
      <sec>
        <title>Step 2: Checking Item Response Theory Assumptions</title>
        <p>Regarding the first assumption, unidimensionality, we concluded that the items of the anxiety scale showed a good model fit for all four fit indices of the CFA. The items of the distress and depression scales showed a good fit for three of the four indices, but not for RMSEA, although they nearly did. For good fit, RMSEA should be lower than 0.06, but it was 0.08 (distress) and 0.07 (depression). The items of the somatization scale showed good fit for two out of four indices, but not for RMSEA (0.07 instead of less than 0.06) and TLI (0.94 instead of greater than 0.95).</p>
        <p>Regarding the second assumption, out of 321 item pairs within the four scales (equation 1), two item pairs with a residual correlation above 0.2 were observed, indicating local independency. They were items 20 and 39 (sleep-related), and items 47 and 48 (trauma-related), all from the distress scale.</p>
        <p>321=(½)(6)(5) + (½)(16)(15) + (½)(12)(11) + (½)(16)(15) (1)</p>
        <p>The scalability coefficient of all items was higher than 0.3, indicating that all items met the third assumption of monotonicity.</p>
      </sec>
      <sec>
        <title>Step 3: Graded Response Model Fit</title>
        <p>The parameter estimates of the GRM for all items of the four scales are shown in <xref ref-type="app" rid="app3">Multimedia Appendix 3</xref>. Item 33 (“would be better off dead”) of the depression scale showed the highest alpha (7.377) and discriminates best between persons with low and high levels of depression. For the three other scales, the highest alphas were observed for item 37 (3.483, distress, “no longer feel like doing anything”), item 27 (5.527, anxiety, “feel frightened”), and item 16 (1.855, somatization, “pain in the chest”). All other items showed an alpha above 1, except for items 47 and 48 (distress), item 50 (anxiety), and items 6 and 8 (somatization).</p>
        <p>It was found that 43 items showed CRCs as expected. Five items on the anxiety scale (40, 42, 43, 49, and 50) and two items on the somatization scale (5 and 14) did not show CRCs as expected. For those items, the probability to answer “sometimes” was always lower than the probability for one of the other responses, regardless of the trait level.</p>
        <p>As an example, <xref ref-type="fig" rid="figure1">Figure 1</xref> shows the CRCs of the items with the highest (item 33; α=7.377, ß<sub>1</sub>=0.688, ß<sub>2</sub>=1.349) and lowest (item 35; α=2.457, ß<sub>1</sub>=0.119, ß<sub>2</sub>=0.828) discrimination parameter (α) of the depression scale. The higher discrimination parameter of item 33 indicates an ability to demarcate fine gradations between persons with similar levels of depression. This can be observed in <xref ref-type="fig" rid="figure1">Figure 1</xref>, which shows steep curves for different answer categories for item 33. In general, item 35 (no escape from situation) is more easily endorsed than item 33 (would be better off dead), which is indicated by the location of the curves more on the left side of the graph. Persons with a high depression level are most likely to answer “sometimes” to item 33, and to answer “regularly,” “often,” or “very often or constantly” to item 35.</p>
        <fig id="figure1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>Category response curves of items 33 and 35 of the Four-Dimensional Symptom Questionnaire depression scale. The probability (y-axis) represents the chance of a certain response (0=never; 1=sometimes; 2=regularly, often, very often, or constantly) given a certain level of theta. Theta (x-axis) represents the underlying trait level; in this figure, depression. The abbreviation Pr is probability.</p>
          </caption>
          <graphic xlink:href="mental_v4i1e7_fig1.jpg" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Step 4: Differential Item Functioning</title>
        <p>For the depression, anxiety, and somatization subscales, no items showed DIF. The only item that showed significant and relevant uniform and non-uniform DIF was item 41 (“I quickly get emotional”) from the distress scale for the covariate gender.</p>
      </sec>
      <sec>
        <title>Step 5: Simulated Computerized Adaptive Testing</title>
        <p>The characteristics of the simulated CAT under different levels of measurement precision (allowing the standard error of the estimated underlying trait to gradually increase; stopping rule 1) are shown in <xref ref-type="table" rid="table1">Table 1</xref>. For each scale, the standard error of theta that was equal to the standard error of the full version scale is indicated. For example, the standard error of the full version scale of distress was 0.4. When allowing the standard error of theta to be at most 0.4, the mean number of items administered could be decreased from 16 to 6.3. The correlation between the distress level based on 6.3 items and the distress level based on all items was high (0.96). Comparable results were found for the three other scales. With the first stopping rule, we were able to reduce the mean number of items administered to 5 for depression (from 6), to 8.3 for anxiety (from 12), and to 12.9 for somatization (from 16), while correlations between CAT and full test scores remained high. Applying CAT with the first stopping rule to all four scales could reduce the total number of 4DSQ items from 50 to, on average, 34 items.</p>
        <table-wrap position="float" id="table1">
          <label>Table 1</label>
          <caption>
            <p>Mean number of items administered under varying levels of measurement precision and correlations between computerized adaptive testing scores and full version scores of the Four-Dimensional Symptom Questionnaire.</p>
          </caption>
          <table width="619" cellpadding="7" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="47"/>
            <col width="49"/>
            <col width="65"/>
            <col width="45"/>
            <col width="65"/>
            <col width="45"/>
            <col width="65"/>
            <col width="45"/>
            <col width="64"/>
            <thead>
              <tr valign="top">
                <td rowspan="2">Stopping rule</td>
                <td colspan="2">Distress</td>
                <td colspan="2">Depression</td>
                <td colspan="2">Anxiety</td>
                <td colspan="2">Somatization</td>
              </tr>
              <tr valign="top">
                <td>Number of items, mean (SD)</td>
                <td>Correlation<sup>a</sup></td>
                <td>Number of items, mean (SD)</td>
                <td>Correlation<sup>a</sup></td>
                <td>Number of items, mean (SD)</td>
                <td>Correlation<sup>a</sup></td>
                <td>Number of items, mean (SD)</td>
                <td>Correlation<sup>a</sup></td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>None</td>
                <td>16</td>
                <td>1.00</td>
                <td>6</td>
                <td>1.00</td>
                <td>12</td>
                <td>1.00</td>
                <td>16</td>
                <td>1.00</td>
              </tr>
              <tr valign="top">
                <td>SE<sup>b</sup> (θ)&#60;0.2</td>
                <td>15.7 (0.8)</td>
                <td>1</td>
                <td>5.7 (0.9)<sup>c</sup></td>
                <td>1<sup>c</sup></td>
                <td>12 (0)</td>
                <td>1</td>
                <td>16 (0)</td>
                <td>1</td>
              </tr>
              <tr valign="top">
                <td>SE (θ)&#60;0.3</td>
                <td>8.8 (4.5)</td>
                <td>0.98</td>
                <td>5.4 (1.2)</td>
                <td>0.99</td>
                <td>8.7 (4.3)<sup>c</sup></td>
                <td>0.97<sup>c</sup></td>
                <td>14 (0)</td>
                <td>0.97</td>
              </tr>
              <tr valign="top">
                <td>SE (θ)&#60;0.4</td>
                <td>6.3 (4.3)<sup>c</sup></td>
                <td>0.96<sup>c</sup></td>
                <td>5.0 (1.3)</td>
                <td>0.99</td>
                <td>8.3 (4.3)</td>
                <td>0.97</td>
                <td>12.9 (2.1)<sup>c</sup></td>
                <td>0.95<sup>c</sup></td>
              </tr>
              <tr valign="top">
                <td>SE (θ)&#60;0.5</td>
                <td>4.9 (3.8)</td>
                <td>0.92</td>
                <td>4.9 (1.4)</td>
                <td>0.99</td>
                <td>8.1 (4.4)</td>
                <td>0.97</td>
                <td>11.2 (4.9)</td>
                <td>0.95</td>
              </tr>
              <tr valign="top">
                <td>SE (θ)&#60;0.6</td>
                <td>4.1 (2.6)</td>
                <td>0.86</td>
                <td>4.6 (1.4)</td>
                <td>0.99</td>
                <td>5.9 (4.2)</td>
                <td>0.94</td>
                <td>7.5 (4.6)</td>
                <td>0.86</td>
              </tr>
              <tr valign="top">
                <td>SE (θ)&#60;0.7</td>
                <td>3.8 (2.5)</td>
                <td>0.84</td>
                <td>3.9 (1.3)</td>
                <td>0.97</td>
                <td>5.9 (4.1)</td>
                <td>0.94</td>
                <td>4.6 (3.4)</td>
                <td>0.73</td>
              </tr>
              <tr valign="top">
                <td>SE (θ)&#60;0.8</td>
                <td>3.7 (2.3)</td>
                <td>0.79</td>
                <td>3.9 (1.3)</td>
                <td>0.97</td>
                <td>5.6 (4.0)</td>
                <td>0.93</td>
                <td>4.6 (3.4)</td>
                <td>0.73</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table1fn1">
              <p><sup>a</sup>Correlation between CAT θ and complete test θ.</p>
            </fn>
            <fn id="table1fn2">
              <p><sup>b</sup>SE: standard error.</p>
            </fn>
            <fn id="table1fn3">
              <p><sup>c</sup>The standard error of theta (θ) is equal to the standard error of the full version scale.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <p>The results of combining the first stopping rule with the second stopping rule are shown in <xref ref-type="table" rid="table2">Table 2</xref>. For distress, the average number of items could be further decreased from 6.3 to 5, but the correlation also decreased from 0.96 to 0.79. Therefore, we did not apply the second stopping rule to this scale. For the three other scales, the average number of items could be decreased, while the correlation remained high. Overall, when applying the CAT with both stopping rules (except for distress), the 4DSQ could be reduced from 50 to 22 items.</p>
        <table-wrap position="float" id="table2">
          <label>Table 2</label>
          <caption>
            <p>Mean number of items administered and correlation with total estimated theta under one or two stopping rules.</p>
          </caption>
          <table width="619" cellpadding="7" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="54"/>
            <col width="45"/>
            <col width="65"/>
            <col width="45"/>
            <col width="65"/>
            <col width="45"/>
            <col width="65"/>
            <col width="45"/>
            <col width="64"/>
            <thead>
              <tr valign="top">
                <td rowspan="2">Stopping rule</td>
                <td colspan="2">Distress</td>
                <td colspan="2">Depression</td>
                <td colspan="2">Anxiety</td>
                <td colspan="2">Somatization</td>
              </tr>
              <tr valign="top">
                <td>Number of items, mean (SD)</td>
                <td>Correlation<sup>a</sup></td>
                <td>Number of items, mean (SD)</td>
                <td>Correlation<sup>a</sup></td>
                <td>Number of items, mean (SD)</td>
                <td>Correlation<sup>a</sup></td>
                <td>Number of items, mean (SD)</td>
                <td>Correlation<sup>a</sup></td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>None</td>
                <td>16</td>
                <td>1.00</td>
                <td>6</td>
                <td>1.00</td>
                <td>12</td>
                <td>1.00</td>
                <td>16</td>
                <td>1.00</td>
              </tr>
              <tr valign="top">
                <td>SE<sup>b</sup> (θ) = SE (full)</td>
                <td>6.3 (4.3)</td>
                <td>0.96</td>
                <td>5.4 (1.2)</td>
                <td>0.99</td>
                <td>8.7 (4.3)</td>
                <td>0.97</td>
                <td>12.9 (2.1)</td>
                <td>0.95</td>
              </tr>
              <tr valign="top">
                <td>Maximum items<sup>c</sup></td>
                <td>5.0 (2.1)</td>
                <td>0.79</td>
                <td>3.0 (0)</td>
                <td>0.96</td>
                <td>4.9 (1.4)</td>
                <td>0.92</td>
                <td>7.9 (0.3)</td>
                <td>0.92</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table2fn1">
              <p><sup>a</sup>Correlation between CAT θ and complete test θ.</p>
            </fn>
            <fn id="table2fn2">
              <p><sup>b</sup>SE: standard error.</p>
            </fn>
            <fn id="table2fn3">
              <p><sup>c</sup>Maximum items are determined by dividing the number of items by 2.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Principal Findings</title>
        <p>In summary, when applying CAT to the 4DSQ and applying two stopping rules to the anxiety, depression, and somatization subscales and one stopping rule to the distress subscale, the total number of items on the 4DSQ could be reduced by 56% on average (from 50 to 22 items), without losing a considerable amount of measurement precision.</p>
      </sec>
      <sec>
        <title>Interpretation</title>
        <p>Our simulation study showed that CAT may increase the efficiency of the 4DSQ and could reduce responders’ burden by more than 50%. These results were also found in other CAT studies, such as on the <italic>Center for Epidemiological Studies-Depression Scale</italic> (CES-D), where the total scale of 20 items could be reduced to 7 items [<xref ref-type="bibr" rid="ref23">23</xref>].</p>
        <p>Some CATs to measure anxiety and depression have already been used and evaluated in clinical (specialist) care [<xref ref-type="bibr" rid="ref24">24</xref>-<xref ref-type="bibr" rid="ref26">26</xref>]. These CATs appeared to be useful for longitudinal monitoring of symptoms, since they were as reliable over time as traditional questionnaires [<xref ref-type="bibr" rid="ref27">27</xref>].</p>
        <p>A CAT version of the 4DSQ seems especially useful in general practices, for example, as part of a broad online assessment to investigate the severity of psychological problems of patients. As the number of patients visiting their GP with mental health problems is increasing [<xref ref-type="bibr" rid="ref28">28</xref>], there is a growing need for an efficient screener for mental health problems. Many Dutch GPs already use the 4DSQ. An efficient, shortened 4DSQ could be combined with other mental health questionnaires, while keeping responders’ burden as low as possible. GPs have only limited time and often have to make important decisions about referring patients with mental health problems. An online severity assessment, ideally preceding the first consultation, could be helpful as a first quick evaluation on which to base further (treatment) decisions. Some GPs use the 4DSQ as an agenda-setting tool to talk about the psychological problems of their patients. An online assessment could fulfill the same agenda-setting function.</p>
        <p>However, some obstacles to the successful implementation of a CAT version of the 4DSQ in general practice exist. First, current information and communication technology (ICT) possibilities in general practices are insufficient for the implementation of CAT, which requires sophisticated statistical software. Second, it is not clear to what extent GPs are willing to implement a CAT version of the 4DSQ. GPs may use responses from individual 4DSQ items, such as item 47 or 48 on traumatic events, for a quick clinical evaluation, and this information may be lost when applying CAT. Lastly, it is not clear if CAT is appropriate for all patients. Previous research on CAT after inpatient rehabilitation suggests that it might only be feasible to collect (complete) data for a specific subset of patients [<xref ref-type="bibr" rid="ref29">29</xref>]. Some patients may prefer a paper-and-pencil version of a questionnaire to an online assessment. Although a CAT version of the 4DSQ might not be immediately available for use in clinical practice, some studies have already shown that CAT versions of traditional questionnaires can be used in a clinical setting [<xref ref-type="bibr" rid="ref24">24</xref>-<xref ref-type="bibr" rid="ref26">26</xref>] and are well accepted by patients [<xref ref-type="bibr" rid="ref25">25</xref>]. Recently developed, free-to-use online CAT platforms [<xref ref-type="bibr" rid="ref30">30</xref>,<xref ref-type="bibr" rid="ref31">31</xref>] are likely to enable the development of new CAT questionnaires. Moreover, some Dutch GPs have already been using an online screener to assess mental health problems, so application of a CAT version of the 4DSQ in clinical practice may be within reach.</p>
      </sec>
      <sec>
        <title>Strengths and Limitations</title>
        <p>As this was a simulation study, we used responses to a paper-and-pencil version of the 4DSQ. In reality, responders might behave differently when receiving a computerized adaptive assessment. For example, we do not know if the actual computer administration might influence responses or what effect differences in the item order may have. However, a previous study showed that differences between results from a simulation CAT and a real CAT were small [<xref ref-type="bibr" rid="ref32">32</xref>]. We used data from a sample from a northern region of the Netherlands; parameter estimates based on data from other regions or countries might differ.</p>
        <p>Regarding the psychometric evaluation, our data showed some weaknesses. For most items of the four subscales of the 4DSQ, the assumptions for an IRT analysis were met. The assumption of unidimensionality was not met perfectly for all four scales, although it nearly was. Moreover, some items showed other limitations, such as correlations between item pairs or differential item functioning. These items might be left out in future (real-time) CAT versions of the 4DSQ. As in other studies, we found relevant DIF for the item “emotionality” on the distress scale. Women tend to agree with this item more easily than men, even when they have a similar underlying level of distress. When looking at the individual responses to the CAT of the distress scale, the item “emotionality” was only administered to participants with a very low level of distress. This indicates that the DIF on this item does not bias the CAT outcomes, as this item is not informative enough to be included in the final CAT. When looking at the distribution and the CRC of some items of the anxiety and somatization scales, participants endorse either option 0 or options 1 to 2. Patients apparently have difficulties differentiating between response categories 1 and 2. This might be solved in future studies by grouping response options 1 and 2 for certain items, making them dichotomous.</p>
      </sec>
      <sec>
        <title>Conclusions</title>
        <p>Data from this simulation study in general agreed with assumptions needed for CAT. CAT seems useful for improving the efficiency of the 4DSQ by 56%, without losing a considerable amount of measurement precision. Of course, this simulation study is only the first step towards a CAT version of the 4DSQ that could be implemented in clinical practice and it should be followed by a study on a real-time CAT and eventually by an evaluation of the developed CAT version in a clinical setting.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group>
      <app id="app1">
        <title>Multimedia Appendix 1</title>
        <p>English version of the Four-Dimensional Symptom Questionnaire.</p>
        <media xlink:href="mental_v4i1e7_app1.pdf" xlink:title="PDF File (Adobe PDF File), 247KB"/>
      </app>
      <app id="app2">
        <title>Multimedia Appendix 2</title>
        <p>Descriptive statistics of items of the Four-Dimensional Symptom Questionnaire.</p>
        <media xlink:href="mental_v4i1e7_app2.pdf" xlink:title="PDF File (Adobe PDF File), 518KB"/>
      </app>
      <app id="app3">
        <title>Multimedia Appendix 3</title>
        <p>Graded response model parameter estimates of the Four-Dimensional Symptom Questionnaire.</p>
        <media xlink:href="mental_v4i1e7_app3.pdf" xlink:title="PDF File (Adobe PDF File), 525KB"/>
      </app>
    </app-group>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">4DSQ</term>
          <def>
            <p>Four-Dimensional Symptom Questionnaire</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">CAT</term>
          <def>
            <p>computerized adaptive testing</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">CRC</term>
          <def>
            <p>category response curve</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">CFA</term>
          <def>
            <p>confirmatory factor analysis</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">DIF</term>
          <def>
            <p>differential item functioning</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb6">GP</term>
          <def>
            <p>general practitioner</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb7">GRM</term>
          <def>
            <p>graded response model</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb8">IRT</term>
          <def>
            <p>item response theory</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb9">RMSEA</term>
          <def>
            <p>root mean square error of approximation</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>We would like to thank Marjolein Jansen and Thomas de Kok for their contributions to data collection.</p>
    </ack>
    <fn-group>
      <fn fn-type="con">
        <p>TM, DB, and PFV designed the study. TM and DB analyzed the data. All authors contributed to and approved the final manuscript.</p>
      </fn>
      <fn fn-type="conflict">
        <p>BT is the copyright owner of the 4DSQ and receives copyright fees from companies that use the 4DSQ on a commercial basis (the 4DSQ is freely available for non-commercial use in health care and research). BT received fees from various institutions for workshops on the application of the 4DSQ in primary care settings.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Zantinge</surname>
            <given-names>EM</given-names>
          </name>
          <name name-style="western">
            <surname>Verhaak</surname>
            <given-names>PF</given-names>
          </name>
          <name name-style="western">
            <surname>Kerssens</surname>
            <given-names>JJ</given-names>
          </name>
          <name name-style="western">
            <surname>Bensing</surname>
            <given-names>JM</given-names>
          </name>
        </person-group>
        <article-title>The workload of GPs: consultations of patients with psychological and somatic problems compared</article-title>
        <source>Br J Gen Pract</source>  
        <year>2005</year>  
        <month>08</month>  
        <volume>55</volume>  
        <issue>517</issue>  
        <fpage>609</fpage>  
        <lpage>14</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://bjgp.org/cgi/pmidlookup?view=long&#38;pmid=16105369"/>
        </comment>  
        <pub-id pub-id-type="medline">16105369</pub-id>
        <pub-id pub-id-type="pmcid">PMC1463219</pub-id></nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Hyde</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Evans</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Sharp</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Croudace</surname>
            <given-names>T</given-names>
          </name>
          <name name-style="western">
            <surname>Harrison</surname>
            <given-names>G</given-names>
          </name>
          <name name-style="western">
            <surname>Lewis</surname>
            <given-names>G</given-names>
          </name>
          <name name-style="western">
            <surname>Araya</surname>
            <given-names>R</given-names>
          </name>
        </person-group>
        <article-title>Deciding who gets treatment for depression and anxiety: a study of consecutive GP attenders</article-title>
        <source>Br J Gen Pract</source>  
        <year>2005</year>  
        <month>11</month>  
        <volume>55</volume>  
        <issue>520</issue>  
        <fpage>846</fpage>  
        <lpage>53</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://bjgp.org/cgi/pmidlookup?view=long&#38;pmid=16282000"/>
        </comment>  
        <pub-id pub-id-type="medline">16282000</pub-id>
        <pub-id pub-id-type="pmcid">PMC1570785</pub-id></nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="book">
        <person-group person-group-type="author">
          <collab>American Psychiatric Association</collab>
        </person-group>
        <source>Diagnostic and Statistical Manual of Mental Disorders, Fifth Edition</source>  
        <year>2013</year>  
        <publisher-loc>Washington, DC</publisher-loc>
        <publisher-name>American Psychiatric Association</publisher-name></nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Terluin</surname>
            <given-names>B</given-names>
          </name>
          <name name-style="western">
            <surname>van Marwijk</surname>
            <given-names>HW</given-names>
          </name>
          <name name-style="western">
            <surname>Adèr</surname>
            <given-names>HJ</given-names>
          </name>
          <name name-style="western">
            <surname>de Vet</surname>
            <given-names>HC</given-names>
          </name>
          <name name-style="western">
            <surname>Penninx</surname>
            <given-names>BW</given-names>
          </name>
          <name name-style="western">
            <surname>Hermens</surname>
            <given-names>ML</given-names>
          </name>
          <name name-style="western">
            <surname>van Boeijen</surname>
            <given-names>CA</given-names>
          </name>
          <name name-style="western">
            <surname>van Balkom</surname>
            <given-names>AJ</given-names>
          </name>
          <name name-style="western">
            <surname>van der Klink</surname>
            <given-names>JL</given-names>
          </name>
          <name name-style="western">
            <surname>Stalman</surname>
            <given-names>WA</given-names>
          </name>
        </person-group>
        <article-title>The Four-Dimensional Symptom Questionnaire (4DSQ): a validation study of a multidimensional self-report questionnaire to assess distress, depression, anxiety and somatization</article-title>
        <source>BMC Psychiatry</source>  
        <year>2006</year>  
        <month>08</month>  
        <day>22</day>  
        <volume>6</volume>  
        <fpage>34</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/16925825"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1186/1471-244X-6-34</pub-id>
        <pub-id pub-id-type="medline">16925825</pub-id>
        <pub-id pub-id-type="pii">1471-244X-6-34</pub-id>
        <pub-id pub-id-type="pmcid">PMC1590008</pub-id></nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Geraghty</surname>
            <given-names>AW</given-names>
          </name>
          <name name-style="western">
            <surname>Stuart</surname>
            <given-names>B</given-names>
          </name>
          <name name-style="western">
            <surname>Terluin</surname>
            <given-names>B</given-names>
          </name>
          <name name-style="western">
            <surname>Kendrick</surname>
            <given-names>T</given-names>
          </name>
          <name name-style="western">
            <surname>Little</surname>
            <given-names>P</given-names>
          </name>
          <name name-style="western">
            <surname>Moore</surname>
            <given-names>M</given-names>
          </name>
        </person-group>
        <article-title>Distinguishing between emotional distress and psychiatric disorder in primary care attenders: A cross sectional study of the four-dimensional symptom questionnaire (4DSQ)</article-title>
        <source>J Affect Disord</source>  
        <year>2015</year>  
        <month>09</month>  
        <day>15</day>  
        <volume>184</volume>  
        <fpage>198</fpage>  
        <lpage>204</lpage>  
        <pub-id pub-id-type="doi">10.1016/j.jad.2015.05.064</pub-id>
        <pub-id pub-id-type="medline">26099254</pub-id>
        <pub-id pub-id-type="pii">S0165-0327(15)00370-5</pub-id></nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Terluin</surname>
            <given-names>B</given-names>
          </name>
          <name name-style="western">
            <surname>Brouwers</surname>
            <given-names>EP</given-names>
          </name>
          <name name-style="western">
            <surname>van Marwijk</surname>
            <given-names>HW</given-names>
          </name>
          <name name-style="western">
            <surname>Verhaak</surname>
            <given-names>PF</given-names>
          </name>
          <name name-style="western">
            <surname>van der Horst</surname>
            <given-names>H</given-names>
          </name>
        </person-group>
        <article-title>Detecting depressive and anxiety disorders in distressed patients in primary care; comparative diagnostic accuracy of the Four-Dimensional Symptom Questionnaire (4DSQ) and the Hospital Anxiety and Depression Scale (HADS)</article-title>
        <source>BMC Fam Pract</source>  
        <year>2009</year>  
        <month>08</month>  
        <day>23</day>  
        <volume>10</volume>  
        <fpage>58</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="https://bmcfampract.biomedcentral.com/articles/10.1186/1471-2296-10-58"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1186/1471-2296-10-58</pub-id>
        <pub-id pub-id-type="medline">19698153</pub-id>
        <pub-id pub-id-type="pii">1471-2296-10-58</pub-id>
        <pub-id pub-id-type="pmcid">PMC2753335</pub-id></nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Terluin</surname>
            <given-names>B</given-names>
          </name>
          <name name-style="western">
            <surname>Oosterbaan</surname>
            <given-names>DB</given-names>
          </name>
          <name name-style="western">
            <surname>Brouwers</surname>
            <given-names>EP</given-names>
          </name>
          <name name-style="western">
            <surname>van Straten</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>van de Ven</surname>
            <given-names>PM</given-names>
          </name>
          <name name-style="western">
            <surname>Langerak</surname>
            <given-names>W</given-names>
          </name>
          <name name-style="western">
            <surname>van Marwijk</surname>
            <given-names>HW</given-names>
          </name>
        </person-group>
        <article-title>To what extent does the anxiety scale of the Four-Dimensional Symptom Questionnaire (4DSQ) detect specific types of anxiety disorder in primary care? A psychometric study</article-title>
        <source>BMC Psychiatry</source>  
        <year>2014</year>  
        <month>04</month>  
        <day>24</day>  
        <volume>14</volume>  
        <fpage>121</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/24761829"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1186/1471-244X-14-121</pub-id>
        <pub-id pub-id-type="medline">24761829</pub-id>
        <pub-id pub-id-type="pii">1471-244X-14-121</pub-id>
        <pub-id pub-id-type="pmcid">PMC4006959</pub-id></nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Reeve</surname>
            <given-names>BB</given-names>
          </name>
          <name name-style="western">
            <surname>Hays</surname>
            <given-names>RD</given-names>
          </name>
          <name name-style="western">
            <surname>Bjorner</surname>
            <given-names>JB</given-names>
          </name>
          <name name-style="western">
            <surname>Cook</surname>
            <given-names>KF</given-names>
          </name>
          <name name-style="western">
            <surname>Crane</surname>
            <given-names>PK</given-names>
          </name>
          <name name-style="western">
            <surname>Teresi</surname>
            <given-names>JA</given-names>
          </name>
          <name name-style="western">
            <surname>Thissen</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Revicki</surname>
            <given-names>DA</given-names>
          </name>
          <name name-style="western">
            <surname>Weiss</surname>
            <given-names>DJ</given-names>
          </name>
          <name name-style="western">
            <surname>Hambleton</surname>
            <given-names>RK</given-names>
          </name>
          <name name-style="western">
            <surname>Liu</surname>
            <given-names>H</given-names>
          </name>
          <name name-style="western">
            <surname>Gershon</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Reise</surname>
            <given-names>SP</given-names>
          </name>
          <name name-style="western">
            <surname>Lai</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Cella</surname>
            <given-names>D</given-names>
          </name>
        </person-group>
        <article-title>Psychometric evaluation and calibration of health-related quality of life item banks: plans for the Patient-Reported Outcomes Measurement Information System (PROMIS)</article-title>
        <source>Med Care</source>  
        <year>2007</year>  
        <month>05</month>  
        <volume>45</volume>  
        <issue>5 Suppl 1</issue>  
        <fpage>S22</fpage>  
        <lpage>31</lpage>  
        <pub-id pub-id-type="doi">10.1097/01.mlr.0000250483.85507.04</pub-id>
        <pub-id pub-id-type="medline">17443115</pub-id>
        <pub-id pub-id-type="pii">00005650-200705001-00004</pub-id></nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="book">
        <person-group person-group-type="editor">
          <name name-style="western">
            <surname>van der Linden</surname>
            <given-names>WJ</given-names>
          </name>
          <name name-style="western">
            <surname>Hambleton</surname>
            <given-names>RK</given-names>
          </name>
        </person-group>
        <source>Handbook of Modern Item Response Theory</source>  
        <year>1997</year>  
        <publisher-loc>New York</publisher-loc>
        <publisher-name>Springer</publisher-name></nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Smits</surname>
            <given-names>N</given-names>
          </name>
          <name name-style="western">
            <surname>Cuijpers</surname>
            <given-names>P</given-names>
          </name>
          <name name-style="western">
            <surname>van Straten</surname>
            <given-names>A</given-names>
          </name>
        </person-group>
        <article-title>Applying computerized adaptive testing to the CES-D scale: a simulation study</article-title>
        <source>Psychiatry Res</source>  
        <year>2011</year>  
        <month>06</month>  
        <day>30</day>  
        <volume>188</volume>  
        <issue>1</issue>  
        <fpage>147</fpage>  
        <lpage>55</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S0165-1781(10)00769-9"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1016/j.psychres.2010.12.001</pub-id>
        <pub-id pub-id-type="medline">21208660</pub-id>
        <pub-id pub-id-type="pii">S0165-1781(10)00769-9</pub-id></nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Gardner</surname>
            <given-names>W</given-names>
          </name>
          <name name-style="western">
            <surname>Shear</surname>
            <given-names>K</given-names>
          </name>
          <name name-style="western">
            <surname>Kelleher</surname>
            <given-names>KJ</given-names>
          </name>
          <name name-style="western">
            <surname>Pajer</surname>
            <given-names>KA</given-names>
          </name>
          <name name-style="western">
            <surname>Mammen</surname>
            <given-names>O</given-names>
          </name>
          <name name-style="western">
            <surname>Buysse</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Frank</surname>
            <given-names>E</given-names>
          </name>
        </person-group>
        <article-title>Computerized adaptive measurement of depression: a simulation study</article-title>
        <source>BMC Psychiatry</source>  
        <year>2004</year>  
        <month>05</month>  
        <day>06</day>  
        <volume>4</volume>  
        <fpage>13</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/15132755"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1186/1471-244X-4-13</pub-id>
        <pub-id pub-id-type="medline">15132755</pub-id>
        <pub-id pub-id-type="pii">1471-244X-4-13</pub-id>
        <pub-id pub-id-type="pmcid">PMC416483</pub-id></nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>De Beurs</surname>
            <given-names>DP</given-names>
          </name>
          <name name-style="western">
            <surname>de Vries</surname>
            <given-names>AL</given-names>
          </name>
          <name name-style="western">
            <surname>de Groot</surname>
            <given-names>MH</given-names>
          </name>
          <name name-style="western">
            <surname>de Keijser</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Kerkhof</surname>
            <given-names>AJ</given-names>
          </name>
        </person-group>
        <article-title>Applying computer adaptive testing to optimize online assessment of suicidal behavior: a simulation study</article-title>
        <source>J Med Internet Res</source>  
        <year>2014</year>  
        <month>09</month>  
        <day>11</day>  
        <volume>16</volume>  
        <issue>9</issue>  
        <fpage>e207</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.jmir.org/2014/9/e207/"/>
        </comment>  
        <pub-id pub-id-type="doi">10.2196/jmir.3511</pub-id>
        <pub-id pub-id-type="medline">25213259</pub-id>
        <pub-id pub-id-type="pii">v16i9e207</pub-id>
        <pub-id pub-id-type="pmcid">PMC4180339</pub-id></nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Flens</surname>
            <given-names>G</given-names>
          </name>
          <name name-style="western">
            <surname>Smits</surname>
            <given-names>N</given-names>
          </name>
          <name name-style="western">
            <surname>Carlier</surname>
            <given-names>I</given-names>
          </name>
          <name name-style="western">
            <surname>van Hemert</surname>
            <given-names>AM</given-names>
          </name>
          <name name-style="western">
            <surname>de Beurs</surname>
            <given-names>E</given-names>
          </name>
        </person-group>
        <article-title>Simulating computer adaptive testing with the Mood and Anxiety Symptom Questionnaire</article-title>
        <source>Psychol Assess</source>  
        <year>2016</year>  
        <month>08</month>  
        <volume>28</volume>  
        <issue>8</issue>  
        <fpage>953</fpage>  
        <lpage>62</lpage>  
        <pub-id pub-id-type="doi">10.1037/pas0000240</pub-id>
        <pub-id pub-id-type="medline">26691506</pub-id>
        <pub-id pub-id-type="pii">2015-57071-001</pub-id></nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Gardner</surname>
            <given-names>W</given-names>
          </name>
          <name name-style="western">
            <surname>Kelleher</surname>
            <given-names>KJ</given-names>
          </name>
          <name name-style="western">
            <surname>Pajer</surname>
            <given-names>KA</given-names>
          </name>
        </person-group>
        <article-title>Multidimensional adaptive testing for mental health problems in primary care</article-title>
        <source>Med Care</source>  
        <year>2002</year>  
        <month>09</month>  
        <volume>40</volume>  
        <issue>9</issue>  
        <fpage>812</fpage>  
        <lpage>23</lpage>  
        <pub-id pub-id-type="doi">10.1097/01.MLR.0000025436.30093.77</pub-id>
        <pub-id pub-id-type="medline">12218771</pub-id></nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="web">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Samejima</surname>
            <given-names>F</given-names>
          </name>
        </person-group>
        <source>Estimation of Latent Ability Using a Response Pattern of Graded Scores</source>  
        <year>1969</year>  
        <access-date>2017-02-11</access-date>
        <publisher-loc>Richmond, VA</publisher-loc>
        <publisher-name>Psychometric Society</publisher-name>
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.psychometricsociety.org/sites/default/files/pdf/MN17.pdf">http://www.psychometricsociety.org/sites/default/files/pdf/MN17.pdf</ext-link>
          <ext-link ext-link-type="webcite" xlink:href="6oCHoFl4P"/>
        </comment> </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="book">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Embretson</surname>
            <given-names>SE</given-names>
          </name>
          <name name-style="western">
            <surname>Reise</surname>
            <given-names>SP</given-names>
          </name>
        </person-group>
        <source>Item Response Theory for Psychologists</source>  
        <year>2000</year>  
        <publisher-loc>Hove, UK</publisher-loc>
        <publisher-name>Psychology Press</publisher-name></nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Young</surname>
            <given-names>MA</given-names>
          </name>
          <name name-style="western">
            <surname>Halper</surname>
            <given-names>I</given-names>
          </name>
          <name name-style="western">
            <surname>Clark</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Scheftner</surname>
            <given-names>W</given-names>
          </name>
          <name name-style="western">
            <surname>Fawcett</surname>
            <given-names>J</given-names>
          </name>
        </person-group>
        <article-title>An item-response theory evaluation of the Beck Hopelessness Scale</article-title>
        <source>Cogn Ther Res</source>  
        <year>1992</year>  
        <month>10</month>  
        <volume>16</volume>  
        <issue>5</issue>  
        <fpage>579</fpage>  
        <lpage>587</lpage>  
        <pub-id pub-id-type="doi">10.1007/BF01175143</pub-id></nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="web">
        <source>The Comprehensive R Archive Network</source>  
        <year>2009</year>  
        <access-date>2017-02-11</access-date>
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://cran.r-project.org/">http://cran.r-project.org/</ext-link>
          <ext-link ext-link-type="webcite" xlink:href="6oCI04qc1"/>
        </comment> </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Rosseel</surname>
            <given-names>Y</given-names>
          </name>
        </person-group>
        <article-title>lavaan: An R package for structural equation modeling</article-title>
        <source>J Stat Softw</source>  
        <year>2012</year>  
        <volume>48</volume>  
        <issue>2</issue>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.jstatsoft.org/v48/i02/paper"/>
        </comment> </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Van der Ark</surname>
            <given-names>LA</given-names>
          </name>
        </person-group>
        <article-title>Mokken scale analysis in R</article-title>
        <source>J Stat Softw</source>  
        <year>2007</year>  
        <volume>20</volume>  
        <issue>11</issue>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.jstatsoft.org/v20/i11/paper"/>
        </comment> </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Choi</surname>
            <given-names>SW</given-names>
          </name>
          <name name-style="western">
            <surname>Gibbons</surname>
            <given-names>LE</given-names>
          </name>
          <name name-style="western">
            <surname>Crane</surname>
            <given-names>PK</given-names>
          </name>
        </person-group>
        <article-title>lordif: An R package for detecting differential item functioning using iterative hybrid ordinal logistic regression/item response theory and Monte Carlo simulations</article-title>
        <source>J Stat Softw</source>  
        <year>2011</year>  
        <month>03</month>  
        <day>01</day>  
        <volume>39</volume>  
        <issue>8</issue>  
        <fpage>1</fpage>  
        <lpage>30</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/21572908"/>
        </comment>  
        <pub-id pub-id-type="medline">21572908</pub-id>
        <pub-id pub-id-type="pmcid">PMC3093114</pub-id></nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="web">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Nydick</surname>
            <given-names>SW</given-names>
          </name>
        </person-group>
        <source>Package CATIRT</source>  
        <year>2014</year>  
        <month>04</month>  
        <day>02</day>  
        <access-date>2017-02-11</access-date>
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://cran.r-project.org/web/packages/catIrt/catIrt.pdf">http://cran.r-project.org/web/packages/catIrt/catIrt.pdf</ext-link>
          <ext-link ext-link-type="webcite" xlink:href="6oCIO742h"/>
        </comment> </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Smits</surname>
            <given-names>N</given-names>
          </name>
          <name name-style="western">
            <surname>Zitman</surname>
            <given-names>FG</given-names>
          </name>
          <name name-style="western">
            <surname>Cuijpers</surname>
            <given-names>P</given-names>
          </name>
          <name name-style="western">
            <surname>den Hollander-Gijsman</surname>
            <given-names>ME</given-names>
          </name>
          <name name-style="western">
            <surname>Carlier</surname>
            <given-names>IV</given-names>
          </name>
        </person-group>
        <article-title>A proof of principle for using adaptive testing in routine outcome monitoring: the efficiency of the Mood and Anxiety Symptoms Questionnaire-Anhedonic Depression CAT</article-title>
        <source>BMC Med Res Methodol</source>  
        <year>2012</year>  
        <month>01</month>  
        <day>10</day>  
        <volume>12</volume>  
        <fpage>4</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="https://bmcmedresmethodol.biomedcentral.com/articles/10.1186/1471-2288-12-4"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1186/1471-2288-12-4</pub-id>
        <pub-id pub-id-type="medline">22233260</pub-id>
        <pub-id pub-id-type="pii">1471-2288-12-4</pub-id>
        <pub-id pub-id-type="pmcid">PMC3317818</pub-id></nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Becker</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Fliege</surname>
            <given-names>H</given-names>
          </name>
          <name name-style="western">
            <surname>Kocalevent</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Bjorner</surname>
            <given-names>JB</given-names>
          </name>
          <name name-style="western">
            <surname>Rose</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Walter</surname>
            <given-names>OB</given-names>
          </name>
          <name name-style="western">
            <surname>Klapp</surname>
            <given-names>BF</given-names>
          </name>
        </person-group>
        <article-title>Functioning and validity of a Computerized Adaptive Test to measure anxiety (A-CAT)</article-title>
        <source>Depress Anxiety</source>  
        <year>2008</year>  
        <volume>25</volume>  
        <issue>12</issue>  
        <fpage>E182</fpage>  
        <lpage>94</lpage>  
        <pub-id pub-id-type="doi">10.1002/da.20482</pub-id>
        <pub-id pub-id-type="medline">18979458</pub-id></nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Fliege</surname>
            <given-names>H</given-names>
          </name>
          <name name-style="western">
            <surname>Becker</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Walter</surname>
            <given-names>OB</given-names>
          </name>
          <name name-style="western">
            <surname>Rose</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Bjorner</surname>
            <given-names>JB</given-names>
          </name>
          <name name-style="western">
            <surname>Klapp</surname>
            <given-names>BF</given-names>
          </name>
        </person-group>
        <article-title>Evaluation of a computer-adaptive test for the assessment of depression (D-CAT) in clinical application</article-title>
        <source>Int J Methods Psychiatr Res</source>  
        <year>2009</year>  
        <volume>18</volume>  
        <issue>1</issue>  
        <fpage>23</fpage>  
        <lpage>36</lpage>  
        <pub-id pub-id-type="doi">10.1002/mpr.274</pub-id>
        <pub-id pub-id-type="medline">19194856</pub-id></nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Walter</surname>
            <given-names>OB</given-names>
          </name>
          <name name-style="western">
            <surname>Becker</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Bjorner</surname>
            <given-names>JB</given-names>
          </name>
          <name name-style="western">
            <surname>Fliege</surname>
            <given-names>H</given-names>
          </name>
          <name name-style="western">
            <surname>Klapp</surname>
            <given-names>BF</given-names>
          </name>
          <name name-style="western">
            <surname>Rose</surname>
            <given-names>M</given-names>
          </name>
        </person-group>
        <article-title>Development and evaluation of a computer adaptive test for 'Anxiety' (Anxiety-CAT)</article-title>
        <source>Qual Life Res</source>  
        <year>2007</year>  
        <volume>16 Suppl 1</volume>  
        <fpage>143</fpage>  
        <lpage>55</lpage>  
        <pub-id pub-id-type="doi">10.1007/s11136-007-9191-7</pub-id>
        <pub-id pub-id-type="medline">17342455</pub-id></nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Devine</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Fliege</surname>
            <given-names>H</given-names>
          </name>
          <name name-style="western">
            <surname>Kocalevent</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Mierke</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Klapp</surname>
            <given-names>BF</given-names>
          </name>
          <name name-style="western">
            <surname>Rose</surname>
            <given-names>M</given-names>
          </name>
        </person-group>
        <article-title>Evaluation of Computerized Adaptive Tests (CATs) for longitudinal monitoring of depression, anxiety, and stress reactions</article-title>
        <source>J Affect Disord</source>  
        <year>2016</year>  
        <month>01</month>  
        <day>15</day>  
        <volume>190</volume>  
        <fpage>846</fpage>  
        <lpage>53</lpage>  
        <pub-id pub-id-type="doi">10.1016/j.jad.2014.10.063</pub-id>
        <pub-id pub-id-type="medline">25481813</pub-id>
        <pub-id pub-id-type="pii">S0165-0327(14)00695-8</pub-id></nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Magnée</surname>
            <given-names>T</given-names>
          </name>
          <name name-style="western">
            <surname>de Beurs</surname>
            <given-names>DP</given-names>
          </name>
          <name name-style="western">
            <surname>de Bakker</surname>
            <given-names>DH</given-names>
          </name>
          <name name-style="western">
            <surname>Verhaak</surname>
            <given-names>PF</given-names>
          </name>
        </person-group>
        <article-title>Consultations in general practices with and without mental health nurses: an observational study from 2010 to 2014</article-title>
        <source>BMJ Open</source>  
        <year>2016</year>  
        <month>07</month>  
        <day>18</day>  
        <volume>6</volume>  
        <issue>7</issue>  
        <fpage>e011579</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://bmjopen.bmj.com/cgi/pmidlookup?view=long&#38;pmid=27431902"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1136/bmjopen-2016-011579</pub-id>
        <pub-id pub-id-type="medline">27431902</pub-id>
        <pub-id pub-id-type="pii">bmjopen-2016-011579</pub-id>
        <pub-id pub-id-type="pmcid">PMC4964169</pub-id></nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Wong</surname>
            <given-names>AW</given-names>
          </name>
          <name name-style="western">
            <surname>Heinemann</surname>
            <given-names>AW</given-names>
          </name>
          <name name-style="western">
            <surname>Miskovic</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Semik</surname>
            <given-names>P</given-names>
          </name>
          <name name-style="western">
            <surname>Snyder</surname>
            <given-names>TM</given-names>
          </name>
        </person-group>
        <article-title>Feasibility of computerized adaptive testing for collection of patient-reported outcomes after inpatient rehabilitation</article-title>
        <source>Arch Phys Med Rehabil</source>  
        <year>2014</year>  
        <month>05</month>  
        <volume>95</volume>  
        <issue>5</issue>  
        <fpage>882</fpage>  
        <lpage>91</lpage>  
        <pub-id pub-id-type="doi">10.1016/j.apmr.2013.12.024</pub-id>
        <pub-id pub-id-type="medline">24440363</pub-id>
        <pub-id pub-id-type="pii">S0003-9993(14)00009-4</pub-id></nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="web">
        <person-group person-group-type="author">
          <collab>Psychometrics Centre</collab>
        </person-group>
        <source>Concerto Adaptive Testing Platform</source>  
        <year>2013</year>  
        <access-date>2017-02-11</access-date>
        <publisher-loc>Cambridge</publisher-loc>
        <publisher-name>University of Cambridge</publisher-name>
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.psychometrics.cam.ac.uk/newconcerto">http://www.psychometrics.cam.ac.uk/newconcerto</ext-link>
          <ext-link ext-link-type="webcite" xlink:href="6oCHXdFO6"/>
        </comment> </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="web">
        <source>PROMIS Assessment Center</source>  
        <access-date>2017-02-11</access-date>
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="https://www.assessmentcenter.net/">https://www.assessmentcenter.net/</ext-link>
          <ext-link ext-link-type="webcite" xlink:href="6oCHetK5j"/>
        </comment> </nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Kocalevent</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Rose</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Becker</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Walter</surname>
            <given-names>OB</given-names>
          </name>
          <name name-style="western">
            <surname>Fliege</surname>
            <given-names>H</given-names>
          </name>
          <name name-style="western">
            <surname>Bjorner</surname>
            <given-names>JB</given-names>
          </name>
          <name name-style="western">
            <surname>Kleiber</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Klapp</surname>
            <given-names>BF</given-names>
          </name>
        </person-group>
        <article-title>An evaluation of patient-reported outcomes found computerized adaptive testing was efficient in assessing stress perception</article-title>
        <source>J Clin Epidemiol</source>  
        <year>2009</year>  
        <month>03</month>  
        <volume>62</volume>  
        <issue>3</issue>  
        <fpage>278</fpage>  
        <lpage>87, 287.e1</lpage>  
        <pub-id pub-id-type="doi">10.1016/j.jclinepi.2008.03.003</pub-id>
        <pub-id pub-id-type="medline">18639439</pub-id>
        <pub-id pub-id-type="pii">S0895-4356(08)00090-5</pub-id></nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
