<?xml version="1.0" encoding="utf-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMH</journal-id>
      <journal-id journal-id-type="nlm-ta">JMIR Ment Health</journal-id>
      <journal-title>JMIR Mental Health</journal-title>
      <issn pub-type="epub">2368-7959</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
    <article-id pub-id-type="publisher-id">v4i3e36</article-id>
    <article-id pub-id-type="pmid">28877861</article-id>
    <article-id pub-id-type="doi">10.2196/mental.6805</article-id>
    <article-categories>
      <subj-group subj-group-type="heading">
        <subject>Original Paper</subject>
      </subj-group>
      <subj-group subj-group-type="article-type">
        <subject>Original Paper</subject>
      </subj-group>
    </article-categories>
    <title-group>
      <article-title>Assessing the Equivalence of Paper, Mobile Phone, and Tablet Survey Responses at a Community Mental Health Center Using Equivalent Halves of a ‘Gold-Standard’ Depression Item Bank</article-title>
    </title-group>
    <contrib-group>
      <contrib contrib-type="editor">
        <name>
          <surname>Calvo</surname>
          <given-names>Rafael</given-names>
        </name>
      </contrib>
      <contrib contrib-type="editor">
        <name>
          <surname>Eysenbach</surname>
          <given-names>Gunther</given-names>
        </name>
      </contrib>
    </contrib-group>
    <contrib-group>
      <contrib contrib-type="reviewer">
        <name>
          <surname>Liegl</surname>
          <given-names>Gregor</given-names>
        </name>
      </contrib>
      <contrib contrib-type="reviewer">
        <name>
          <surname>Torous</surname>
          <given-names>John</given-names>
        </name>
      </contrib>
    </contrib-group>
    <contrib-group>
      <contrib contrib-type="author" id="contrib1" corresp="yes">
      <name name-style="western">
        <surname>Brodey</surname>
        <given-names>Benjamin B</given-names>
      </name>
      <degrees>MPH, MD</degrees>
      <xref rid="aff1" ref-type="aff">1</xref>
      <address>
        <institution>TeleSage, Inc.</institution>
        <addr-line>201 E Rosemary Street</addr-line>
        <addr-line>Chapel Hill, NC, 27514</addr-line>
        <country>United States</country>
        <phone>1 886 942 8849</phone>
        <fax>1 919 942 0036</fax>
        <email>bb@telesage.com</email>
      </address>  
      <ext-link ext-link-type="orcid">http://orcid.org/0000-0003-2146-8270</ext-link></contrib>
      <contrib contrib-type="author" id="contrib2">
        <name name-style="western">
          <surname>Gonzalez</surname>
          <given-names>Nicole L</given-names>
        </name>
        <degrees>BS Public Health</degrees>
        <xref rid="aff1" ref-type="aff">1</xref>
        <ext-link ext-link-type="orcid">http://orcid.org/0000-0003-1768-3576</ext-link>
      </contrib>
      <contrib contrib-type="author" id="contrib3">
        <name name-style="western">
          <surname>Elkin</surname>
          <given-names>Kathryn Ann</given-names>
        </name>
        <degrees>BS Psychology</degrees>
        <xref rid="aff1" ref-type="aff">1</xref>
        <ext-link ext-link-type="orcid">http://orcid.org/0000-0002-6898-3141</ext-link>
      </contrib>
      <contrib contrib-type="author" id="contrib4">
        <name name-style="western">
          <surname>Sasiela</surname>
          <given-names>W Jordan</given-names>
        </name>
        <degrees>BS Psychology</degrees>
        <xref rid="aff1" ref-type="aff">1</xref>
        <ext-link ext-link-type="orcid">http://orcid.org/0000-0002-1284-3385</ext-link>
      </contrib>
      <contrib contrib-type="author" id="contrib5">
        <name name-style="western">
          <surname>Brodey</surname>
          <given-names>Inger S</given-names>
        </name>
        <degrees>PhD</degrees>
        <xref rid="aff1" ref-type="aff">1</xref>
        <ext-link ext-link-type="orcid">http://orcid.org/0000-0001-6532-0265</ext-link>
      </contrib>
    </contrib-group>
    <aff id="aff1">
      <sup>1</sup>
      <institution>TeleSage, Inc.</institution>
      <addr-line>Chapel Hill, NC</addr-line>
      <country>United States</country>
    </aff>
    <author-notes>
      <corresp>Corresponding Author: Benjamin B Brodey 
      <email>bb@telesage.com</email></corresp>
    </author-notes>
    <pub-date pub-type="collection"><season>Jul-Sep</season><year>2017</year></pub-date>
    <pub-date pub-type="epub">
      <day>06</day>
      <month>09</month>
      <year>2017</year>
    </pub-date>
    <volume>4</volume>
    <issue>3</issue>
    <elocation-id>e36</elocation-id>
    <!--history from ojs - api-xml-->
    <history>
      <date date-type="received">
        <day>14</day>
        <month>10</month>
        <year>2016</year>
      </date>
      <date date-type="rev-request">
        <day>28</day>
        <month>11</month>
        <year>2016</year>
      </date>
      <date date-type="rev-recd">
        <day>16</day>
        <month>6</month>
        <year>2017</year>
      </date>
      <date date-type="accepted">
        <day>3</day>
        <month>8</month>
        <year>2017</year>
      </date>
    </history>
    <!--(c) the authors - correct author names and publication date here if necessary. Date in form ', dd.mm.yyyy' after jmir.org-->
    <copyright-statement>©Benjamin B Brodey, Nicole L Gonzalez, Kathryn Ann Elkin, W Jordan Sasiela, Inger S Brodey. Originally published in JMIR Mental Health (http://mental.jmir.org), 06.09.2017.</copyright-statement>
    <copyright-year>2017</copyright-year>
    <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
      <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Mental Health, is properly cited. The complete bibliographic information, a link to the original publication on http://mental.jmir.org/, as well as this copyright and license information must be included.</p>
    </license>  
    <self-uri xlink:href="http://mental.jmir.org/2017/3/e36/" xlink:type="simple"/>
    <abstract>
      <sec sec-type="background">
        <title>Background</title>
        <p>The computerized administration of self-report psychiatric diagnostic and outcomes assessments has risen in popularity. If results are similar enough across different administration modalities, then new administration technologies can be used interchangeably and the choice of technology can be based on other factors, such as convenience in the study design. An assessment based on item response theory (IRT), such as the Patient-Reported Outcomes Measurement Information System (PROMIS) depression item bank, offers new possibilities for assessing the effect of technology choice upon results.</p>
      </sec>
      <sec sec-type="objective">
        <title>Objective</title>
        <p>To create equivalent halves of the PROMIS depression item bank and to use these halves to compare survey responses and user satisfaction among administration modalities—paper, mobile phone, or tablet—with a community mental health care population.</p>
      </sec>
      <sec sec-type="methods">
        <title>Methods</title>
        <p>The 28 PROMIS depression items were divided into 2 halves based on content and simulations with an established PROMIS response data set. A total of 129 participants were recruited from an outpatient public sector mental health clinic based in Memphis. All participants took both nonoverlapping halves of the PROMIS IRT-based depression items (Part A and Part B): once using paper and pencil, and once using either a mobile phone or tablet. An 8-cell randomization was done on technology used, order of technologies used, and order of PROMIS Parts A and B. Both Parts A and B were administered as fixed-length assessments and both were scored using published PROMIS IRT parameters and algorithms.</p>
      </sec>
      <sec sec-type="results">
        <title>Results</title>
        <p>All 129 participants received either Part A or B via paper assessment. Participants were also administered the opposite assessment, 63 using a mobile phone and 66 using a tablet. There was no significant difference in item response scores for Part A versus B. All 3 of the technologies yielded essentially identical assessment results and equivalent satisfaction levels.</p>
      </sec>
      <sec sec-type="conclusions">
        <title>Conclusions</title>
        <p>Our findings show that the PROMIS depression assessment can be divided into 2 equivalent halves, with the potential to simplify future experimental methodologies. Among community mental health care recipients, the PROMIS items function similarly whether administered via paper, tablet, or mobile phone. User satisfaction across modalities was also similar. Because paper, tablet, and mobile phone administrations yielded similar results, the choice of technology should be based on factors such as convenience and can even be changed during a study without adversely affecting the comparability of results.</p>
      </sec>
    </abstract>
    <kwd-group>
      <kwd>mobile phone</kwd>
      <kwd>tablet</kwd>
      <kwd>PROMIS</kwd>
      <kwd>depression</kwd>
      <kwd>item response theory</kwd>
      <kwd>outcomes tracking</kwd>
      <kwd>PORTAL</kwd>
      <kwd>TeleSage</kwd>
      <kwd>behavioral health</kwd>
      <kwd>special issue on computing and mental health</kwd>
    </kwd-group></article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <p>As Internet and electronic survey administration technologies have shown many advantages and benefits relative to paper forms, computerized administrations of diagnostic and outcome measures have grown in popularity [<xref ref-type="bibr" rid="ref1">1</xref>]. Recent studies have shown that participants often prefer the electronic version of an assessment to traditional paper surveys [<xref ref-type="bibr" rid="ref2">2</xref>,<xref ref-type="bibr" rid="ref3">3</xref>]. Additionally, electronic data entry has been shown to minimize errors that occur during traditional paper data collection [<xref ref-type="bibr" rid="ref1">1</xref>,<xref ref-type="bibr" rid="ref4">4</xref>]. In many situations, however, patients and research participants alternate between paper and electronic data collection (EDC) mediums as needed, such as when certain parts of a facility differ with regard to wireless connectivity, or when it is unknown what device an end-user may use to complete a survey sent as a link in an email. In cases such as these, researchers need to know whether the administration technology meaningfully affects results and whether these technologies can be used interchangeably within a single study. If administration method does not significantly impact assessment results and user satisfaction, the least expensive, most user-friendly, or most convenient form of administration technology can be employed without risk of jeopardizing assessment validity.</p>
      <p>Several authors have provided evidence that the results of assessments administered via EDC methods are equivalent to results of those administered via the traditional paper-and-pencil method [<xref ref-type="bibr" rid="ref1">1</xref>-<xref ref-type="bibr" rid="ref3">3</xref>,<xref ref-type="bibr" rid="ref5">5</xref>-<xref ref-type="bibr" rid="ref9">9</xref>]. Additionally, a 2008 meta-analysis found equivalence between paper- and computer-administered self-report assessments [<xref ref-type="bibr" rid="ref10">10</xref>]. Similar to prior research, this study investigates whether results of self-report assessment differ based on mode of administration; however, this study improves upon past research in several ways.</p>
      <p>First, many studies have used a test-retest design, using the same items or instrument for both assessment periods [<xref ref-type="bibr" rid="ref5">5</xref>,<xref ref-type="bibr" rid="ref7">7</xref>-<xref ref-type="bibr" rid="ref9">9</xref>]. This can be problematic because if the same items are administered sequentially, results may be impacted by a lingering memory effect. Furthermore, when time-delay methods are used to decrease this memory effect, it is not possible to determine whether changes in response are due to changes in modality or changes in symptoms over time. This study provides a method for overcoming these challenges.</p>
      <p>A second way that this study improves upon past research in the field is in regard to psychometric equivalence versus face validity equivalence. Previous research has been done using the Patient-Reported Outcomes Measurement Information System (PROMIS) depression item bank (the same items that are used in the current study), which demonstrated the psychometric reliability and validity of these items [<xref ref-type="bibr" rid="ref2">2</xref>]. While it is true that any 2 sets of items drawn at random from the PROMIS depression item bank should be psychometrically equivalent, clinicians rely on constellations of symptoms to diagnose and understand psychiatric disorders. Thus, from a clinical perspective, it is necessary to have equivalence on the symptom level, as well as psychometrically.</p>
      <p>To address both of these concerns, this study created 2 psychometrically equivalent halves of the PROMIS depression item bank. The 2 halves (called Form A and Form B) had no overlapping questions, which eliminated the risk of lingering memory effects within participants. Additionally, to the greatest extent possible, the halves were created to assess similar depression symptoms, which is crucial for an assessment to have clinical significance. We hypothesize that the within-person validity of assessment will be similar across administration modality.</p>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Item Set Generation</title>
        <p>The PROMIS depression item bank is a set of 28 self-report items that use a Likert-scale with 5 options that range from “Never” to “Always” indicating how often the patient experiences each symptom [<xref ref-type="bibr" rid="ref11">11</xref>]. Item response theory (IRT) parameters have been established for the PROMIS items using the graded response model (GRM) [<xref ref-type="bibr" rid="ref12">12</xref>]. IRT parameters describe the probability of a given response to an item as a function of the respondent’s true standing on a trait or domain (for an overview of IRT and its importance in the field of psychiatry, see Yang and Kao [<xref ref-type="bibr" rid="ref13">13</xref>]). Thus, IRT allows for estimation of this trait score (theta), and the associated standard error, using any combination or number of items. These PROMIS item parameters and the IRT algorithm were programmed into the TeleSage IRT engine, which runs on the TeleSage data collection platform, called PORTAL. The IRT algorithms were created with assistance from Seung Choi, who also assisted with development of the PROMIS assessment center algorithms [<xref ref-type="bibr" rid="ref14">14</xref>]. For this study, we chose to use the PROMIS items and parameters due to the rigor that was used in their development and their proven relevance in the field [<xref ref-type="bibr" rid="ref12">12</xref>].</p>
        <p>Dividing the PROMIS depression item bank into 2 nonoverlapping analogous subsets of 14 items created the item sets used in this study. Although a perfect correspondence of content within pairs was not possible, Dr Brodey, a psychiatrist with clinical experience, paired the most similar items together based on criteria from the Diagnostic and Statistical Manual of Mental Disorders, fifth edition (DSM-5). For example, sadness was paired with depression. Sadness and depression are represented by unique PROMIS items but are included in a single DSM-5 criterion [<xref ref-type="bibr" rid="ref15">15</xref>]. The members of each pair were then divided into Form A and B (see <xref ref-type="boxed-text" rid="box1">Textboxes 1</xref> and <xref ref-type="boxed-text" rid="box2">2</xref>). Dividing the PROMIS items based on face validity preserves psychometric equivalence while maximizing clinical equivalence and relevance. The test information curves were derived from the de-identified data set used in the original PROMIS validation [<xref ref-type="bibr" rid="ref12">12</xref>]. Upon first analysis, one of the item sets provided slightly more information than the other, so one pair was chosen and the 2 items in that pair were switched to the opposite form. The test information curve for the final item sets can be seen in the Results section.</p>
      </sec>
      <sec>
        <title>Data Collection Tool</title>
        <p>Electronic health records (EHR) are a ready means of housing and sharing quantitative health information. We used the Health Insurance Portability and Accountability Act of 1996 (HIPAA)-compliant security technologies and an HL7 protocol for the bidirectional exchange of data between the community mental health systems’ EHR and the TeleSage database, via the TeleSage PORTAL.</p>
      </sec>
      <sec>
        <title>Recruitment and Summary of Participants</title>
        <p>Following full institutional review board (IRB) approval of this study, participants were recruited via flyers that were posted at an outpatient community mental health center serving severely and persistently mentally ill clients in the Memphis, TN area. Clients were excluded if they were younger than 18 years of age. Participants were advised that they would be paid US$10 in the form of a Target gift certificate regardless of whether or not they completed the study. All 129 participants who began the study completed it. The ages of the participants ranged from 18 to 72 years with an average of 43 years. The participants were more often African-American (109/129, 84.5%), non-Hispanic (123/129, 95.3%), and female (83/129, 64.3%). This is representative of the public sector population served by the clinic used in this study. The demographic characteristics in mobile phone and tablet groups were very similar across age, sex, race, and ethnicity (<xref ref-type="table" rid="table1">Table 1</xref>).</p>
        <boxed-text id="box1" position="float">
          <title>Division of Patient-Reported Outcomes Measurement Information System depression bank items into Form A.</title>
          <p>Question text:</p>
          <list list-type="bullet">
            <list-item>
              <p>I felt hopeless.</p>
            </list-item>
            <list-item>
              <p>I felt unhappy.</p>
            </list-item>
            <list-item>
              <p>I felt sad.</p>
            </list-item>
            <list-item>
              <p>I felt guilty.</p>
            </list-item>
            <list-item>
              <p>I withdrew from other people.</p>
            </list-item>
            <list-item>
              <p>I felt like a failure.</p>
            </list-item>
            <list-item>
              <p>I felt discouraged about the future.</p>
            </list-item>
            <list-item>
              <p>I felt ignored by people.</p>
            </list-item>
            <list-item>
              <p>I found that things in my life were overwhelming.</p>
            </list-item>
            <list-item>
              <p>I felt that my life was empty.</p>
            </list-item>
            <list-item>
              <p>I felt disappointed in myself.</p>
            </list-item>
            <list-item>
              <p>I had trouble making decisions.</p>
            </list-item>
            <list-item>
              <p>I felt that I was not needed.</p>
            </list-item>
            <list-item>
              <p>I felt worthless.</p>
            </list-item>
          </list>
        </boxed-text>
        <boxed-text id="box2" position="float">
          <title>Division of Patient-Reported Outcomes Measurement Information System depression bank items into Form B.</title>
          <p>Question text:</p>
          <list list-type="bullet">
            <list-item>
              <p>I felt I had no reason for living.</p>
            </list-item>
            <list-item>
              <p>I felt that nothing could cheer me up.</p>
            </list-item>
            <list-item>
              <p>I felt depressed.</p>
            </list-item>
            <list-item>
              <p>I felt that I was to blame for things.</p>
            </list-item>
            <list-item>
              <p>I had trouble feeling close to people.</p>
            </list-item>
            <list-item>
              <p>I felt that I was not as good as other people.</p>
            </list-item>
            <list-item>
              <p>I felt that I had nothing to look forward to.</p>
            </list-item>
            <list-item>
              <p>I felt lonely.</p>
            </list-item>
            <list-item>
              <p>I felt emotionally exhausted.</p>
            </list-item>
            <list-item>
              <p>I felt that nothing was interesting.</p>
            </list-item>
            <list-item>
              <p>I felt helpless.</p>
            </list-item>
            <list-item>
              <p>I felt pessimistic.</p>
            </list-item>
            <list-item>
              <p>I felt that I wanted to give up on everything.</p>
            </list-item>
            <list-item>
              <p>I felt upset for no reason.</p>
            </list-item>
          </list>
        </boxed-text>
        <table-wrap position="float" id="table1">
          <label>Table 1</label>
          <caption>
            <p>Demographics of the full sample and of the mobile phone and tablet administration groups<sup>a</sup> (see <xref ref-type="app" rid="app1">Multimedia Appendix 1</xref>).</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="505"/>
            <col width="170"/>
            <col width="170"/>
            <col width="120"/>
            <thead>
              <tr valign="top">
                <td colspan="2">Demographics</td>
                <td>Full Sample (N=129)</td>
                <td>Mobile phone (N=63)</td>
                <td>Tablet (N=66)</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="2">Age; mean (standard deviation)</td>
                <td>43 (12)</td>
                <td>43 (11.28)</td>
                <td>44 (12.63)</td>
              </tr>
              <tr valign="top">
                <td colspan="2"><bold>Sex; N (%)</bold></td>
                <td><break/></td>
                <td><break/></td>
                <td><break/></td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Female</td>
                <td>83 (65)</td>
                <td>41 (65)</td>
                <td>42 (64)</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Male</td>
                <td>45 (35)</td>
                <td>22 (35)</td>
                <td>23 (36)</td>
              </tr>
              <tr valign="top">
                <td colspan="2"><bold>Race; N (%)</bold></td>
                <td><break/></td>
                <td><break/></td>
                <td><break/></td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Asian</td>
                <td>1 (1)</td>
                <td>1 (2)</td>
                <td>0 (0)</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>African-American</td>
                <td>109 (86)</td>
                <td>52 (83)</td>
                <td>57 (86)</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Caucasian</td>
                <td>17 (13)</td>
                <td>9 (14)</td>
                <td>8 (12)</td>
              </tr>
              <tr valign="top">
                <td colspan="2"><bold>Ethnicity; N (%)</bold></td>
                <td><break/></td>
                <td><break/></td>
                <td><break/></td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Non-Hispanic</td>
                <td>123 (98)</td>
                <td>59 (98)</td>
                <td>64 (98)</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Hispanic</td>
                <td>2 (2)</td>
                <td>1 (2)</td>
                <td>1 (2)</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table1fn1">
              <p><sup>a</sup>Missing values: sex (1 in tablet group), race (1 in mobile phone group, 1 in tablet group), and ethnicity (3 in mobile phone group, 1 in tablet group)</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
      <sec>
        <title>Assessment Modality Assignment and Administration</title>
        <p>HIPAA standards were maintained throughout the data collection process. Participants were divided into an 8-cell randomization and independently randomized into groups based on (1) modality of the electronic assessment administration (mobile phone vs tablet), (2) order of assessment modality (paper first vs electronic first), and (3) order of assessment subset presentation (Form A first vs Form B first). All modalities of the surveys were self-administered. The study coordinator at the clinical site provided paper forms, and the electronic assessments were provided via the Internet (using clinic Wi-Fi and a Samsung tablet [n=66] or mobile phone [n=63]) via the TeleSage PORTAL. The site study coordinator entered all the paper surveys into the TeleSage PORTAL by using the rapid data entry interface. TeleSage obtained demographic data on each participant by automatically matching participants with their NetSmart EHR. The PORTAL system integrated with the clinic EHR, allowing the direct importation of demographics from the EHR and direct export of the clinical report to the EHR. The demographic data for each individual, including age in years, sex, race, and ethnicity, were prepopulated into the study assessments without error via the PORTAL system. Assessment reports were generated and exported to the EHR in real time. After completing both survey modalities, 38 consecutive participants filled out a short satisfaction survey (on paper) regarding the technologies they used. The survey asked participants to compare their satisfaction with the paper survey versus the electronic survey, and it asked about satisfaction with the specific electronic modality they used. All questions used a 5-point Likert-scale format of “Strongly Agree” to “Strongly Disagree.” Participants also completed survey items that asked about their technology ownership and usage.</p>
      </sec>
      <sec>
        <title>Statistical Analysis</title>
        <p>Scores are evaluated on a theta scale, based on PROMIS community norms and defined from −4.0 to 4.0, where 0 is the mean, and positive scores indicate depression. The PORTAL’s IRT module estimated a trait score (theta) in real time for each of the 2 surveys taken by each individual using the GRM and the maximum likelihood estimation calculation method [<xref ref-type="bibr" rid="ref12">12</xref>]. The theta scores were subsequently analyzed using mixed-effects models with a random intercept, which allowed for variance in the severity of depression symptoms reported by participants. Additionally, participants were repeated in the data set, which allowed the model to take within-subject dependencies across administrations into account. Fixed-effects predictors included modality (paper, mobile phone, tablet), item set (Form A or B), and the interaction between modality and item set.</p>
        <p>To gain a more intuitive understanding of trends seen in the data, <italic>t</italic> tests were also performed. While <italic>t</italic> tests do not take into account all dependencies in the data, they do allow for a more direct comparison of within-subject variation (repeated measures <italic>t</italic> tests of Form A vs B, paper vs mobile phone, and paper vs tablet) and between-subject variation (an independent groups <italic>t</italic> test of mobile phone versus tablet; <xref ref-type="app" rid="app1">Multimedia Appendix 1</xref>).</p>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>Item Set Generation</title>
        <p>Using the methodology described previously, it was possible to create 2 psychometrically equivalent halves of the PROMIS depression item bank. <xref ref-type="fig" rid="figure1">Figure 1</xref> depicts the test information plots for Form A and B, based on item data from the original PROMIS validation [<xref ref-type="bibr" rid="ref12">12</xref>]. <xref ref-type="table" rid="table2">Table 2</xref> shows a summary of the IRT scale (theta) scores, overall, and based on variables of interest (<xref ref-type="app" rid="app1">Multimedia Appendix 1</xref>).</p>
        <fig id="figure1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>Item response theory test information plot for Forms A and B (see <xref ref-type="app" rid="app1">Multimedia Appendix 1</xref>).</p>
          </caption>
          <graphic xlink:href="mental_v4i3e36_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <table-wrap position="float" id="table2">
          <label>Table 2</label>
          <caption>
            <p>Summary of item response theory scale scores, overall and by variables of interest (see <xref ref-type="app" rid="app1">Multimedia Appendix 1</xref>).</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="575"/>
            <col width="120"/>
            <col width="120"/>
            <col width="150"/>
            <thead>
              <tr valign="top">
                <td colspan="2">Condition</td>
                <td>N</td>
                <td>Mean</td>
                <td>Standard deviation</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="2">Overall</td>
                <td>258</td>
                <td>0.91</td>
                <td>0.98</td>
              </tr>
              <tr valign="top">
                <td colspan="2"><bold>Modality</bold></td>
                <td><break/></td>
                <td><break/></td>
                <td><break/></td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Paper</td>
                <td>129</td>
                <td>0.91</td>
                <td>0.87</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Mobile phone</td>
                <td>63</td>
                <td>0.89</td>
                <td>1.04</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Tablet</td>
                <td>66</td>
                <td>0.93</td>
                <td>1.11</td>
              </tr>
              <tr valign="top">
                <td colspan="2"><bold>Form</bold></td>
                <td><break/></td>
                <td><break/></td>
                <td><break/></td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>A</td>
                <td>129</td>
                <td>0.92</td>
                <td>0.91</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>B</td>
                <td>129</td>
                <td>0.90</td>
                <td>1.04</td>
              </tr>
              <tr valign="top">
                <td colspan="2"><bold>Modality × Form</bold></td>
                <td><break/></td>
                <td><break/></td>
                <td><break/></td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Paper × A</td>
                <td>65</td>
                <td>0.85</td>
                <td>0.92</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Paper × B</td>
                <td>64</td>
                <td>0.98</td>
                <td>0.82</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Mobile phone × A</td>
                <td>32</td>
                <td>0.93</td>
                <td>1.02</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Mobile phone × B</td>
                <td>31</td>
                <td>0.85</td>
                <td>1.08</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Tablet × A</td>
                <td>32</td>
                <td>1.05</td>
                <td>0.79</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Tablet × B</td>
                <td>34</td>
                <td>0.81</td>
                <td>1.34</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
      </sec>
      <sec>
        <title>Statistical Analyses</title>
        <p>Dr RJ Wirth, of Vector Psychometric Group, completed all statistical analyses. The wording of this section was taken from Dr Wirth’s report (see <xref ref-type="app" rid="app1">Multimedia Appendix 1</xref>). For the full data analyses, the first model included modality, form, and the modality-by-form interaction as predictors. Results showed a statistically nonsignificant interaction, indicating that the difference between forms did not depend on modality; <italic>F</italic><sub>2,125</sub>=0.44, <italic>P</italic>=.64. For parsimony, the nonsignificant modality-by-form interaction was dropped and a second, main effects only model was estimated using modality and form as predictors. Results from this main-effects model demonstrated that there was not a statistically significant effect of either form, <italic>F</italic><sub>1,126</sub>=0.06, <italic>P</italic>=.81, or modality, <italic>F</italic><sub>2,126</sub>=0.16, <italic>P</italic>=.85 on the provided IRT scale scores for depression.</p>
        <p>Similar results were obtained for the model using only data from unflagged observations, which resulted in the removal of 12 subjects for a reduced N of 117. Initial model results showed a statistically nonsignificant interaction, indicating that the difference between forms did not depend on modality; <italic>F</italic><sub>2,113</sub>=0.39, <italic>P</italic>=.68. For parsimony, the nonsignificant modality-by-form interaction was dropped and a second model was estimated with only modality and form as main effect predictors. Results from this model again demonstrated that there were no statistically significant effects due to either form, <italic>F</italic><sub>1,114</sub>=0.15, <italic>P</italic>=.70, or modality, <italic>F</italic><sub>2,114</sub>=0.23, <italic>P</italic>=.79 on depression scores.</p>
        <p>The data were also analyzed using <italic>t</italic> tests. While <italic>t</italic> tests do not model as many dependencies in the data, they are often easier to interpret. The results of the repeated-measures <italic>t</italic> tests (comparing the means of Form A and B, as well as paper vs mobile phone scores and paper vs tablet scores) are shown in <xref ref-type="table" rid="table3">Table 3</xref>. The results of the independent groups <italic>t</italic> test (comparing mobile phone vs tablet scores) are shown in <xref ref-type="table" rid="table4">Table 4</xref>. The results of the <italic>t</italic> tests support the general findings of the previously reported analysis of variance; no statistically significant differences were found among any of the modality comparisons or across forms.</p>
      </sec>
      <sec>
        <title>Post-Assessment Satisfaction and Technology Usage and Experience Survey</title>
        <p>After completing both the electronic and the paper assessments, 38 participants in our study received a paper satisfaction survey. Of the mobile phone and tablet groups, 62% (39/63) and 61% (40/66), respectively, responded that they agreed or strongly agreed with the following statement: “It was easier to read the questions on the mobile phone/tablet (than on the paper form).” Of the mobile phone and tablet groups, 61% (38/63) and 72% (48/66), respectively, responded that they disagreed or disagreed strongly with the following statement: “It took me longer to take the survey on the mobile phone/tablet (than on the paper form).” Of the mobile phone and tablet groups, 50% (32/63) and 48% (32/66), respectively, responded that they agreed or strongly agreed with the following statement: “Overall, it was easier to take the survey on the mobile phone/tablet (than on the paper form).” Of the mobile phone and tablet groups, 66% (42/63) and 67% (44/66), respectively, responded that they agreed or strongly agreed with the following statement: “In the future, I would be equally willing to take a survey on paper or using the mobile phone/tablet.” These results indicate that overall, the participants felt that the technologies were largely equivalent.</p>
        <p>Analysis of the technology usage and experience survey showed that technology access in the 2 groups was essentially equivalent. Personal computer ownership was 22% (14/63) for the mobile phone group and 18% (12/66) for the tablet group. The mean observed durations for assessment completion on the mobile phone and tablet were very similar (3.61 and 3.41 minutes, respectively). The mean duration for paper administration was 1.66 minutes. The mean durations of the Form A and Form B electronic survey administrations were very similar (3.57 and 3.43 minutes, respectively).</p>
        <table-wrap position="float" id="table3">
          <label>Table 3</label>
          <caption>
            <p>Group descriptives and associated <italic>t</italic> test values for repeated measures planned comparisons (see <xref ref-type="app" rid="app1">Multimedia Appendix 1</xref>).</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="250"/>
            <col width="80"/>
            <col width="100"/>
            <col width="150"/>
            <col width="150"/>
            <col width="80"/>
            <col width="80"/>
            <col width="80"/>
            <thead>
              <tr valign="top">
                <td colspan="2">Group</td>
                <td>N</td>
                <td>Mean</td>
                <td>Standard deviation</td>
                <td>Degrees of freedom</td>
                <td><italic>t</italic></td>
                <td><italic>P</italic></td>
                <td>Cohen <italic>d</italic><sup>a</sup></td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="2">Form A</td>
                <td>129</td>
                <td>0.92</td>
                <td>0.91</td>
                <td><break/></td>
                <td><break/></td>
                <td><break/></td>
                <td><break/></td>
              </tr>
              <tr valign="top">
                <td colspan="2">Form B</td>
                <td>129</td>
                <td>0.90</td>
                <td>1.04</td>
                <td><break/></td>
                <td><break/></td>
                <td><break/></td>
                <td><break/></td>
              </tr>
              <tr valign="top">
                <td colspan="2">Difference</td>
                <td><break/></td>
                <td>0.01</td>
                <td>0.59</td>
                <td>128</td>
                <td>0.25</td>
                <td>.80</td>
                <td>0.02</td>
              </tr>
              <tr valign="top">
                <td colspan="2"><bold>Mobile Phone Group</bold></td>
                <td><break/></td>
                <td><break/></td>
                <td><break/></td>
                <td><break/></td>
                <td><break/></td>
                <td><break/></td>
                <td><break/></td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Paper</td>
                <td>63</td>
                <td>0.85</td>
                <td>0.93</td>
                <td><break/></td>
                <td><break/></td>
                <td><break/></td>
                <td><break/></td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Mobile phone</td>
                <td>63</td>
                <td>0.89</td>
                <td>1.04</td>
                <td><break/></td>
                <td><break/></td>
                <td><break/></td>
                <td><break/></td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Difference</td>
                <td><break/></td>
                <td>−0.03</td>
                <td>0.66</td>
                <td>62</td>
                <td>0.42</td>
                <td>.68</td>
                <td>0.04</td>
              </tr>
              <tr valign="top">
                <td colspan="2"><bold>Tablet Group</bold></td>
                <td><break/></td>
                <td><break/></td>
                <td><break/></td>
                <td><break/></td>
                <td><break/></td>
                <td><break/></td>
                <td><break/></td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Paper</td>
                <td>66</td>
                <td>0.97</td>
                <td>0.81</td>
                <td><break/></td>
                <td><break/></td>
                <td><break/></td>
                <td><break/></td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Tablet</td>
                <td>66</td>
                <td>0.93</td>
                <td>1.11</td>
                <td><break/></td>
                <td><break/></td>
                <td><break/></td>
                <td><break/></td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Difference</td>
                <td><break/></td>
                <td>0.04</td>
                <td>0.53</td>
                <td>65</td>
                <td>0.68</td>
                <td>.50</td>
                <td>0.04</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table3fn1">
              <p><sup>a</sup>Cohen <italic>d</italic> was calculated using original group standard deviations, rather than difference standard deviation [<xref ref-type="bibr" rid="ref16">16</xref>].</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <table-wrap position="float" id="table4">
          <label>Table 4</label>
          <caption>
            <p>Group descriptives and <italic>t</italic> test results for the mobile phone versus tablet independent groups comparison (see <xref ref-type="app" rid="app1">Multimedia Appendix 1</xref>).</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="280"/>
            <col width="80"/>
            <col width="100"/>
            <col width="150"/>
            <col width="150"/>
            <col width="80"/>
            <col width="80"/>
            <col width="80"/>
            <thead>
              <tr valign="top">
                <td>Group</td>
                <td>N</td>
                <td>Mean</td>
                <td>Standard deviation</td>
                <td>Degrees of freedom</td>
                <td><italic>t</italic></td>
                <td><italic>P</italic></td>
                <td>Cohen <italic>d</italic></td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Mobile phone</td>
                <td>63</td>
                <td>0.89</td>
                <td>1.04</td>
                <td><break/></td>
                <td><break/></td>
                <td><break/></td>
                <td><break/></td>
              </tr>
              <tr valign="top">
                <td>Tablet</td>
                <td>66</td>
                <td>0.93</td>
                <td>1.11</td>
                <td><break/></td>
                <td><break/></td>
                <td><break/></td>
                <td><break/></td>
              </tr>
              <tr valign="top">
                <td>Difference</td>
                <td><break/></td>
                <td>−0.04</td>
                <td>1.08</td>
                <td>127</td>
                <td>−0.2</td>
                <td>.84</td>
                <td>0.04</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Principal Results</title>
        <p>This study found no significant difference between the 2 item sets created from the PROMIS depression item bank; therefore, Forms A and B functioned equivalently in our sample. This suggests that in the future, researchers can administer Forms A and B to the same participant, in the same visit, without results being biased by a memory effect. Future studies could implement the methodology used in this study to assess the equivalence of additional technologies (eg, interactive voice response and smart eye wear [<xref ref-type="bibr" rid="ref17">17</xref>,<xref ref-type="bibr" rid="ref18">18</xref>]), or the equivalence of different administration settings (eg, the clinician’s office vs a patient’s home). Additionally, using multiple equivalent item groups may improve methodologies involving regularly repeated longitudinal assessments, by reducing any memory bias.</p>
        <p>We also found no significant differences between the EDC methods and paper, or between mobile phone and tablet. The negligible effect sizes of the differences between assessment modalities suggest that these technologies functioned equivalently within our sample, which is consistent with previous literature [<xref ref-type="bibr" rid="ref1">1</xref>-<xref ref-type="bibr" rid="ref3">3</xref>,<xref ref-type="bibr" rid="ref5">5</xref>-<xref ref-type="bibr" rid="ref10">10</xref>]. These findings imply that clinicians and researchers can administer the PROMIS depression items to public sector mental health recipients via mobile phone, tablet, or paper, without impacting the reliability of the information gathered from each modality, and can even shift between survey administration technologies during a study without fear of significantly affecting the validity of the survey responses or confounding the study results.</p>
        <p>Along with modality and form equivalence, the satisfaction survey revealed that there was no modality (electronic or paper) that participants clearly preferred. This was a surprising finding because the EDC methods took, on average, approximately twice as long as the paper surveys. We do not have clear evidence explaining this variation, but it may be that the EDC modality was relatively novel for many participants, so it took them extra time to learn how to navigate the electronic surveys. Despite the time difference, a majority of the participants disagreed or disagreed strongly with the statement that it took longer to complete the survey using the EDC method. This suggests that patients/participants may not be averse to longer surveys if the surveys are administered electronically.</p>
      </sec>
      <sec>
        <title>Limitations</title>
        <p>Many of the recruited clients suffered from schizophrenia. This may have impaired their ability to respond to survey questions. Additionally, this study was conducted with the PROMIS items, which were designed to be short and easy to interpret. Thus, the results might not generalize to more complex question formats.</p>
      </sec>
      <sec>
        <title>Comparison With Prior Work</title>
        <p>There are several strengths of the current study that expand upon work done previously. While there has been work done using the PROMIS depression item bank and alternate methods of administration, this may be the first study to use nonoverlapping, equivalent item sets [<xref ref-type="bibr" rid="ref2">2</xref>]. This methodology could be applied to other instruments in which modality equivalence has been found, to provide greater strength to these studies [<xref ref-type="bibr" rid="ref3">3</xref>,<xref ref-type="bibr" rid="ref5">5</xref>,<xref ref-type="bibr" rid="ref7">7</xref>,<xref ref-type="bibr" rid="ref8">8</xref>]. One study used 2 different self-report instruments to assess depression and compare modalities, but the authors found significant main effects and interaction effects based on the order in which the 2 instruments were administered [<xref ref-type="bibr" rid="ref6">6</xref>]. While using 2 different but psychometrically equivalent instruments may have eliminated the risk of memory effect in the previous study, it could have benefitted from the methodology in this study—administering nonoverlapping items from the same assessment (to decrease the effects of administration order) [<xref ref-type="bibr" rid="ref6">6</xref>].</p>
        <p>Additionally, several prior studies have found that participants prefer using an EDC method to a paper survey [<xref ref-type="bibr" rid="ref2">2</xref>,<xref ref-type="bibr" rid="ref3">3</xref>,<xref ref-type="bibr" rid="ref8">8</xref>]. The current study did not have results that are consistent with these studies, suggesting that user preference can change.</p>
      </sec>
      <sec>
        <title>Suggestions for Future Research</title>
        <p>Future work should investigate the equivalence of data collected in different settings. With the PORTAL software, clients can easily be administered a survey in their homes via an email or text link (this study’s IRB approval required that all data be gathered within a health care setting). Future research in the public sector mental health care field would benefit from further research of user preference. Finding a modality that most patients are satisfied with could increase both study participation rates and the accuracy of diagnoses, especially if a self-report diagnostic assessment can be administered at home using EDC methods.</p>
      </sec>
      <sec>
        <title>Conclusions</title>
        <p>The current study found that, in a population of mental health care recipients, 3 different self-report assessment modalities (mobile phone, tablet, paper) yielded essentially identical assessment results and essentially equivalent satisfaction levels. This suggests that, at least for the PROMIS depression assessment and public sector mental health recipients, the choice of survey administration technology in future studies can be based on cost and convenience. The results may open the way for more accurate technology comparisons among depressed patients.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group>
      <app id="app1">
        <title>Multimedia Appendix 1</title>
        <p>Statistical report from Dr RJ Wirth.</p>
        <media xlink:href="mental_v4i3e36_app1.pdf" xlink:title="PDF File (Adobe PDF File), 88KB"/>
      </app>
    </app-group>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">DSM-5</term>
          <def>
            <p>Diagnostic and Statistical Manual of Mental Disorders, fifth edition</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">EDC</term>
          <def>
            <p>electronic data collection</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">EHR</term>
          <def>
            <p>electronic health record</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">GRM</term>
          <def>
            <p>graded response model</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">HIPAA</term>
          <def>
            <p>Health Insurance Portability and Accountability Act of 1996</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb6">IRB</term>
          <def>
            <p>institutional review board</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb7">IRT</term>
          <def>
            <p>item response theory</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb8">PROMIS</term>
          <def>
            <p>patient-reported outcomes measurement information system</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>The authors thank RJ Wirth, Vector Psychometric Group LLC, Alliance Healthcare Services, and Netsmart Technologies. Funding was provided by National Institutes of Health Grant 1R44MH102914-01A1.</p>
    </ack>
    <fn-group>
      <fn fn-type="conflict">
        <p>ISB and BBB are the sole owners of TeleSage, Inc., which is the company that developed and hosts the PORTAL system used in this study.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Brodey</surname>
            <given-names>B</given-names>
          </name>
          <name name-style="western">
            <surname>First</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Linthicum</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Haman</surname>
            <given-names>K</given-names>
          </name>
          <name name-style="western">
            <surname>Sasiela</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Ayer</surname>
            <given-names>D</given-names>
          </name>
        </person-group>
        <article-title>Validation of the NetSCID: an automated web-based adaptive version of the SCID</article-title>
        <source>Compr Psychiatry</source>  
        <year>2016</year>  
        <volume>66</volume>  
        <fpage>67</fpage>  
        <lpage>70</lpage>  
        <pub-id pub-id-type="doi">10.1016/j.comppsych.2015.10.005</pub-id>
        <pub-id pub-id-type="medline">26995238</pub-id></nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Bjorner</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Rose</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Gandek</surname>
            <given-names>B</given-names>
          </name>
          <name name-style="western">
            <surname>Stone</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Junghaenel</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Ware</surname>
            <given-names>JJ</given-names>
          </name>
        </person-group>
        <article-title>Method of administration of PROMIS scales did not significantly impact score level, reliability, or validity</article-title>
        <source>J Clin Epidemiol</source>  
        <year>2014</year>  
        <volume>67</volume>  
        <fpage>108</fpage>  
        <lpage>113</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://linkinghub.elsevier.com/retrieve/pii/S0895435613003466"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1016/j.jclinepi.2013.07.016</pub-id>
        <pub-id pub-id-type="medline">24262772</pub-id></nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Bush</surname>
            <given-names>NE</given-names>
          </name>
          <name name-style="western">
            <surname>Skopp</surname>
            <given-names>N</given-names>
          </name>
          <name name-style="western">
            <surname>Smolenski</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Crumpton</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Fairall</surname>
            <given-names>J</given-names>
          </name>
        </person-group>
        <article-title>Behavioral screening measures delivered with a smartphone app: psychometric properties and user preference</article-title>
        <source>J Nerv Ment Dis</source>  
        <year>2013</year>  
        <volume>201</volume>  
        <fpage>991</fpage>  
        <lpage>995</lpage>  
        <pub-id pub-id-type="doi">10.1097/NMD.0000000000000039</pub-id>
        <pub-id pub-id-type="medline">24177488</pub-id>
        <pub-id pub-id-type="pii">00005053-201311000-00012</pub-id></nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Zhang</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Wu</surname>
            <given-names>Q</given-names>
          </name>
          <name name-style="western">
            <surname>van Velthoven</surname>
            <given-names>MH</given-names>
          </name>
          <name name-style="western">
            <surname>Chen</surname>
            <given-names>L</given-names>
          </name>
          <name name-style="western">
            <surname>Car</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Rudan</surname>
            <given-names>I</given-names>
          </name>
          <name name-style="western">
            <surname>Zhang</surname>
            <given-names>Y</given-names>
          </name>
          <name name-style="western">
            <surname>Li</surname>
            <given-names>Y</given-names>
          </name>
          <name name-style="western">
            <surname>Scherpbier</surname>
            <given-names>RW</given-names>
          </name>
        </person-group>
        <article-title>Smartphone versus pen-and-paper data collection of infant feeding practices in rural China</article-title>
        <source>J Med Internet Res</source>  
        <year>2012</year>  
        <volume>14</volume>  
        <fpage>e119</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.jmir.org/2012/5/e119/"/>
        </comment>  
        <pub-id pub-id-type="doi">10.2196/jmir.2183</pub-id>
        <pub-id pub-id-type="medline">22989894</pub-id>
        <pub-id pub-id-type="pii">v14i5e119</pub-id>
        <pub-id pub-id-type="pmcid">PMC3510690</pub-id></nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Clionsky</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Clionsky</surname>
            <given-names>E</given-names>
          </name>
        </person-group>
        <article-title>Psychometric equivalence of a paper-based and computerized (iPad) version of the Memory Orientation Screening Test (MOST®)</article-title>
        <source>Clin Neuropsychol</source>  
        <year>2014</year>  
        <volume>28</volume>  
        <fpage>747</fpage>  
        <lpage>755</lpage>  
        <pub-id pub-id-type="doi">10.1080/13854046.2014.913686</pub-id>
        <pub-id pub-id-type="medline">24815733</pub-id></nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Holländare</surname>
            <given-names>F</given-names>
          </name>
          <name name-style="western">
            <surname>Andersson</surname>
            <given-names>G</given-names>
          </name>
          <name name-style="western">
            <surname>Engström</surname>
            <given-names>I</given-names>
          </name>
        </person-group>
        <article-title>A comparison of psychometric properties between internet and paper versions of two depression instruments (BDI-II and MADRS-S) administered to clinic patients</article-title>
        <source>J Med Internet Res</source>  
        <year>2010</year>  
        <volume>12</volume>  
        <fpage>e49</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.jmir.org/2010/5/e49/"/>
        </comment>  
        <pub-id pub-id-type="doi">10.2196/jmir.1392</pub-id>
        <pub-id pub-id-type="medline">21169165</pub-id>
        <pub-id pub-id-type="pii">v12i5e49</pub-id>
        <pub-id pub-id-type="pmcid">PMC3057311</pub-id></nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Bennett</surname>
            <given-names>AV</given-names>
          </name>
          <name name-style="western">
            <surname>Dueck</surname>
            <given-names>AC</given-names>
          </name>
          <name name-style="western">
            <surname>Mitchell</surname>
            <given-names>SA</given-names>
          </name>
          <name name-style="western">
            <surname>Mendoza</surname>
            <given-names>TR</given-names>
          </name>
          <name name-style="western">
            <surname>Reeve</surname>
            <given-names>BB</given-names>
          </name>
          <name name-style="western">
            <surname>Atkinson</surname>
            <given-names>TM</given-names>
          </name>
          <name name-style="western">
            <surname>Castro</surname>
            <given-names>KM</given-names>
          </name>
          <name name-style="western">
            <surname>Denicoff</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Rogak</surname>
            <given-names>LJ</given-names>
          </name>
          <name name-style="western">
            <surname>Harness</surname>
            <given-names>JK</given-names>
          </name>
          <name name-style="western">
            <surname>Bearden</surname>
            <given-names>JD</given-names>
          </name>
          <name name-style="western">
            <surname>Bryant</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Siegel</surname>
            <given-names>RD</given-names>
          </name>
          <name name-style="western">
            <surname>Schrag</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Basch</surname>
            <given-names>E</given-names>
          </name>
          <collab>National Cancer Institute PRO-CTCAE Study Group</collab>
        </person-group>
        <article-title>Mode equivalence and acceptability of tablet computer-, interactive voice response system-, and paper-based administration of the U.S. National Cancer Institute's Patient-Reported Outcomes version of the Common Terminology Criteria for Adverse Events (PRO-CTCAE)</article-title>
        <source>Health Qual Life Outcomes</source>  
        <year>2016</year>  
        <volume>14</volume>  
        <fpage>24</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="https://hqlo.biomedcentral.com/articles/10.1186/s12955-016-0426-6"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1186/s12955-016-0426-6</pub-id>
        <pub-id pub-id-type="medline">26892667</pub-id>
        <pub-id pub-id-type="pii">10.1186/s12955-016-0426-6</pub-id>
        <pub-id pub-id-type="pmcid">PMC4759776</pub-id></nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Cook</surname>
            <given-names>I</given-names>
          </name>
          <name name-style="western">
            <surname>Balasubramani</surname>
            <given-names>G</given-names>
          </name>
          <name name-style="western">
            <surname>Eng</surname>
            <given-names>H</given-names>
          </name>
          <name name-style="western">
            <surname>Friedman</surname>
            <given-names>E</given-names>
          </name>
          <name name-style="western">
            <surname>Young</surname>
            <given-names>EA</given-names>
          </name>
          <name name-style="western">
            <surname>Martin</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Nay</surname>
            <given-names>WT</given-names>
          </name>
          <name name-style="western">
            <surname>Ritz</surname>
            <given-names>L</given-names>
          </name>
          <name name-style="western">
            <surname>Rush</surname>
            <given-names>AJ</given-names>
          </name>
          <name name-style="western">
            <surname>Stegman</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Warden</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Trivedi</surname>
            <given-names>MH</given-names>
          </name>
          <name name-style="western">
            <surname>Wisniewski</surname>
            <given-names>SR</given-names>
          </name>
        </person-group>
        <article-title>Electronic source materials in clinical research: acceptability and validity of symptom self-rating in major depressive disorder</article-title>
        <source>J Psychiatr Res</source>  
        <year>2007</year>  
        <volume>41</volume>  
        <fpage>737</fpage>  
        <lpage>743</lpage>  
        <pub-id pub-id-type="doi">10.1016/j.jpsychires.2006.07.015</pub-id>
        <pub-id pub-id-type="medline">17275840</pub-id>
        <pub-id pub-id-type="pii">S0022-3956(06)00148-8</pub-id></nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Goldstein</surname>
            <given-names>LA</given-names>
          </name>
          <name name-style="western">
            <surname>Connolly Gibbons</surname>
            <given-names>MB</given-names>
          </name>
          <name name-style="western">
            <surname>Thompson</surname>
            <given-names>SM</given-names>
          </name>
          <name name-style="western">
            <surname>Scott</surname>
            <given-names>K</given-names>
          </name>
          <name name-style="western">
            <surname>Heintz</surname>
            <given-names>L</given-names>
          </name>
          <name name-style="western">
            <surname>Green</surname>
            <given-names>P</given-names>
          </name>
          <name name-style="western">
            <surname>Thompson</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Crits-Christoph</surname>
            <given-names>P</given-names>
          </name>
        </person-group>
        <article-title>Outcome assessment via handheld computer in community mental health: consumer satisfaction and reliability</article-title>
        <source>J Behav Health Serv Res</source>  
        <year>2011</year>  
        <volume>38</volume>  
        <fpage>414</fpage>  
        <lpage>423</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/21107916"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1007/s11414-010-9229-4</pub-id>
        <pub-id pub-id-type="medline">21107916</pub-id>
        <pub-id pub-id-type="pmcid">PMC3299491</pub-id></nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Gwaltney</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Shields</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Shiffman</surname>
            <given-names>S</given-names>
          </name>
        </person-group>
        <article-title>Equivalence of electronic and paper-and-pencil administration of patient-reported outcome measures: a meta-analytic review</article-title>
        <source>Value Health</source>  
        <year>2008</year>  
        <volume>11</volume>  
        <fpage>322</fpage>  
        <lpage>333</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1098-3015(10)60526-8"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1111/j.1524-4733.2007.00231.x</pub-id>
        <pub-id pub-id-type="medline">18380645</pub-id>
        <pub-id pub-id-type="pii">S1098-3015(10)60526-8</pub-id></nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Pilkonis</surname>
            <given-names>PA</given-names>
          </name>
          <name name-style="western">
            <surname>Choi</surname>
            <given-names>SW</given-names>
          </name>
          <name name-style="western">
            <surname>Reise</surname>
            <given-names>SP</given-names>
          </name>
          <name name-style="western">
            <surname>Stover</surname>
            <given-names>AM</given-names>
          </name>
          <name name-style="western">
            <surname>Riley</surname>
            <given-names>WT</given-names>
          </name>
          <name name-style="western">
            <surname>Cella</surname>
            <given-names>D</given-names>
          </name>
        </person-group>
        <article-title>Item banks for measuring emotional distress from the Patient-Reported Outcomes Measurement Information System (PROMIS®): depression, anxiety, and anger</article-title>
        <source>Assessment</source>  
        <year>2011</year>  
        <volume>18</volume>  
        <fpage>263</fpage>  
        <lpage>283</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/21697139"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1177/1073191111411667</pub-id>
        <pub-id pub-id-type="medline">21697139</pub-id>
        <pub-id pub-id-type="pii">1073191111411667</pub-id>
        <pub-id pub-id-type="pmcid">PMC3153635</pub-id></nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Pilkonis</surname>
            <given-names>PA</given-names>
          </name>
          <name name-style="western">
            <surname>Yu</surname>
            <given-names>L</given-names>
          </name>
          <name name-style="western">
            <surname>Dodds</surname>
            <given-names>NE</given-names>
          </name>
          <name name-style="western">
            <surname>Johnston</surname>
            <given-names>KL</given-names>
          </name>
          <name name-style="western">
            <surname>Maihoefer</surname>
            <given-names>CC</given-names>
          </name>
          <name name-style="western">
            <surname>Lawrence</surname>
            <given-names>SM</given-names>
          </name>
        </person-group>
        <article-title>Validation of the depression item bank from the Patient-Reported Outcomes Measurement Information System (PROMIS) in a three-month observational study</article-title>
        <source>J Psychiatr Res</source>  
        <year>2014</year>  
        <volume>56</volume>  
        <fpage>112</fpage>  
        <lpage>119</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/24931848"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1016/j.jpsychires.2014.05.010</pub-id>
        <pub-id pub-id-type="medline">24931848</pub-id>
        <pub-id pub-id-type="pii">S0022-3956(14)00148-4</pub-id>
        <pub-id pub-id-type="pmcid">PMC4096965</pub-id></nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Yang</surname>
            <given-names>FM</given-names>
          </name>
          <name name-style="western">
            <surname>Kao</surname>
            <given-names>ST</given-names>
          </name>
        </person-group>
        <article-title>Item response theory for measurement validity</article-title>
        <source>Shanghai Arch Psychiatry</source>  
        <year>2014</year>  
        <volume>26</volume>  
        <fpage>171</fpage>  
        <lpage>177</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/25114494"/>
        </comment>  
        <pub-id pub-id-type="medline">25114494</pub-id>
        <pub-id pub-id-type="pii">sap-26-03-171</pub-id>
        <pub-id pub-id-type="pmcid">PMC4118016</pub-id></nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Choi</surname>
            <given-names>S</given-names>
          </name>
        </person-group>
        <article-title>Firestar: computerized adaptive testing simulation program for polytomous item response theory models</article-title>
        <source>Appl Psychol Meas</source>  
        <year>2009</year>  
        <volume>33</volume>  
        <fpage>644</fpage>  
        <lpage>645</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://journals.sagepub.com/doi/10.1177/0146621608329892"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1177/0146621608329892</pub-id></nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="book">
        <person-group person-group-type="author">
          <collab>American Psychiatric Association</collab>
        </person-group>
        <source>Diagnostic and Statistical Manual of Mental Disorders. Fifth Edition</source>  
        <year>2013</year>  
        <publisher-loc>Arlington, VA</publisher-loc>
        <publisher-name>American Psychiatric Association</publisher-name></nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Dunlap</surname>
            <given-names>WP</given-names>
          </name>
          <name name-style="western">
            <surname>Cortina</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Vaslow</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Burke</surname>
            <given-names>M</given-names>
          </name>
        </person-group>
        <article-title>Meta-analysis of experiments with matched groups or repeated measures designs</article-title>
        <source>Psychol Methods</source>  
        <year>1996</year>  
        <volume>1</volume>  
        <fpage>170</fpage>  
        <lpage>177</lpage>  
        <pub-id pub-id-type="doi">10.1037/1082-989X.1.2.170</pub-id></nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Brodey</surname>
            <given-names>BB</given-names>
          </name>
          <name name-style="western">
            <surname>Rosen</surname>
            <given-names>CS</given-names>
          </name>
          <name name-style="western">
            <surname>Brodey</surname>
            <given-names>IS</given-names>
          </name>
          <name name-style="western">
            <surname>Sheetz</surname>
            <given-names>B</given-names>
          </name>
          <name name-style="western">
            <surname>Unützer</surname>
            <given-names>J</given-names>
          </name>
        </person-group>
        <article-title>Reliability and acceptability of automated telephone surveys among Spanish- and English-speaking mental health services recipients</article-title>
        <source>Ment Health Serv Res</source>  
        <year>2005</year>  
        <volume>7</volume>  
        <fpage>181</fpage>  
        <lpage>184</lpage>  
        <pub-id pub-id-type="doi">10.1007/s11020-005-5786-1</pub-id></nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Valmaggia</surname>
            <given-names>LR</given-names>
          </name>
          <name name-style="western">
            <surname>Day</surname>
            <given-names>F</given-names>
          </name>
          <name name-style="western">
            <surname>Rus-Calafell</surname>
            <given-names>M</given-names>
          </name>
        </person-group>
        <article-title>Using virtual reality to investigate psychological processes and mechanisms associated with the onset and maintenance of psychosis: a systematic review</article-title>
        <source>Soc Psychiatry Psychiatr Epidemiol</source>  
        <year>2016</year>  
        <volume>51</volume>  
        <fpage>921</fpage>  
        <lpage>936</lpage>  
        <pub-id pub-id-type="doi">10.1007/s00127-016-1245-0</pub-id></nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
