<?xml version="1.0" encoding="utf-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMIR</journal-id>
      <journal-id journal-id-type="nlm-ta">J Med Internet Res</journal-id>
      <journal-title>Journal of Medical Internet Research</journal-title>
      <issn pub-type="epub">1438-8871</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
    <article-id pub-id-type="publisher-id">v19i9e302</article-id>
    <article-id pub-id-type="pmid">28931496</article-id>
    <article-id pub-id-type="doi">10.2196/jmir.7453</article-id>
    <article-categories>
      <subj-group subj-group-type="heading">
        <subject>Original Paper</subject>
      </subj-group>
      <subj-group subj-group-type="article-type">
        <subject>Original Paper</subject>
      </subj-group>
    </article-categories>
    <title-group>
      <article-title>Computerized Adaptive Testing Provides Reliable and Efficient Depression Measurement Using the CES-D Scale</article-title>
    </title-group>
    <contrib-group>
      <contrib contrib-type="editor">
        <name>
          <surname>Torous</surname>
          <given-names>John</given-names>
        </name>
      </contrib>
    </contrib-group>
    <contrib-group>
      <contrib contrib-type="reviewer">
        <name>
          <surname>Apolinário-Hagen</surname>
          <given-names>Jennifer</given-names>
        </name>
      </contrib>
      <contrib contrib-type="reviewer">
        <name>
          <surname>Donker</surname>
          <given-names>Tara</given-names>
        </name>
      </contrib>
    </contrib-group>
    <contrib-group>
      <contrib contrib-type="author" id="contrib1" equal-contrib="yes">
        <name name-style="western">
          <surname>Loe</surname>
          <given-names>Bao Sheng</given-names>
        </name>
        <degrees>Mphil</degrees>
        <xref rid="aff1" ref-type="aff">1</xref>
        <ext-link ext-link-type="orcid">http://orcid.org/0000-0001-6310-1608</ext-link>
      </contrib>
      <contrib contrib-type="author" id="contrib2" equal-contrib="yes">
        <name name-style="western">
          <surname>Stillwell</surname>
          <given-names>David</given-names>
        </name>
        <degrees>PhD</degrees>
        <xref rid="aff2" ref-type="aff">2</xref>
        <ext-link ext-link-type="orcid">http://orcid.org/0000-0003-0174-3212</ext-link>
      </contrib>
      <contrib contrib-type="author" id="contrib3" corresp="yes" equal-contrib="yes">
      <name name-style="western">
        <surname>Gibbons</surname>
        <given-names>Chris</given-names>
      </name>
      <degrees>PhD</degrees>
      <xref rid="aff2" ref-type="aff">2</xref>
      <address>
        <institution>The Psychometrics Centre</institution>
        <institution>Judge Business School</institution>
        <institution>University of Cambridge</institution>
        <addr-line>Trumpington Street</addr-line>
        <addr-line>Cambridge,</addr-line>
        <country>United Kingdom</country>
        <phone>44 01223765203</phone>
        <email>cg598@cam.ac.uk</email>
      </address>  
      <xref rid="aff3" ref-type="aff">3</xref>
      <ext-link ext-link-type="orcid">http://orcid.org/0000-0002-4732-7305</ext-link></contrib>
    </contrib-group>
    <aff id="aff1">
    <sup>1</sup>
    <institution>School of Psychology</institution>
    <institution>University of Cambridge</institution>  
    <addr-line>Cambridge</addr-line>
    <country>United Kingdom</country></aff>
    <aff id="aff2">
    <sup>2</sup>
    <institution>The Psychometrics Centre</institution>
    <institution>Judge Business School</institution>  
    <institution>University of Cambridge</institution>  
    <addr-line>Cambridge</addr-line>
    <country>United Kingdom</country></aff>
    <aff id="aff3">
    <sup>3</sup>
    <institution>Cambridge Centre for Health Services Research</institution>
    <institution>Cambridge School of Clinical Medicine</institution>  
    <institution>University of Cambridge</institution>  
    <addr-line>Cambridge</addr-line>
    <country>United Kingdom</country></aff>
    <author-notes>
      <corresp>Corresponding Author: Chris Gibbons 
      <email>cg598@cam.ac.uk</email></corresp>
    </author-notes>
    <pub-date pub-type="collection"><month>09</month><year>2017</year></pub-date>
    <pub-date pub-type="epub">
      <day>20</day>
      <month>09</month>
      <year>2017</year>
    </pub-date>
    <volume>19</volume>
    <issue>9</issue>
    <elocation-id>e302</elocation-id>
    <!--history from ojs - api-xml-->
    <history>
      <date date-type="received">
        <day>6</day>
        <month>2</month>
        <year>2017</year>
      </date>
      <date date-type="rev-request">
        <day>12</day>
        <month>4</month>
        <year>2017</year>
      </date>
      <date date-type="rev-recd">
        <day>22</day>
        <month>5</month>
        <year>2017</year>
      </date>
      <date date-type="accepted">
        <day>29</day>
        <month>5</month>
        <year>2017</year>
      </date>
    </history>
    <!--(c) the authors - correct author names and publication date here if necessary. Date in form ', dd.mm.yyyy' after jmir.org-->
    <copyright-statement>©Bao Sheng Loe, David Stillwell, Chris Gibbons. Originally published in the Journal of Medical Internet Research (http://www.jmir.org), 20.09.2017.</copyright-statement>
    <copyright-year>2017</copyright-year>
    <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
      <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in the Journal of Medical Internet Research, is properly cited. The complete bibliographic information, a link to the original publication on http://www.jmir.org/, as well as this copyright and license information must be included.</p>
    </license>  
    <self-uri xlink:href="http://www.jmir.org/2017/9/e302/" xlink:type="simple"/>
    <abstract>
      <sec sec-type="background">
        <title>Background</title>
        <p>The Center for Epidemiologic Studies Depression Scale (CES-D) is a measure of depressive symptomatology which is widely used internationally. Though previous attempts were made to shorten the CES-D scale, few have attempted to develop a Computerized Adaptive Test (CAT) version for the CES-D.</p>
      </sec>
      <sec sec-type="objective">
        <title>Objective</title>
        <p>The aim of this study was to provide evidence on the efficiency and accuracy of the CES-D when administered using CAT using an American sample group.</p>
      </sec>
      <sec sec-type="methods">
        <title>Methods</title>
        <p>We obtained a sample of 2060 responses to the CESD-D from US participants using the myPersonality application. The average age of participants was 26 years (range 19-77). We randomly split the sample into two groups to evaluate and validate the psychometric models. We used evaluation group data (n=1018) to assess dimensionality with both confirmatory factor and Mokken analysis. We conducted further psychometric assessments using item response theory (IRT), including assessments of item and scale fit to Samejima’s graded response model (GRM), local dependency and differential item functioning. We subsequently conducted two CAT simulations to evaluate the CES-D CAT using the validation group (n=1042).</p>
      </sec>
      <sec sec-type="results">
        <title>Results</title>
        <p>Initial CFA results indicated a poor fit to the model and Mokken analysis revealed 3 items which did not conform to the same dimension as the rest of the items. We removed the 3 items and fit the remaining 17 items to GRM. We found no evidence of differential item functioning (DIF) between age and gender groups. Estimates of the level of CES-D trait score provided by the simulated CAT algorithm and the original CES-D trait score derived from original scale were correlated highly. The second CAT simulation conducted using real participant data demonstrated higher precision at the higher levels of depression spectrum.</p>
      </sec>
      <sec sec-type="conclusions">
        <title>Conclusions</title>
        <p>Depression assessments using the CES-D CAT can be more accurate and efficient than those made using the fixed-length assessment.</p>
      </sec>
    </abstract>
    <kwd-group>
      <kwd>depression</kwd>
      <kwd>assessment</kwd>
      <kwd>psychometrics</kwd>
      <kwd>patient reported outcome measures</kwd>
      <kwd>patient outcome assessment</kwd>
    </kwd-group></article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <p>The Center for Epidemiologic Studies Depression Scale (CES-D) is a commonly used 20-item self-rating scale designed to measure depressive symptomatology in both clinical and non-clinical settings [<xref ref-type="bibr" rid="ref1">1</xref>]. It is used in both epidemiological research and as a diagnostic screening tool [<xref ref-type="bibr" rid="ref2">2</xref>,<xref ref-type="bibr" rid="ref3">3</xref>].</p>
      <p>Despite much debate on the cut-off score which yield better sensitivities and specificities [<xref ref-type="bibr" rid="ref3">3</xref>,<xref ref-type="bibr" rid="ref4">4</xref>], it is commonly accepted that persons who score 16 or above on the CES-D’s 0 to 60 scale are likely to be clinically depressed [<xref ref-type="bibr" rid="ref5">5</xref>,<xref ref-type="bibr" rid="ref6">6</xref>]. While some authors have suggested that the CES-D has a four-factor structure, it appears to provide meaningful measurement along a single dimension [<xref ref-type="bibr" rid="ref7">7</xref>]. Hence, this level of internal consistency suggests that the CES-D should be used as an overall scale to measure a single latent construct—depressive symptoms [<xref ref-type="bibr" rid="ref8">8</xref>].</p>
      <p>Although the fixed-length version of the CES-D is widely used, recent developments in the availability of software to conduct advanced psychometric analyses and to develop computer adaptive assessments bring new opportunities for advanced Internet-based depressive symptom assessment. Computerized Adaptive Testing (CAT), refers to an algorithm-based assessment protocol which iteratively matches participants in a psychometric assessment with the most relevant item for them. Conducting assessments in this manner often reduces the number of items which need to be administered in an assessment, reducing the length of assessments by as much as 82%, compared to fixed-length measures of the same construct [<xref ref-type="bibr" rid="ref9">9</xref>-<xref ref-type="bibr" rid="ref11">11</xref>]. CAT typically relies on item parameter information derived from item-response theory. A large number of item-response theory models are suitable for developing item banks including the graded response model (GRM), the Rasch family of models as well as multidimensional models [<xref ref-type="bibr" rid="ref12">12</xref>,<xref ref-type="bibr" rid="ref13">13</xref>].</p>
      <p>As well as demonstrable increases in efficiency, CATs can deal with other issues which prohibit accurate measurement using static questionnaires. For example, CATs are able to adjust for demographic differences in the interpretations of items commonly seen between different groups and known as differential item functioning (DIF) [<xref ref-type="bibr" rid="ref14">14</xref>-<xref ref-type="bibr" rid="ref16">16</xref>]. It is also possible to account for issues caused by items being <italic>too</italic> similar which can spuriously inflate assessment reliability [<xref ref-type="bibr" rid="ref17">17</xref>].</p>
      <p>An investigation conducted by Smit et al [<xref ref-type="bibr" rid="ref10">10</xref>] demonstrated that the CES-D items make suitable candidates for CAT administration in a sample of Dutch adolescents aged between 12 and 17 [<xref ref-type="bibr" rid="ref18">18</xref>]. The study shows that CAT administration could approach the reliability of the paper-based measures using fewer than half the items on the original. Other CATs have developed novel item banks to create CATs of depression, including the D-CAT [<xref ref-type="bibr" rid="ref19">19</xref>,<xref ref-type="bibr" rid="ref20">20</xref>] and PROMIS depression item banks [<xref ref-type="bibr" rid="ref21">21</xref>]. These item banks show similar performance, arriving at reliable estimates of depressive symptomology using fewer than 10 items. Though both using legacy questionnaires to “feed” CATs and developing item banks specifically for that purpose have advantages and disadvantages. One advantages of using the CES-D for CAT is that it is not only well known and widely understood but it is also freely available in the public domain, allowing its use as a CAT assessment without incurring additional fees or reliance on restrictive proprietary software.</p>
      <p>Thus, this paper aims to validate the CES-D assessment for use as a Web-based CAT using a sample taken from the US general population which will allow patients, clinicians, and other members of the public to evaluate depression symptomology efficiently and precisely online.</p>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Participants</title>
        <p>We recruited 2060 individuals who completed the CES-D scale via the myPersonality application [<xref ref-type="bibr" rid="ref22">22</xref>]. MyPersonality is a Facebook application that allowed Facebook users to complete psychological tests and receive feedback on their scores. Users of the myPersonality application provided opt-in consent to allow us to record their assessment scores in exchange for the opportunity to receive feedback, which can be later shared online. The sample was divided into two groups using a randomly generated numeric string (random.org) for analysis. The first group is used for evaluation of the CES-D scale (n=1018). The second group is used for validating the CAT results based the calibration of the item parameters derived from the evaluation sample (n=1042). The samples were independent from one another. For group 1, there were 65.52% (665/1018) 6 females and 34.39% (348/1012) males. The mean age of the participants was 26 years (SD 12.12). For group 2, there were 65.93% (687/1042) females and 33.69% (351/1042) males. The mean age for participants was 25.86 (SD 10.44). Five participants from group 1 and 4 participants from group 2 did not reveal their gender. All individuals reported that they were from the United States.</p>
      </sec>
      <sec>
        <title>Measure</title>
        <p>The CES-D is a self-report questionnaire which measures severity of depression from the perspective of the individual (see <xref ref-type="app" rid="app1">Multimedia Appendix 1</xref>). Subjects responded to the CES-D by indicating on a 4-point Likert-scale stating how often each depressive symptom occurred during the past week (0=rarely or none of the time, 1=some of the time, 2=much of the time, 3=most or all the time). The potential range of scores is from 0 to 60, with higher scores indicating higher levels of depressive symptomology.</p>
        <p>The CES-D scale is a well validated and widely used instrument in many studies internationally [<xref ref-type="bibr" rid="ref23">23</xref>-<xref ref-type="bibr" rid="ref25">25</xref>]. Reliability and validity of the scale has been tested in both general and clinical populations [<xref ref-type="bibr" rid="ref1">1</xref>]. Previous results show that the 20-item scale yields good internal consistency for the general population (Cronbach alpha=.85) and for a psychiatric population (Cronbach alpha=.90) [<xref ref-type="bibr" rid="ref26">26</xref>]. Adequate test-retest reliability was found over 2 to 8-week period and 3 to 12-month period, respectively [<xref ref-type="bibr" rid="ref26">26</xref>,<xref ref-type="bibr" rid="ref27">27</xref>]. Convergent validity was supported by the significant correlations with other scales designed to assess depression symptoms [<xref ref-type="bibr" rid="ref18">18</xref>,<xref ref-type="bibr" rid="ref19">19</xref>,<xref ref-type="bibr" rid="ref28">28</xref>,<xref ref-type="bibr" rid="ref29">29</xref>]. The CES-D scale is available to use in the public domain and free to use without restriction.</p>
      </sec>
      <sec>
        <title>Data Analysis</title>
        <p>The internal consistency of the CES-D scale was determined using the Cronbach alpha statistic [<xref ref-type="bibr" rid="ref30">30</xref>], confirmatory factor analysis (CFA) was first performed to determine the structure of the model. The maximum-likelihood estimator was in the confirmatory analyses. Four fit indices were used in this study: chi-square statistics [<xref ref-type="bibr" rid="ref31">31</xref>]; the Comparative fit index (CFI, [<xref ref-type="bibr" rid="ref32">32</xref>]), the Tucker Lewis Index (TLI, Tucker and Lewis 1973), and the root-mean-square error of approximation (RMSEA, [<xref ref-type="bibr" rid="ref33">33</xref>]). The chi-square statistics indicates whether the observed covariance matrix is similar to the predicted covariance matrix. However, the result is liable to bias in large sample sizes [<xref ref-type="bibr" rid="ref34">34</xref>]. As such, other criteria such as absolute and comparative fix indices are used to evaluate the model. The CFI and TLI indices are the relative reduction in lack of fit of an observed model versus an independent model; with values of 0.90 or greater indicating an adequate fit [<xref ref-type="bibr" rid="ref35">35</xref>]. For RMSEA [<xref ref-type="bibr" rid="ref33">33</xref>], values less than 0.05 indicate good fit, and values greater than 0.10 as indication of poor fit of a model after accounting for degrees of freedom of the model.</p>
        <p>Subsequently, Mokken analysis was used to provide further insight into the scale’s factor structure and the scalability of the items [<xref ref-type="bibr" rid="ref36">36</xref>,<xref ref-type="bibr" rid="ref37">37</xref>]. Following Mokken analysis, data were analyzed using GRM [<xref ref-type="bibr" rid="ref38">38</xref>], which has been shown to be suitable for calibrating items for use as CAT assessments [<xref ref-type="bibr" rid="ref39">39</xref>]. Item discrimination values ranging from 0.64 to 1.34 were considered to be moderately discriminative, and values 1.35 or greater are highly discriminative [<xref ref-type="bibr" rid="ref40">40</xref>].</p>
        <p>Following the protocol set out by the PROMIS investigators [<xref ref-type="bibr" rid="ref41">41</xref>], we assessed the assumptions of GRM and made modifications, where necessary, to the scale to resolve breaches of model assumptions, which are detailed below.</p>
        <p>Local independence of items was assessed using Yen’s Q3 method of correlated residuals. Item residual correlations above .20 were considered indicative of local dependence between items [<xref ref-type="bibr" rid="ref42">42</xref>]. Different strategies exist for managing items with local dependency, which including removing the items from the scale completely or collapsing the items into a testlet.</p>
        <p>The DIF analysis using the lordif package was conducted for age and gender groups to identify measurement biases between groups [<xref ref-type="bibr" rid="ref43">43</xref>]. The lordif package utilizes ordinal logistic regression methods to calculate DIF [<xref ref-type="bibr" rid="ref44">44</xref>]. DIF is observed when the probability of answering a specific item correctly is not the same for individuals with the same level of depressive symptoms but who belong to a different demographic group [<xref ref-type="bibr" rid="ref15">15</xref>]. For example, male and female participants may both have equal levels of depressive symptoms, but if the certain items are interpreted differently between groups then observed mean scores may incorrectly show that one group has higher levels of depressive symptoms than the other because of an artefact of their gender that was not adequately controlled for within the test. Hence, DIF is used to identify items with unwanted bias and indicate that the same item sets and parameters might be needed for different diagnostic groups [<xref ref-type="bibr" rid="ref16">16</xref>].</p>
        <p>We conducted DIF analysis to assess item invariance with respect to age and gender. Two criteria were adopted in this study to detect meaningful DIF: changes in the beta [<xref ref-type="bibr" rid="ref43">43</xref>] and the pseudo R-square [<xref ref-type="bibr" rid="ref45">45</xref>]. Values ranging from 5% to 10% beta change and pseudo R-squared &#62;.13 suggest that meaningful DIF exist for a particular item [<xref ref-type="bibr" rid="ref43">43</xref>,<xref ref-type="bibr" rid="ref45">45</xref>,<xref ref-type="bibr" rid="ref46">46</xref>]. For our study, items with beta change of above &#62;1% was flagged for DIF. We divided the sample into 2 groups based on the mean age (26 years) of the sample. Participants who were younger than mean age were placed in the first group (n=399) and those that were older than the mean age were placed in the second group (n=200). For gender groups, all the males were in the first group (n=348), whereas all the females were in second group (n=665). Participants who did not wish to reveal their gender (n=9) were excluded from the DIF analysis as there were too few to create an adequate additional group.</p>
        <p>We evaluated the impact of DIF on the CES-D scores by recalibrating the items to the GRM model using the DIF-adjusted item parameters [<xref ref-type="bibr" rid="ref47">47</xref>]. The person scores were recalculated based on these parameters. Finally, the strength of the association between the DIF-adjusted person score and original person score were evaluated using Pearson correlation. A high correlation would suggest that adjusting for DIF would make negligible differences in the person scores, and as such, could be ignored [<xref ref-type="bibr" rid="ref48">48</xref>]. A low correlation between the DIF-adjusted person scores and original person scores suggest that the DIF makes a meaningful difference on the final scores and that group-specific parameters should be used when developing a CAT.</p>
      </sec>
      <sec>
        <title>Establishing Evaluation of CES-D CAT Simulation</title>
        <p>Two simulations were conducted to evaluate the properties of the item pool and the CAT algorithm. The first simulation employed simulated responses from various levels of the latent trait derived from participants who completed the full CES-D scale to determine the average number of items that had to be administered.</p>
        <p>The second simulations were respondents from the validation group and thus, the simulations were conducted using real data. The item parameter estimates used in the CES-D CAT were derived from the evaluation group. The validation sample used in this simulation did not overlap with the evaluation sample used to calibrate the item bank. Nevertheless, the individuals of this sample completed the same CES-D items that had been employed in the construction of the item bank. As such, responses to all items in the item bank were available. Both the respondents’ latent trait levels and responses to individual items were used to estimate the number of items needed to administer in a CAT. Correlations with the simulated CAT score and their scores derived from the full CES-D were obtained for both groups.</p>
        <p>The maximum Fisher Information criterion was used for item selection [<xref ref-type="bibr" rid="ref49">49</xref>,<xref ref-type="bibr" rid="ref50">50</xref>]. The Bayesian modal estimation was used at the beginning of the CAT simulation to estimate ability [<xref ref-type="bibr" rid="ref51">51</xref>]. This approach temporarily assumes that the ability of the test takers is normally distributed. Once a mixed response pattern is obtained, the normal distribution assumption is no longer requires and thus, a non-Bayesian maximum likelihood estimation is used [<xref ref-type="bibr" rid="ref52">52</xref>]. Maximum likelihood estimation is subsequently used to estimate the final ability of the test taker [<xref ref-type="bibr" rid="ref49">49</xref>]. The major advantage of using maximum likelihood estimation of ability is that it can account for all the information in the test taker’s responses in conjunction with the information available on each test item. The stopping rule for both simulations were set at SE≤0.32, which roughly corresponds to a reliability value≥0.90 [<xref ref-type="bibr" rid="ref53">53</xref>].</p>
      </sec>
      <sec>
        <title>Software</title>
        <p>Analyses were all conducted using the R Statistical Computing Environment [<xref ref-type="bibr" rid="ref54">54</xref>]. Individual packages were loaded to conduct CFA (“lavaan,” [<xref ref-type="bibr" rid="ref55">55</xref>]), Mokken (“mokken,” [<xref ref-type="bibr" rid="ref56">56</xref>]) and item response theory (IRT) including CAT simulations (“mirt,” [<xref ref-type="bibr" rid="ref57">57</xref>] and “catR” [Magis and Raîche, 2011]).</p>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>Confirmatory Factor Analysis</title>
        <p>Confirmatory factor analysis (CFA) was employed to investigate the unidimensionality of the CES-D scale. <xref ref-type="table" rid="table1">Table 1</xref> lists the mean, standard deviation, and the factor loadings of the CES-D items, revealing no reason for concern about the multivariate distribution of the data. Therefore, the model was estimated using the maximum likelihood method. As shown, the factor loadings are above the recommended threshold of .3 (Kline, 2013).</p>
        <p>Initial CFA results indicate a poor fit to the model (χ<sup>2</sup><sub>8.4</sub>, <italic>P</italic>&#60;.05; TLI=0.94; CFI=0.86; and RMSEA=0.09 (95% CI=0.08-0.09)).</p>
      </sec>
      <sec>
        <title>Unidimensionality</title>
        <p>We used Mokken analysis to further explore the dimensional structure of the CES-D and identify the potential sources of multidimensionality identified with the CFA. The evaluation of item homogeneity is based on the Loevinger’s <italic>H</italic> coefficient [<xref ref-type="bibr" rid="ref58">58</xref>]. Scalability is considered to be sufficient for both items and the scale where Loevinger’s <italic>H</italic> is equal to or greater than 0.30 [<xref ref-type="bibr" rid="ref59">59</xref>]. We found that items 2, 11, and 15 displayed item coefficients of homogeneity&#60;0.3. Hence, these items were eliminated from further analysis. This strategy was repeated and all the items were found to be above the recommended threshold, which conformed to a single dimension with Loevinger’s coefficient of homogeneity at a scale level of 0.43 (<xref ref-type="table" rid="table2">Table 2</xref>).</p>
        <table-wrap position="float" id="table1">
          <label>Table 1</label>
          <caption>
            <p>Factor loadings and item descriptive statistics for the CES-D scale.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="250"/>
            <col width="250"/>
            <col width="250"/>
            <col width="250"/>
            <thead>
              <tr valign="top">
                <td>Item no.</td>
                <td>Mean</td>
                <td>SD</td>
                <td>Factor loadings</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>q1</td>
                <td>2.09</td>
                <td>0.95</td>
                <td>0.53</td>
              </tr>
              <tr valign="top">
                <td>q2</td>
                <td>1.94</td>
                <td>1.04</td>
                <td>0.40</td>
              </tr>
              <tr valign="top">
                <td>q3</td>
                <td>2.22</td>
                <td>1.07</td>
                <td>0.81</td>
              </tr>
              <tr valign="top">
                <td>q4</td>
                <td>2.34</td>
                <td>1.06</td>
                <td>0.58</td>
              </tr>
              <tr valign="top">
                <td>q5</td>
                <td>2.67</td>
                <td>1.00</td>
                <td>0.51</td>
              </tr>
              <tr valign="top">
                <td>q6</td>
                <td>2.42</td>
                <td>1.04</td>
                <td>0.85</td>
              </tr>
              <tr valign="top">
                <td>q7</td>
                <td>2.48</td>
                <td>1.01</td>
                <td>0.49</td>
              </tr>
              <tr valign="top">
                <td>q8</td>
                <td>2.43</td>
                <td>0.99</td>
                <td>0.56</td>
              </tr>
              <tr valign="top">
                <td>q9</td>
                <td>2.16</td>
                <td>1.09</td>
                <td>0.70</td>
              </tr>
              <tr valign="top">
                <td>q10</td>
                <td>2.09</td>
                <td>1.03</td>
                <td>0.54</td>
              </tr>
              <tr valign="top">
                <td>q11</td>
                <td>2.57</td>
                <td>1.11</td>
                <td>0.42</td>
              </tr>
              <tr valign="top">
                <td>q12</td>
                <td>2.31</td>
                <td>0.94</td>
                <td>0.72</td>
              </tr>
              <tr valign="top">
                <td>q13</td>
                <td>2.25</td>
                <td>1.01</td>
                <td>0.60</td>
              </tr>
              <tr valign="top">
                <td>q14</td>
                <td>2.76</td>
                <td>1.07</td>
                <td>0.69</td>
              </tr>
              <tr valign="top">
                <td>q15</td>
                <td>1.90</td>
                <td>0.92</td>
                <td>0.41</td>
              </tr>
              <tr valign="top">
                <td>q16</td>
                <td>2.36</td>
                <td>0.98</td>
                <td>0.71</td>
              </tr>
              <tr valign="top">
                <td>q17</td>
                <td>1.77</td>
                <td>0.96</td>
                <td>0.54</td>
              </tr>
              <tr valign="top">
                <td>q18</td>
                <td>2.59</td>
                <td>0.99</td>
                <td>0.80</td>
              </tr>
              <tr valign="top">
                <td>q19</td>
                <td>2.30</td>
                <td>1.07</td>
                <td>0.63</td>
              </tr>
              <tr valign="top">
                <td>q20</td>
                <td>2.51</td>
                <td>1.01</td>
                <td>0.58</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
        <table-wrap position="float" id="table2">
          <label>Table 2</label>
          <caption>
            <p>Loevinger’s coefficient of homogeneity at an item-level.</p>
          </caption>
          <table width="1000" cellpadding="6" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="200"/>
            <col width="200"/>
            <col width="200"/>
            <col width="200"/>
            <col width="200"/>
            <thead>
              <tr valign="top">
                <td>Item</td>
                <td>Mean</td>
                <td>Item H (H<sub>i</sub>)<sup>a</sup></td>
                <td>Standard Error</td>
                <td>Dimensionality</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>1</td>
                <td>2.09</td>
                <td>0.38</td>
                <td>0.02</td>
                <td>1</td>
              </tr>
              <tr valign="top">
                <td>3</td>
                <td>2.22</td>
                <td>0.55</td>
                <td>0.01</td>
                <td>1</td>
              </tr>
              <tr valign="top">
                <td>4</td>
                <td>2.34</td>
                <td>0.41</td>
                <td>0.02</td>
                <td>1</td>
              </tr>
              <tr valign="top">
                <td>5</td>
                <td>2.67</td>
                <td>0.38</td>
                <td>0.02</td>
                <td>1</td>
              </tr>
              <tr valign="top">
                <td>6</td>
                <td>2.42</td>
                <td>0.57</td>
                <td>0.01</td>
                <td>1</td>
              </tr>
              <tr valign="top">
                <td>7</td>
                <td>2.48</td>
                <td>0.35</td>
                <td>0.02</td>
                <td>1</td>
              </tr>
              <tr valign="top">
                <td>8</td>
                <td>2.43</td>
                <td>0.39</td>
                <td>0.02</td>
                <td>1</td>
              </tr>
              <tr valign="top">
                <td>9</td>
                <td>2.16</td>
                <td>0.49</td>
                <td>0.02</td>
                <td>1</td>
              </tr>
              <tr valign="top">
                <td>10</td>
                <td>2.10</td>
                <td>0.39</td>
                <td>0.02</td>
                <td>1</td>
              </tr>
              <tr valign="top">
                <td>12</td>
                <td>2.31</td>
                <td>0.50</td>
                <td>0.02</td>
                <td>1</td>
              </tr>
              <tr valign="top">
                <td>13</td>
                <td>2.25</td>
                <td>0.42</td>
                <td>0.02</td>
                <td>1</td>
              </tr>
              <tr valign="top">
                <td>14</td>
                <td>2.76</td>
                <td>0.48</td>
                <td>0.02</td>
                <td>1</td>
              </tr>
              <tr valign="top">
                <td>16</td>
                <td>1.90</td>
                <td>0.49</td>
                <td>0.02</td>
                <td>1</td>
              </tr>
              <tr valign="top">
                <td>17</td>
                <td>2.36</td>
                <td>0.40</td>
                <td>0.02</td>
                <td>1</td>
              </tr>
              <tr valign="top">
                <td>18</td>
                <td>1.77</td>
                <td>0.55</td>
                <td>0.01</td>
                <td>1</td>
              </tr>
              <tr valign="top">
                <td>19</td>
                <td>2.60</td>
                <td>0.43</td>
                <td>0.02</td>
                <td>1</td>
              </tr>
              <tr valign="top">
                <td>20</td>
                <td>2.30</td>
                <td>0.41</td>
                <td>0.02</td>
                <td>1</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table2fn1">
              <p><sup>a</sup>Scale H=0.45.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
      <sec>
        <title>Graded Response Model</title>
        <p>Once we have established unidimensionality using Mokken analysis. We fitted the remaining 17 items to Samejima’s GRM (<xref ref-type="table" rid="table3">Table 3</xref>). The slope and threshold parameters in the GRM are used describe the relationship between each item and overall depressive symptom severity. The slope parameter reflects how well the items discriminate between respondents with or without depressive symptoms. The item discrimination values (alpha) ranged from a high of alpha=3.70 (item 5) to a relative low, but still strong, alpha=1.13 (item 7). The threshold parameter describes the endorsement of depressive symptoms, with larger values indicating greater levels of depressive symptoms. The thresholds for the lowest item category (b1) ranged from −3.31 (item 18) to 0.15 (item 17) on a z-score scale, indicating low to average levels of depressive symptoms, relative to the rest of our sample, for the individuals who endorsed the lowest CES-D category. The thresholds for the highest CES-D category (b3) ranged from 3.50 (item 3) to 1.25 (item 14), indicating moderate to high levels of depressive symptoms. All the standard errors of the <italic>b</italic> estimates were considered marginal, indicating that the items were normally distributed. An item fit analysis was conducted to identify any misfits. However, the results indicated that the remaining items fitted the model. Examination of the factor loadings revealed that all items loaded significantly (&#62;.50) on the single factor. Therefore, this model described the data adequately.</p>
      </sec>
      <sec>
        <title>Local independence</title>
        <p>Local dependency was apparently between items 18,12, and 16 as well as items 1, 19, and 15. Items 8, 12, and 16 were grouped as testlet 1, and items 19, and 15 were grouped as testlet 2. We observed the item residual correlation and found that item 4 was still correlated (&#62;0.2) with the first testlet. Hence, we grouped item 4 together with the first testlet and repeated the analysis, resulting in no correlated residuals greater than 0.2. Within the IRT framework, the fit indices based on the limited information M<sub>2</sub> statistic was used to assess the model fit [<xref ref-type="bibr" rid="ref60">60</xref>]. The result shows that the RMSEA was at 0.065 (95% CI 0.06-0.07), and comparative indices (TLI=0.96, CFI=0.97) were above the recommended threshold [<xref ref-type="bibr" rid="ref35">35</xref>].</p>
        <p><xref ref-type="fig" rid="figure1">Figure 1</xref> displays the test information curve for the IRT GRM. The test characteristics curve is simply the additive of the scores associated with increasing levels of depressive symptoms. The test information is at its highest (18.71) when the theta level is slightly above 0, while the lowest around of information can be found at both tails of the <italic>x</italic>-axis. Hence, the CES-D scale is most precise in estimating the underlying trait when the theta level is approximately zero (average).</p>
        <table-wrap position="float" id="table3">
          <label>Table 3</label>
          <caption>
            <p>Parameter estimates and factor loadings for the 17 items of the CES-D Scale.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="165"/>
            <col width="165"/>
            <col width="165"/>
            <col width="165"/>
            <col width="165"/>
            <col width="150"/>
            <thead>
              <tr valign="top">
                <td>Item</td>
                <td>a</td>
                <td>b1</td>
                <td>b2</td>
                <td>b3</td>
                <td>Factor 1</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Item 1</td>
                <td>1.22 (0.09)</td>
                <td>−0.97 (0.09)</td>
                <td>0.93 (0.09)</td>
                <td>2.85 (0.15)</td>
                <td>0.58</td>
              </tr>
              <tr valign="top">
                <td>Item 3</td>
                <td>3.15 (0.18)</td>
                <td>−1.56 (0.15)</td>
                <td>1.14 (0.15)</td>
                <td>3.50 (0.21)</td>
                <td>0.88</td>
              </tr>
              <tr valign="top">
                <td>Item 4</td>
                <td>1.45 (0.09)</td>
                <td>−1.31 (0.10)</td>
                <td>0.20 (0.09)</td>
                <td>2.16 (0.12)</td>
                <td>0.65</td>
              </tr>
              <tr valign="top">
                <td>Item 5</td>
                <td>1.14 (0.08)</td>
                <td>−2.13 (0.15)</td>
                <td>−0.38 (0.08)</td>
                <td>1.44 (0.10)</td>
                <td>0.56</td>
              </tr>
              <tr valign="top">
                <td>Item 6</td>
                <td>3.70 (0.22)</td>
                <td>−2.81 (0.21)</td>
                <td>0.37 (0.16)</td>
                <td>3.70 (0.24)</td>
                <td>0.91</td>
              </tr>
              <tr valign="top">
                <td>Item 7</td>
                <td>1.13 (0.07)</td>
                <td>−1.71 (0.10)</td>
                <td>0.04 (0.08)</td>
                <td>1.81 (0.10)</td>
                <td>0.55</td>
              </tr>
              <tr valign="top">
                <td>Item 8</td>
                <td>1.37 (0.09)</td>
                <td>−1.84 (0.11)</td>
                <td>0.19 (0.09)</td>
                <td>2.11 (0.12)</td>
                <td>0.63</td>
              </tr>
              <tr valign="top">
                <td>Item 9</td>
                <td>2.03 (0.12)</td>
                <td>−0.81 (0.11)</td>
                <td>0.86 (0.11)</td>
                <td>2.66 (0.15)</td>
                <td>0.77</td>
              </tr>
              <tr valign="top">
                <td>Item 10</td>
                <td>1.29 (0.09)</td>
                <td>−0.66 (0.09)</td>
                <td>0.79 (0.09)</td>
                <td>2.56 (0.13)</td>
                <td>0.60</td>
              </tr>
              <tr valign="top">
                <td>Item 12</td>
                <td>2.14 (0.13)</td>
                <td>−2.09 (0.15)</td>
                <td>0.65 (0.12)</td>
                <td>3.33 (0.18)</td>
                <td>0.78</td>
              </tr>
              <tr valign="top">
                <td>Item 13</td>
                <td>1.49 (0.09)</td>
                <td>−1.27 (0.10)</td>
                <td>0.58 (0.09)</td>
                <td>2.49 (0.13)</td>
                <td>0.66</td>
              </tr>
              <tr valign="top">
                <td>item 14</td>
                <td>1.98 (0.11)</td>
                <td>−2.59 (0.14)</td>
                <td>−0.70 (0.11)</td>
                <td>1.25 (0.11)</td>
                <td>0.76</td>
              </tr>
              <tr valign="top">
                <td>Item 16</td>
                <td>2.12 (0.13)</td>
                <td>−2.06 (0.14)</td>
                <td>0.44 (0.12)</td>
                <td>2.98 (0.16)</td>
                <td>0.78</td>
              </tr>
              <tr valign="top">
                <td>Item 17</td>
                <td>1.38 (0.10)</td>
                <td>0.15 (0.09)</td>
                <td>1.57 (0.11)</td>
                <td>3.24 (0.18)</td>
                <td>0.63</td>
              </tr>
              <tr valign="top">
                <td>Item 18</td>
                <td>2.89 (0.16)</td>
                <td>−3.31 (0.20)</td>
                <td>−0.34 (0.14)</td>
                <td>2.82 (0.18)</td>
                <td>0.86</td>
              </tr>
              <tr valign="top">
                <td>Item 19</td>
                <td>1.50 (0.10)</td>
                <td>−1.21 (0.10)</td>
                <td>0.41 (0.09)</td>
                <td>2.15 (0.12)</td>
                <td>0.66</td>
              </tr>
              <tr valign="top">
                <td>Item 20</td>
                <td>1.37 (0.09)</td>
                <td>−1.99 (0.12)</td>
                <td>0.09 (0.09)</td>
                <td>1.83 (0.11)</td>
                <td>0.63</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
        <fig id="figure1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>The test information of the CES-D scale.</p>
          </caption>
          <graphic xlink:href="jmir_v19i9e302_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <table-wrap position="float" id="table4">
          <label>Table 4</label>
          <caption>
            <p>CES-D CAT Simulation of respondents.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="200"/>
            <col width="80"/>
            <col width="80"/>
            <col width="80"/>
            <col width="80"/>
            <col width="80"/>
            <col width="80"/>
            <col width="80"/>
            <col width="80"/>
            <col width="80"/>
            <col width="80"/>
            <thead>
              <tr valign="top">
                <td>Measure</td>
                <td>D1<sup>a</sup></td>
                <td>D2</td>
                <td>D3</td>
                <td>D4</td>
                <td>D5</td>
                <td>D6</td>
                <td>D7</td>
                <td>D8</td>
                <td>D9</td>
                <td>D10</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Mean theta</td>
                <td>−1.70</td>
                <td>−1.04</td>
                <td>−0.69</td>
                <td>−0.37</td>
                <td>−0.09</td>
                <td>0.16</td>
                <td>0.40</td>
                <td>0.68</td>
                <td>1.01</td>
                <td>1.64</td>
              </tr>
              <tr valign="top">
                <td>RMSE<sup>b</sup></td>
                <td>0.29</td>
                <td>0.35</td>
                <td>0.31</td>
                <td>0.33</td>
                <td>0.32</td>
                <td>0.32</td>
                <td>0.30</td>
                <td>0.32</td>
                <td>0.34</td>
                <td>0.34</td>
              </tr>
              <tr valign="top">
                <td>Mean bias</td>
                <td>0.01</td>
                <td>0.00</td>
                <td>0.02</td>
                <td>0.00</td>
                <td>0.02</td>
                <td>0.02</td>
                <td>−0.03</td>
                <td>−0.05</td>
                <td>−0.07</td>
                <td>0.01</td>
              </tr>
              <tr valign="top">
                <td>Mean test length</td>
                <td>13.98</td>
                <td>12.34</td>
                <td>11.04</td>
                <td>9.50</td>
                <td>8.30</td>
                <td>7.70</td>
                <td>7.60</td>
                <td>8.18</td>
                <td>9.77</td>
                <td>13.09</td>
              </tr>
              <tr valign="top">
                <td>Mean standard error</td>
                <td>0.34</td>
                <td>0.34</td>
                <td>0.33</td>
                <td>0.34</td>
                <td>0.33</td>
                <td>0.33</td>
                <td>0.33</td>
                <td>0.34</td>
                <td>0.34</td>
                <td>0.34</td>
              </tr>
              <tr valign="top">
                <td>Number of simulees</td>
                <td>105</td>
                <td>104</td>
                <td>104</td>
                <td>104</td>
                <td>104</td>
                <td>104</td>
                <td>104</td>
                <td>104</td>
                <td>104</td>
                <td>105</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table4fn1">
              <p><sup>a</sup>D: decile.</p>
            </fn>
            <fn id="table4fn2">
              <p><sup>b</sup>RMSE: root mean square error</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
      <sec>
        <title>DIF Analysis</title>
        <p>DIF was not found between age groups. However, results indicated that item 14 (“I felt lonely”) showed moderate DIF for gender groups, with a beta change of more than 1% and a pseudo R-square of 0.08. When the DIF-adjusted person scores were calculated, the Pearson correlation between the original person scores and the DIF-adjusted person scores were 0.99. A <italic>t</italic> test analysis showed a non-significant mean difference with scores for DIF-adjusted person scores (mean=0.01, SD=0.88), and original person scores (mean=0.00, SD=0.97); <italic>t</italic><sub>2016.4</sub>=−0.15, <italic>P</italic>=.88.</p>
        <p>On the basis of these results, the conclusion arrived at was that statistically significant DIF was identified for item 14 using the two criteria of beta change and pseudo R-squared. However, the strength of association between the original person scores and the DIF-adjusted person scores were greater than 0.99. Therefore, the final decision was that any DIF found between the groups could be disregarded.</p>
      </sec>
      <sec>
        <title>Computer Adaptive Testing Simulation</title>
        <sec>
          <title>Simulation I</title>
          <p><xref ref-type="table" rid="table4">Table 4</xref> presents the results of the first simulation. In this analysis, the data were sorted into 10 equal parts, with each part representing one tenth of the sample group. There are appropriate 104 or 105 participants in each decile (D) rank (n=1042). The estimated average test length was 10.16 with SD of 2.34. The mean RMSE was .32 and the mean bias was −.0083. The lowest number of items administered to the simulees was in D5, with an average of 8.3 test items. The lowest and highest decile rank requires substantially more items (D1=13.98 items; D10=13.09 items) in order to reach the same target precision of SE≤0.32.</p>
        </sec>
        <sec>
          <title>Simulation II</title>
          <p>The second simulation study was conducted using the responses from a sample of real respondents (validation group) who completed the full CES-D scale. The stopping rule was set at SE≤0.32. The result of the second simulation can be found in <xref ref-type="table" rid="table5">Table 5</xref>. On average, 11.72 items with SD of 2.68 were required to estimate the latent trait at this level of precision. The mean RMSE was 1.14 and the mean bias was 0.18. Unlike the first simulation, only respondents in the lowest decile ranking required the administration of substantially more items to reach the specified level of precision (D1=14.76 items). Interestingly, there is a downward trend in the length of items from D9 (14.61 items) to D10 (8.41 items), indicating higher precision at higher levels of depressive symptoms with the use of lesser items.</p>
          <p>Further inspection of the item administration pattern (<xref ref-type="fig" rid="figure2">Figure 2</xref>), suggests a drop in the number of items required to estimate the latent trait accurately around. This could be due of the CAT algorithm selecting items with the highest information at every step, resulting in a quicker estimate of the latent trait. <xref ref-type="fig" rid="figure2">Figure 2</xref> shows the number of items administered by the CES-D CAT as a function of the standardized score of the depressive symptoms construct.</p>
          <p>Estimates of the level of CES-D trait score provided by the simulated CAT algorithm and the original CES-D trait score derived from original scale correlated highly (<italic>r</italic>=0.98). This indicates that a precise estimation of the latent trait is possible with substantial item savings using CAT approaches (<xref ref-type="fig" rid="figure3">Figure 3</xref>).</p>
          <p><xref ref-type="fig" rid="figure3">Figure 3</xref> shows exceptionally high correlation between the score from the CAT and the score given to the same participants when every item was completed.</p>
          <table-wrap position="float" id="table5">
            <label>Table 5</label>
            <caption>
              <p>CES-D CAT Simulation of CAT algorithm.</p>
            </caption>
            <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
              <col width="200"/>
              <col width="80"/>
              <col width="80"/>
              <col width="80"/>
              <col width="80"/>
              <col width="80"/>
              <col width="80"/>
              <col width="80"/>
              <col width="80"/>
              <col width="80"/>
              <col width="80"/>
              <thead>
                <tr valign="top">
                  <td>Measure</td>
                  <td>D1</td>
                  <td>D2</td>
                  <td>D3</td>
                  <td>D4</td>
                  <td>D5</td>
                  <td>D6</td>
                  <td>D7</td>
                  <td>D8</td>
                  <td>D9</td>
                  <td>D10</td>
                </tr>
              </thead>
              <tbody>
                <tr valign="top">
                  <td>Mean Theta</td>
                  <td>−1.70</td>
                  <td>−1.04</td>
                  <td>−0.69</td>
                  <td>−0.37</td>
                  <td>−0.09</td>
                  <td>0.16</td>
                  <td>0.40</td>
                  <td>0.68</td>
                  <td>1.01</td>
                  <td>1.64</td>
                </tr>
                <tr valign="top">
                  <td>RMSE</td>
                  <td>1.46</td>
                  <td>1.15</td>
                  <td>0.86</td>
                  <td>0.42</td>
                  <td>0.36</td>
                  <td>0.50</td>
                  <td>0.61</td>
                  <td>0.92</td>
                  <td>1.65</td>
                  <td>2.08</td>
                </tr>
                <tr valign="top">
                  <td>Mean bias</td>
                  <td>−1.45</td>
                  <td>−1.13</td>
                  <td>−0.82</td>
                  <td>−0.29</td>
                  <td>0.11</td>
                  <td>0.34</td>
                  <td>0.53</td>
                  <td>0.85</td>
                  <td>1.58</td>
                  <td>2.05</td>
                </tr>
                <tr valign="top">
                  <td>Mean test length</td>
                  <td>14.76</td>
                  <td>14.04</td>
                  <td>13.44</td>
                  <td>12.81</td>
                  <td>9.67</td>
                  <td>8.17</td>
                  <td>8.70</td>
                  <td>12.55</td>
                  <td>14.61</td>
                  <td>8.41</td>
                </tr>
                <tr valign="top">
                  <td>Mean standard error</td>
                  <td>0.42</td>
                  <td>0.34</td>
                  <td>0.33</td>
                  <td>0.33</td>
                  <td>0.33</td>
                  <td>0.33</td>
                  <td>0.34</td>
                  <td>0.34</td>
                  <td>0.33</td>
                  <td>0.37</td>
                </tr>
                <tr valign="top">
                  <td>Number of simulees</td>
                  <td>105</td>
                  <td>104</td>
                  <td>104</td>
                  <td>104</td>
                  <td>104</td>
                  <td>104</td>
                  <td>104</td>
                  <td>104</td>
                  <td>104</td>
                  <td>105</td>
                </tr>
              </tbody>
            </table>
          </table-wrap>
          <fig id="figure2" position="float">
            <label>Figure 2</label>
            <caption>
              <p>Relationship between number of items administered and level of depression (theta).</p>
            </caption>
            <graphic xlink:href="jmir_v19i9e302_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
          <fig id="figure3" position="float">
            <label>Figure 3</label>
            <caption>
              <p>Comparison of CES-D CAT scores with an IRT score computed from all items in the item bank.</p>
            </caption>
            <graphic xlink:href="jmir_v19i9e302_fig3.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
        </sec>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Principal Findings</title>
        <p>The psychometric properties of the CES-D measure were evaluated using a US sample. This sample was chosen to avoid issues of DIF across culture, and with the aim of providing an item bank which could be suitable for use within a clinical and research setting in the United States. The CES-D scale displayed excellent internal consistency based on the Cronbach alpha. The factor structure of the CES-D was subsequently evaluated using confirmatory factor and Mokken analysis. However, the results from the CFA indicated that the model provided an inadequate fit to the data. Mokken analysis identified three items as sources of multidimensionality in the CES-D. Items 2, 11, and 15 were considered to have poor fit and were subsequently removed from the analysis. Item 2 referred to “I did not feel like eating; my appetite was poor,” item 11 referred to “my sleep was restless,” and item 15 referred to “People were unfriendly.” The result showed that the final 17 items were found to be suitable for measuring a unidimensional trait and thus, the item parameters achieved from the remaining items allowed us to develop a computerized adaptive CES-D assessment.</p>
        <p>The CES-D scale was calibrated using the IRT approaches. Most IRT based models require that items measure a single underlying dimension and this condition was met based on the result of the Mokken analysis. Furthermore, IRT based frameworks made computer-adaptive CES-D possible with the estimated item parameters derived from IRT models. Simulated computer-adaptive administration of the item bank demonstrates the ability to estimate precise latent trait levels with similar or higher levels of internal reliability similar to the original scale but using fewer items. These results are commensurate with other research exploring the performance of the CES-D as a CAT in other contexts including adolescents and people with multimorbidity [<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref61">61</xref>] and for adaptive testing of depressive symptoms using the PROMIS system [<xref ref-type="bibr" rid="ref62">62</xref>].</p>
        <p>Unlike a test developed using classical test theory, in which the number of items is fixed and precision naturally varies between participants who have differing levels of latent ability, CAT fixes the precision while allowing the number of items to vary. CAT can only be conducted using computer administration and the items are previously calibrated with a suitable item response model. The steps to conducting a CAT are (1) administer an item, (2) compute the latent score and its standard error, (3) identify the next most informative item based on the current latent score estimate and IRT parameters, and (4) repeat steps 1-3 until the predefined stopping rule has been met.</p>
        <p>In our simulation studies, we found a very high correlation between the CAT scores obtained when all 17 items were administered and when the stopping rule was introduced (leading to a mean test length of 10 items). Moreover, at the extreme (higher) end of the latent trait continuum, it only requires 8 items to identify individuals with depressive symptoms. This encourages quicker assessment of depressive symptoms, which can help clinicians to identify potential groups of persons who may benefit from immediate medical intervention. In spite of substantial improvements in efficiency by employing the CAT procedure, little information is lost and scores are still estimated accurately. By comparison, the time taken to complete the CES-D CAT will be shorter than the original 20-item scale. This time saving may seem small as far as a single scale is concerned, but psychometric assessment usually involves multiple questionnaires and, from this perspective, substantial time saving is evident.</p>
      </sec>
      <sec>
        <title>Limitations and Future Research</title>
        <p>A limitation to the current research is the small number of items used to measure CES-D. With CAT, the precision of latent trait estimates increases with the number of items in the item bank. A smaller item bank gives fewer options for item selection and may results in reduced item variation between assessments. However, to apply stricter stopping-rule criteria means that the number of items necessary to complete the CES-D CAT will be about the same as completing all the original scale, thus, no extra benefit remains with the use of CES-D CAT. Therefore, while this study reports the stopping rule at less than or equal to 0.32, which is equivalent to a reliability of more than or equal to 0.90, the precision can still be heightened by increasing the test information. This can be achieved by adding more high-quality items to the item bank. Hence, future studies could evaluate the CAT system where new items are included as part of the test to increase the item bank and ensure that the performance of the CAT system is not compromised. The performance of the CAT algorithms can also be evaluated under “live” testing conditions rather than simulation of existing data to ensure that participants’ test performance under conventional ‘fixed length’ and adaptive conditions do not differ significantly.</p>
        <p>Compared with population-based samples used in the development of item banks elsewhere [<xref ref-type="bibr" rid="ref21">21</xref>], our sample was younger and had a greater proportion of women. Given the nature of the recruitment into the study via a voluntary online app it is not surprising that this sample is more reflective of a “digitally native” population of younger people. One important caveat of this research is therefore that our findings should not be extrapolated to a general population but rather support the growing body of literature demonstrating the suitability of the CES-D for adaptive testing in different group as a means of making measurement more precise and efficient while retaining an item bank that is familiar to clinicians.</p>
        <p>In this study, we assess the content validity of the CAT-administered CESD by comparing depressive symptom estimates from the full-length assessment with an adaptively administered version. Further research is required to establish to predictive validity of this tool for the correct classification of clinical depression to support its use in clinical contexts.</p>
        <p>There are some discussions about the factor structure of the CES-D and whether a single factor is appropriate for assessing depressive symptomatology. Several researchers have suggested that the CES-D scale is a measure of the underlying 4-factor structure [<xref ref-type="bibr" rid="ref1">1</xref>,<xref ref-type="bibr" rid="ref63">63</xref>,<xref ref-type="bibr" rid="ref64">64</xref>]. However, the construction of a 4-factor scale may be too challenging as psychometric test designed for health assessment aims to be as short as possible. Nevertheless, in the event that a 4-factor scale is developed for the CES-D, then a 4-factor CES-D CAT under the conditions of content balancing may be introduced. In other words, a proportionate sampling of items is taken from each of the factor domains, while ensuring unidimensionality is achieved [<xref ref-type="bibr" rid="ref52">52</xref>]. Researchers can thus consider new research avenues in which one could understand in finer gradient of the depressive symptoms.</p>
      </sec>
      <sec>
        <title>Conclusions</title>
        <p>Our findings presented in this study shows that the CES-D CAT is a precise and efficient tool for screening depressive symptoms. Furthermore, the measurements provided by CAT are more likely to result in more meaningful research conclusions than classical approaches. More informed decisions could also be made based on measurement data at an individual level rather than at a scale level.</p>
        <p>While increased complexity with regards to the test development is inevitable, the CES-D CAT has immediate advantages such as increased accuracy, exact interpretable, and shorter time spent over conventional testing approaches. Open source software such as the <italic>Concerto</italic> testing platform [<xref ref-type="bibr" rid="ref65">65</xref>] makes it more accessible than ever before for researchers to develop and implement their own CAT system. Furthermore, the CESD-CAT outperforms the paper-based versions of the CES-D in terms of reliability, length, and flexibility in which they may be administered in a clinical setting. CATs are more dynamic as they adjust accordingly to the ability level of the test taker, indicating both efficiency and effectiveness. Thus, the CES-D CAT is suitable to be administered as a primary tool for understanding and screening individuals in the US with depressive symptomatology.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group>
      <app id="app1">
        <title>Multimedia Appendix 1</title>
        <p>CES-D questions.</p>
        <media xlink:href="jmir_v19i9e302_app1.pdf" xlink:title="PDF File (Adobe PDF File), 12KB"/>
      </app>
    </app-group>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">CAT</term>
          <def>
            <p>Computerized Adaptive Test</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">CES-D</term>
          <def>
            <p>Center for Epidemiologic Studies Depression Scale</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">CFA</term>
          <def>
            <p>Confirmatory factor analysis</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">CFI</term>
          <def>
            <p>Comparative fit index</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">DIF</term>
          <def>
            <p>Differential item functioning</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb6">GRM</term>
          <def>
            <p>graded response model</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb7">IRT</term>
          <def>
            <p>item response theory</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb8">RMSEA</term>
          <def>
            <p>root-mean-square error of approximation</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb9">TLI</term>
          <def>
            <p>Tucker Lewis Index</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <fn-group>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Radloff</surname>
            <given-names>L</given-names>
          </name>
        </person-group>
        <article-title>The CES-D scale a self-report depression scale for research in the general population</article-title>
        <source>Appl Psychol Meas</source>  
        <year>1977</year>  
        <volume>1</volume>  
        <issue>3</issue>  
        <fpage>385</fpage>  
        <lpage>401</lpage>  
        <pub-id pub-id-type="doi">10.1177/014662167700100306</pub-id></nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Himmelfarb</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Murrell</surname>
            <given-names>SA</given-names>
          </name>
        </person-group>
        <article-title>Reliability and validity of five mental health scales in older persons</article-title>
        <source>J Gerontol</source>  
        <year>1983</year>  
        <volume>38</volume>  
        <issue>3</issue>  
        <fpage>333</fpage>  
        <lpage>339</lpage>  
        <pub-id pub-id-type="medline">6841929</pub-id></nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Myers</surname>
            <given-names>JK</given-names>
          </name>
          <name name-style="western">
            <surname>Weissman</surname>
            <given-names>MM</given-names>
          </name>
        </person-group>
        <article-title>Use of a self-report symptom scale to detect depression in a community sample</article-title>
        <source>The American Journal of Psychiatry</source>  
        <year>1980</year>  
        <volume>137</volume>  
        <issue>9</issue>  
        <fpage>1081</fpage>  
        <lpage>4</lpage>  
        <pub-id pub-id-type="medline">7425160</pub-id></nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Roberts</surname>
            <given-names>RE</given-names>
          </name>
        </person-group>
        <article-title>Reliability of the CES-D scale in different ethnic contexts</article-title>
        <source>Psychiatry Res</source>  
        <year>1980</year>  
        <volume>2</volume>  
        <issue>2</issue>  
        <fpage>125</fpage>  
        <lpage>34</lpage>  
        <pub-id pub-id-type="medline">6932058</pub-id></nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Comstock</surname>
            <given-names>GW</given-names>
          </name>
          <name name-style="western">
            <surname>Helsing</surname>
            <given-names>KJ</given-names>
          </name>
        </person-group>
        <article-title>Symptoms of depression in two communities</article-title>
        <source>Psychol Med</source>  
        <year>1977</year>  
        <volume>6</volume>  
        <issue>4</issue>  
        <fpage>551</fpage>  
        <lpage>63</lpage>  
        <pub-id pub-id-type="medline">1005571</pub-id></nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Hankin</surname>
            <given-names>JR</given-names>
          </name>
          <name name-style="western">
            <surname>Locke</surname>
            <given-names>BZ</given-names>
          </name>
        </person-group>
        <article-title>The persistence of depressive symptomatology among prepaid group practice enrollees: an exploratory study</article-title>
        <source>Am J Public Health</source>  
        <year>1982</year>  
        <volume>72</volume>  
        <issue>9</issue>  
        <fpage>1000</fpage>  
        <lpage>1007</lpage>  
        <pub-id pub-id-type="medline">7102848</pub-id></nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Shafer</surname>
            <given-names>AB</given-names>
          </name>
        </person-group>
        <article-title>Meta‐analysis of the factor structures of four depression questionnaires: Beck, CES‐D, Hamilton, and Zung</article-title>
        <source>J Clin Psychol</source>  
        <year>2006</year>  
        <volume>62</volume>  
        <issue>1</issue>  
        <fpage>123</fpage>  
        <lpage>46</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://doi.wiley.com/10.1002/jclp.20213"/>
        </comment>  
        <pub-id pub-id-type="medline">16287149</pub-id></nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Kohout</surname>
            <given-names>FJ</given-names>
          </name>
          <name name-style="western">
            <surname>Berkman</surname>
            <given-names>LF</given-names>
          </name>
          <name name-style="western">
            <surname>Evans</surname>
            <given-names>DA</given-names>
          </name>
          <name name-style="western">
            <surname>Cornoni-Huntley</surname>
            <given-names>J</given-names>
          </name>
        </person-group>
        <article-title>Two shorter forms of the CES-D (Center for Epidemiological Studies Depression) depression symptoms index</article-title>
        <source>J Aging Health</source>  
        <year>1993</year>  
        <month>05</month>  
        <volume>5</volume>  
        <issue>2</issue>  
        <fpage>179</fpage>  
        <lpage>93</lpage>  
        <pub-id pub-id-type="doi">10.1177/089826439300500202</pub-id>
        <pub-id pub-id-type="medline">10125443</pub-id></nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Gibbons</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Bower</surname>
            <given-names>P</given-names>
          </name>
          <name name-style="western">
            <surname>Lovell</surname>
            <given-names>K</given-names>
          </name>
          <name name-style="western">
            <surname>Valderas</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Skevington</surname>
            <given-names>S</given-names>
          </name>
        </person-group>
        <article-title>Electronic quality of life assessment using computer-adaptive testing</article-title>
        <source>J Med Internet Res</source>  
        <year>2016</year>  
        <month>09</month>  
        <day>30</day>  
        <volume>18</volume>  
        <issue>9</issue>  
        <fpage>e240</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.jmir.org/2016/9/e240/"/>
        </comment>  
        <pub-id pub-id-type="doi">10.2196/jmir.6053</pub-id>
        <pub-id pub-id-type="medline">27694100</pub-id>
        <pub-id pub-id-type="pii">v18i9e240</pub-id>
        <pub-id pub-id-type="pmcid">PMC5065679</pub-id></nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Smits</surname>
            <given-names>N</given-names>
          </name>
          <name name-style="western">
            <surname>Cuijpers</surname>
            <given-names>P</given-names>
          </name>
          <name name-style="western">
            <surname>van Straten</surname>
            <given-names>A</given-names>
          </name>
        </person-group>
        <article-title>Applying computerized adaptive testing to the CES-D scale: a simulation study</article-title>
        <source>Psychiatry Res</source>  
        <year>2011</year>  
        <month>06</month>  
        <day>30</day>  
        <volume>188</volume>  
        <issue>1</issue>  
        <fpage>147</fpage>  
        <lpage>55</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S0165-1781(10)00769-9"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1016/j.psychres.2010.12.001</pub-id>
        <pub-id pub-id-type="medline">21208660</pub-id>
        <pub-id pub-id-type="pii">S0165-1781(10)00769-9</pub-id></nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Hays</surname>
            <given-names>RD</given-names>
          </name>
          <name name-style="western">
            <surname>Morales</surname>
            <given-names>LS</given-names>
          </name>
          <name name-style="western">
            <surname>Reise</surname>
            <given-names>SP</given-names>
          </name>
        </person-group>
        <article-title>Item response theory and health outcomes measurement in the 21st century</article-title>
        <source>Medical care</source>  
        <year>2000</year>  
        <volume>38</volume>  
        <issue>9 Suppl</issue>  
        <fpage>1128</fpage>  
        <lpage>42</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.pubmedcentral.nih.gov/articlerender.fcgi?artid=1815384&#38;tool=pmcentrez&#38;rendertype=abstract"/>
        </comment>  
        <pub-id pub-id-type="medline">10982088</pub-id></nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Gibbons</surname>
            <given-names>RD</given-names>
          </name>
          <name name-style="western">
            <surname>Weiss</surname>
            <given-names>DJ</given-names>
          </name>
          <name name-style="western">
            <surname>Frank</surname>
            <given-names>E</given-names>
          </name>
          <name name-style="western">
            <surname>Kupfer</surname>
            <given-names>D</given-names>
          </name>
        </person-group>
        <article-title>Computerized adaptive diagnosis and testing of mental health disorders</article-title>
        <source>Annu Rev Clin Psychol</source>  
        <year>2016</year>  
        <volume>12</volume>  
        <fpage>83</fpage>  
        <lpage>104</lpage>  
        <pub-id pub-id-type="doi">10.1146/annurev-clinpsy-021815-093634</pub-id>
        <pub-id pub-id-type="medline">26651865</pub-id></nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Wahl</surname>
            <given-names>I</given-names>
          </name>
          <name name-style="western">
            <surname>Löwe</surname>
            <given-names>B</given-names>
          </name>
          <name name-style="western">
            <surname>Bjorner</surname>
            <given-names>JB</given-names>
          </name>
          <name name-style="western">
            <surname>Fischer</surname>
            <given-names>F</given-names>
          </name>
          <name name-style="western">
            <surname>Langs</surname>
            <given-names>G</given-names>
          </name>
          <name name-style="western">
            <surname>Voderholzer</surname>
            <given-names>U</given-names>
          </name>
          <name name-style="western">
            <surname>Aita</surname>
            <given-names>SA</given-names>
          </name>
          <name name-style="western">
            <surname>Bergemann</surname>
            <given-names>N</given-names>
          </name>
          <name name-style="western">
            <surname>Brähler</surname>
            <given-names>E</given-names>
          </name>
          <name name-style="western">
            <surname>Rose</surname>
            <given-names>M</given-names>
          </name>
        </person-group>
        <article-title>Standardization of depression measurement: a common metric was developed for 11 self-report depression measures</article-title>
        <source>J Clin Epidemiol</source>  
        <year>2014</year>  
        <volume>67</volume>  
        <issue>1</issue>  
        <fpage>86</fpage>  
        <pub-id pub-id-type="medline">24262771</pub-id></nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Bee</surname>
            <given-names>P</given-names>
          </name>
          <name name-style="western">
            <surname>Gibbons</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Callaghan</surname>
            <given-names>P</given-names>
          </name>
          <name name-style="western">
            <surname>Fraser</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Lovell</surname>
            <given-names>K</given-names>
          </name>
        </person-group>
        <article-title>Evaluating and quantifying user and carer involvement in mental health care planning (EQUIP): co-development of a new patient-reported outcome measure</article-title>
        <source>PLoS One</source>  
        <year>2016</year>  
        <volume>11</volume>  
        <issue>3</issue>  
        <fpage>e0149973</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://dx.plos.org/10.1371/journal.pone.0149973"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1371/journal.pone.0149973</pub-id>
        <pub-id pub-id-type="medline">26963252</pub-id>
        <pub-id pub-id-type="pii">PONE-D-15-26884</pub-id>
        <pub-id pub-id-type="pmcid">PMC4786101</pub-id></nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="book">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Holland</surname>
            <given-names>PW</given-names>
          </name>
          <name name-style="western">
            <surname>Wainer</surname>
            <given-names>H</given-names>
          </name>
        </person-group>
        <source>Differential item functioning</source>  
        <year>2012</year>  
        <publisher-loc>Hillsdale, NJ</publisher-loc>
        <publisher-name>Lawrence Erlbaum Associates, Inc</publisher-name></nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Tennant</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Penta</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Tesio</surname>
            <given-names>L</given-names>
          </name>
          <name name-style="western">
            <surname>Grimby</surname>
            <given-names>G</given-names>
          </name>
          <name name-style="western">
            <surname>Thonnard</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Slade</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Lawton</surname>
            <given-names>G</given-names>
          </name>
          <name name-style="western">
            <surname>Simone</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Carter</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Lundgren-Nilsson</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Tripolski</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Ring</surname>
            <given-names>H</given-names>
          </name>
          <name name-style="western">
            <surname>Biering-Sørensen</surname>
            <given-names>F</given-names>
          </name>
          <name name-style="western">
            <surname>Marincek</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Burger</surname>
            <given-names>H</given-names>
          </name>
          <name name-style="western">
            <surname>Phillips</surname>
            <given-names>S</given-names>
          </name>
        </person-group>
        <article-title>Assessing and adjusting for cross-cultural validity of impairment and activity limitation scales through differential item functioning within the framework of the Rasch model: the PRO-ESOR project</article-title>
        <source>Med Care</source>  
        <year>2004</year>  
        <month>01</month>  
        <volume>42</volume>  
        <issue>1 Suppl</issue>  
        <fpage>I37</fpage>  
        <lpage>48</lpage>  
        <pub-id pub-id-type="doi">10.1097/01.mlr.0000103529.63132.77</pub-id>
        <pub-id pub-id-type="medline">14707754</pub-id></nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Wright</surname>
            <given-names>BD</given-names>
          </name>
        </person-group>
        <article-title>Local dependency, correlations and principal components</article-title>
        <source>Rasch Measurement Transactions</source>  
        <year>1996</year>  
        <volume>10</volume>  
        <issue>3</issue>  
        <fpage>509</fpage>  
        <lpage>11</lpage> </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Smits</surname>
            <given-names>N</given-names>
          </name>
          <name name-style="western">
            <surname>Cuijpers</surname>
            <given-names>P</given-names>
          </name>
          <name name-style="western">
            <surname>van Straten</surname>
            <given-names>A</given-names>
          </name>
        </person-group>
        <article-title>Applying computerized adaptive testing to the CES-D scale: a simulation study</article-title>
        <source>Psychiatry Res Internet</source>  
        <year>2011</year>  
        <volume>188</volume>  
        <issue>1</issue>  
        <fpage>147</fpage>  
        <lpage>55</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.sciencedirect.com/science/article/pii/S0165178110007699"/>
        </comment>  
        <pub-id pub-id-type="medline">21208660</pub-id></nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Fliege</surname>
            <given-names>H</given-names>
          </name>
          <name name-style="western">
            <surname>Becker</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Walter</surname>
            <given-names>OB</given-names>
          </name>
          <name name-style="western">
            <surname>Rose</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Bjorner</surname>
            <given-names>JB</given-names>
          </name>
          <name name-style="western">
            <surname>Klapp</surname>
            <given-names>BF</given-names>
          </name>
        </person-group>
        <article-title>Evaluation of a computer-adaptive test for the assessment of depression (D-CAT) in clinical application</article-title>
        <source>Int J Methods Psychiatr Res</source>  
        <year>2009</year>  
        <volume>18</volume>  
        <issue>1</issue>  
        <fpage>23</fpage>  
        <lpage>36</lpage>  
        <pub-id pub-id-type="doi">10.1002/mpr.274</pub-id>
        <pub-id pub-id-type="medline">19194856</pub-id></nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Fliege</surname>
            <given-names>H</given-names>
          </name>
          <name name-style="western">
            <surname>Becker</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Walter</surname>
            <given-names>OB</given-names>
          </name>
          <name name-style="western">
            <surname>Bjorner</surname>
            <given-names>JB</given-names>
          </name>
          <name name-style="western">
            <surname>Klapp</surname>
            <given-names>BF</given-names>
          </name>
          <name name-style="western">
            <surname>Rose</surname>
            <given-names>M</given-names>
          </name>
        </person-group>
        <article-title>Development of a computer-adaptive test for depression (D-CAT)</article-title>
        <source>Qual Life Res</source>  
        <year>2005</year>  
        <month>12</month>  
        <volume>14</volume>  
        <issue>10</issue>  
        <fpage>2277</fpage>  
        <lpage>91</lpage>  
        <pub-id pub-id-type="doi">10.1007/s11136-005-6651-9</pub-id>
        <pub-id pub-id-type="medline">16328907</pub-id></nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Pilkonis</surname>
            <given-names>PA</given-names>
          </name>
          <name name-style="western">
            <surname>Choi</surname>
            <given-names>SW</given-names>
          </name>
          <name name-style="western">
            <surname>Reise</surname>
            <given-names>SP</given-names>
          </name>
          <name name-style="western">
            <surname>Stover</surname>
            <given-names>AM</given-names>
          </name>
          <name name-style="western">
            <surname>Riley</surname>
            <given-names>WT</given-names>
          </name>
          <name name-style="western">
            <surname>Cella</surname>
            <given-names>D</given-names>
          </name>
          <collab>PROMIS Cooperative Group</collab>
        </person-group>
        <article-title>Item banks for measuring emotional distress from the patient-reported outcomes measurement information system (PROMIS®): depression, anxiety, and anger</article-title>
        <source>Assessment</source>  
        <year>2011</year>  
        <month>09</month>  
        <volume>18</volume>  
        <issue>3</issue>  
        <fpage>263</fpage>  
        <lpage>83</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/21697139"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1177/1073191111411667</pub-id>
        <pub-id pub-id-type="medline">21697139</pub-id>
        <pub-id pub-id-type="pii">1073191111411667</pub-id>
        <pub-id pub-id-type="pmcid">PMC3153635</pub-id></nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Kosinski</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Matz</surname>
            <given-names>SC</given-names>
          </name>
          <name name-style="western">
            <surname>Gosling</surname>
            <given-names>SD</given-names>
          </name>
          <name name-style="western">
            <surname>Popov</surname>
            <given-names>V</given-names>
          </name>
          <name name-style="western">
            <surname>Stillwell</surname>
            <given-names>D</given-names>
          </name>
        </person-group>
        <article-title>Facebook as a research tool for the social sciences: opportunities, challenges, ethical considerations, and practical guidelines</article-title>
        <source>Am Psychol</source>  
        <year>2015</year>  
        <volume>70</volume>  
        <issue>6</issue>  
        <fpage>543</fpage>  
        <lpage>56</lpage>  
        <pub-id pub-id-type="doi">10.1037/a0039210</pub-id>
        <pub-id pub-id-type="medline">26348336</pub-id></nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Quiñones</surname>
            <given-names>AR</given-names>
          </name>
          <name name-style="western">
            <surname>Thielke</surname>
            <given-names>SM</given-names>
          </name>
          <name name-style="western">
            <surname>Clark</surname>
            <given-names>ME</given-names>
          </name>
          <name name-style="western">
            <surname>Phillips</surname>
            <given-names>KM</given-names>
          </name>
          <name name-style="western">
            <surname>Elnitsky</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Andresen</surname>
            <given-names>EM</given-names>
          </name>
        </person-group>
        <article-title>Validity of center for epidemiologic studies depression (CES-D) scale in a sample of Iraq and Afghanistan veteran</article-title>
        <source>SAGE Open Med</source>  
        <year>2016</year>  
        <volume>4</volume>  
        <fpage>2050312116643906</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/27127628"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1177/2050312116643906</pub-id>
        <pub-id pub-id-type="medline">27127628</pub-id>
        <pub-id pub-id-type="pii">10.1177_2050312116643906</pub-id>
        <pub-id pub-id-type="pmcid">PMC4834469</pub-id></nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Tapia</surname>
            <given-names>AJ</given-names>
          </name>
          <name name-style="western">
            <surname>Wagner</surname>
            <given-names>F</given-names>
          </name>
          <name name-style="western">
            <surname>Heredia</surname>
            <given-names>MER</given-names>
          </name>
          <name name-style="western">
            <surname>González-Forteza</surname>
            <given-names>C</given-names>
          </name>
        </person-group>
        <article-title>Study of depression in students from Mexico City and the state of Michoacán using the revised version of the CES-D</article-title>
        <source>Salud Mental</source>  
        <year>2015</year>  
        <volume>38</volume>  
        <issue>2</issue>  
        <fpage>103</fpage>  
        <lpage>7</lpage>  
        <pub-id pub-id-type="doi">10.17711/SM.0185-3325.2015.014</pub-id></nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Lacasse</surname>
            <given-names>JJ</given-names>
          </name>
          <name name-style="western">
            <surname>Forgeard</surname>
            <given-names>MJ</given-names>
          </name>
          <name name-style="western">
            <surname>Jayawickreme</surname>
            <given-names>N</given-names>
          </name>
          <name name-style="western">
            <surname>Jayawickreme</surname>
            <given-names>E</given-names>
          </name>
        </person-group>
        <article-title>The factor structure of the CES-D in a sample of Rwandan genocide survivors</article-title>
        <source>Soc Psychiatry Psychiatr Epidemiol</source>  
        <year>2014</year>  
        <volume>49</volume>  
        <issue>3</issue>  
        <fpage>459</fpage>  
        <lpage>65</lpage>  
        <pub-id pub-id-type="medline">24173407</pub-id></nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Hann</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Winter</surname>
            <given-names>K</given-names>
          </name>
          <name name-style="western">
            <surname>Jacobsen</surname>
            <given-names>P</given-names>
          </name>
        </person-group>
        <article-title>Measurement of depressive symptoms in cancer patients: evaluation of the center for epidemiological studies depression scale (CES-D)</article-title>
        <source>J Psychosom Res</source>  
        <year>1999</year>  
        <month>05</month>  
        <volume>46</volume>  
        <issue>5</issue>  
        <fpage>437</fpage>  
        <lpage>43</lpage>  
        <pub-id pub-id-type="medline">10404478</pub-id>
        <pub-id pub-id-type="pii">S0022399999000045</pub-id></nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Boey</surname>
            <given-names>KW</given-names>
          </name>
        </person-group>
        <article-title>Cross-validation of a short form of the CES-D in Chinese elderly</article-title>
        <source>Int J Geriatr Psychiatry</source>  
        <year>1999</year>  
        <volume>14</volume>  
        <issue>8</issue>  
        <fpage>608</fpage>  
        <lpage>17</lpage>  
        <pub-id pub-id-type="medline">10489651</pub-id></nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Vilagut</surname>
            <given-names>G</given-names>
          </name>
          <name name-style="western">
            <surname>Forero</surname>
            <given-names>CG</given-names>
          </name>
          <name name-style="western">
            <surname>Barbaglia</surname>
            <given-names>G</given-names>
          </name>
          <name name-style="western">
            <surname>Alonso</surname>
            <given-names>J</given-names>
          </name>
        </person-group>
        <article-title>Screening for depression in the general population with the center for epidemiologic studies depression (CES-D): a systematic review with meta-analysis</article-title>
        <source>PLoS One</source>  
        <year>2016</year>  
        <volume>11</volume>  
        <issue>5</issue>  
        <fpage>e0155431</fpage>  
        <pub-id pub-id-type="medline">27182821</pub-id></nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Choi</surname>
            <given-names>SW</given-names>
          </name>
          <name name-style="western">
            <surname>Schalet</surname>
            <given-names>B</given-names>
          </name>
          <name name-style="western">
            <surname>Cook</surname>
            <given-names>KF</given-names>
          </name>
          <name name-style="western">
            <surname>Cella</surname>
            <given-names>D</given-names>
          </name>
        </person-group>
        <article-title>Establishing a common metric for depressive symptoms: linking the BDI-II, CES-D, and PHQ-9 to PROMIS depression</article-title>
        <source>Psychol Assess</source>  
        <year>2014</year>  
        <volume>26</volume>  
        <issue>2</issue>  
        <fpage>513</fpage>  
        <lpage>27</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://psycnet.apa.org/journals/pas/26/2/513/"/>
        </comment>  
        <pub-id pub-id-type="medline">24548149</pub-id></nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Cronbach</surname>
            <given-names>LJ</given-names>
          </name>
        </person-group>
        <article-title>Coefficient alpha and the internal structure of tests</article-title>
        <source>Psychometrika</source>  
        <year>1951</year>  
        <volume>16</volume>  
        <issue>3</issue>  
        <fpage>297</fpage>  
        <lpage>334</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://link.springer.com/article/10.1007/BF02310555"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1007/BF02310555</pub-id></nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Bollen</surname>
            <given-names>KA</given-names>
          </name>
        </person-group>
        <article-title>A new incremental fit index for general structural equation models</article-title>
        <source>Sociol Methods Res</source>  
        <year>1989</year>  
        <volume>17</volume>  
        <issue>3</issue>  
        <fpage>303</fpage>  
        <lpage>15</lpage>  
        <pub-id pub-id-type="doi">10.1177/0049124189017003004</pub-id></nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Bentler</surname>
            <given-names>PM</given-names>
          </name>
        </person-group>
        <article-title>Comparative fit indexes in structural models</article-title>
        <source>Psychol Bull</source>  
        <year>1990</year>  
        <volume>107</volume>  
        <issue>2</issue>  
        <fpage>238</fpage>  
        <lpage>46</lpage>  
        <pub-id pub-id-type="medline">2320703</pub-id></nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Browne</surname>
            <given-names>MW</given-names>
          </name>
          <name name-style="western">
            <surname>Cudek</surname>
            <given-names>R</given-names>
          </name>
        </person-group>
        <article-title>Alternative ways of assessing model fit</article-title>
        <source>Sociol Methods Res</source>  
        <year>1993</year>  
        <volume>21</volume>  
        <issue>2</issue>  
        <fpage>230</fpage>  
        <lpage>58</lpage>  
        <pub-id pub-id-type="doi">10.1177/0049124192021002005</pub-id></nlm-citation>
      </ref>
      <ref id="ref34">
        <label>34</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Cameron</surname>
            <given-names>IM</given-names>
          </name>
          <name name-style="western">
            <surname>Scott</surname>
            <given-names>NW</given-names>
          </name>
          <name name-style="western">
            <surname>Adler</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Reid</surname>
            <given-names>IC</given-names>
          </name>
        </person-group>
        <article-title>A comparison of three methods of assessing differential item functioning (DIF) in the hospital anxiety depression scale: ordinal logistic regression, Rasch analysis and the Mantel chi-square procedure</article-title>
        <source>Qual Life Res</source>  
        <year>2014</year>  
        <volume>23</volume>  
        <issue>10</issue>  
        <fpage>2883</fpage>  
        <lpage>8</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://link.springer.com/10.1007/s11136-014-0719-3"/>
        </comment>  
        <pub-id pub-id-type="medline">24848597</pub-id></nlm-citation>
      </ref>
      <ref id="ref35">
        <label>35</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Hu</surname>
            <given-names>L</given-names>
          </name>
          <name name-style="western">
            <surname>Bentler</surname>
            <given-names>PM</given-names>
          </name>
        </person-group>
        <article-title>Cutoff criteria for fit indexes in covariance structure analysis: conventional criteria versus new alternatives</article-title>
        <source>Struct Equ Model a</source>  
        <year>1999</year>  
        <volume>6</volume>  
        <issue>1</issue>  
        <fpage>1</fpage>  
        <lpage>55</lpage>  
        <pub-id pub-id-type="doi">10.1080/10705519909540118</pub-id></nlm-citation>
      </ref>
      <ref id="ref36">
        <label>36</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Sijtsma</surname>
            <given-names>K</given-names>
          </name>
          <name name-style="western">
            <surname>Emons</surname>
            <given-names>WH</given-names>
          </name>
          <name name-style="western">
            <surname>Bouwmeester</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Nyklíček</surname>
            <given-names>I</given-names>
          </name>
          <name name-style="western">
            <surname>Roorda</surname>
            <given-names>LD</given-names>
          </name>
        </person-group>
        <article-title>Nonparametric IRT analysis of quality-of-life scales and its application to the world health organization quality-of-life scale (WHOQOL-Bref)</article-title>
        <source>Qual Life Res</source>  
        <year>2008</year>  
        <volume>17</volume>  
        <issue>2</issue>  
        <fpage>275</fpage>  
        <lpage>90</lpage>  
        <pub-id pub-id-type="medline">18246447</pub-id></nlm-citation>
      </ref>
      <ref id="ref37">
        <label>37</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Stochl</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Jones</surname>
            <given-names>PB</given-names>
          </name>
          <name name-style="western">
            <surname>Croudace</surname>
            <given-names>TJ</given-names>
          </name>
        </person-group>
        <article-title>Mokken scale analysis of mental health and well-being questionnaire item responses: a non-parametric IRT method in empirical research for applied health researchers</article-title>
        <source>BMC Med Res Methodol</source>  
        <year>2012</year>  
        <month>06</month>  
        <day>11</day>  
        <volume>12</volume>  
        <fpage>74</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="https://bmcmedresmethodol.biomedcentral.com/articles/10.1186/1471-2288-12-74"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1186/1471-2288-12-74</pub-id>
        <pub-id pub-id-type="medline">22686586</pub-id>
        <pub-id pub-id-type="pii">1471-2288-12-74</pub-id>
        <pub-id pub-id-type="pmcid">PMC3464599</pub-id></nlm-citation>
      </ref>
      <ref id="ref38">
        <label>38</label>
        <nlm-citation citation-type="web">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Samejima</surname>
            <given-names>F</given-names>
          </name>
        </person-group>
        <source>Psychometricsociety</source>  
        <year>1969</year>  
        <access-date>2017-08-11</access-date>
        <comment>Estimation of latent ability using a response pattern of graded scores 
        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="https://www.psychometricsociety.org/sites/default/files/pdf/MN17.pdf">https://www.psychometricsociety.org/sites/default/files/pdf/MN17.pdf</ext-link>
        <ext-link ext-link-type="webcite" xlink:href="6sd8xdEVx"/></comment> </nlm-citation>
      </ref>
      <ref id="ref39">
        <label>39</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Forero</surname>
            <given-names>CG</given-names>
          </name>
          <name name-style="western">
            <surname>Maydeu-Olivares</surname>
            <given-names>A</given-names>
          </name>
        </person-group>
        <article-title>Estimation of IRT graded response models: limited versus full information methods</article-title>
        <source>Psychol Methods</source>  
        <year>2009</year>  
        <month>09</month>  
        <volume>14</volume>  
        <issue>3</issue>  
        <fpage>275</fpage>  
        <lpage>99</lpage>  
        <pub-id pub-id-type="doi">10.1037/a0015825</pub-id>
        <pub-id pub-id-type="medline">19719362</pub-id>
        <pub-id pub-id-type="pii">2009-12975-006</pub-id></nlm-citation>
      </ref>
      <ref id="ref40">
        <label>40</label>
        <nlm-citation citation-type="book">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Baker</surname>
            <given-names>FB</given-names>
          </name>
        </person-group>
        <source>The basics of item response theory</source>  
        <year>2001</year>  
        <publisher-loc>College Park, MD</publisher-loc>
        <publisher-name>ERIC clearinghouse on assessment and evaluation</publisher-name></nlm-citation>
      </ref>
      <ref id="ref41">
        <label>41</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Reeve</surname>
            <given-names>BB</given-names>
          </name>
          <name name-style="western">
            <surname>Hays</surname>
            <given-names>RD</given-names>
          </name>
          <name name-style="western">
            <surname>Bjorner</surname>
            <given-names>JB</given-names>
          </name>
          <name name-style="western">
            <surname>Cook</surname>
            <given-names>KF</given-names>
          </name>
          <name name-style="western">
            <surname>Crane</surname>
            <given-names>PK</given-names>
          </name>
          <name name-style="western">
            <surname>Teresi</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Thissen</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Revicki</surname>
            <given-names>DA</given-names>
          </name>
          <name name-style="western">
            <surname>Weiss</surname>
            <given-names>DJ</given-names>
          </name>
          <name name-style="western">
            <surname>Hambleton</surname>
            <given-names>RK</given-names>
          </name>
          <name name-style="western">
            <surname>Liu</surname>
            <given-names>H</given-names>
          </name>
          <name name-style="western">
            <surname>Gershon</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Reise</surname>
            <given-names>SP</given-names>
          </name>
          <name name-style="western">
            <surname>Lai</surname>
            <given-names>JS</given-names>
          </name>
          <name name-style="western">
            <surname>Cella</surname>
            <given-names>D</given-names>
          </name>
          <collab>PROMIS Cooperative Group</collab>
        </person-group>
        <article-title>Psychometric evaluation and calibration of health-related quality of life item banks: plans for the patient-reported outcomes measurement information system (PROMIS)</article-title>
        <source>Med Care</source>  
        <year>2007</year>  
        <month>05</month>  
        <volume>45</volume>  
        <issue>5 Suppl 1</issue>  
        <fpage>S22</fpage>  
        <lpage>31</lpage>  
        <pub-id pub-id-type="doi">10.1097/01.mlr.0000250483.85507.04</pub-id>
        <pub-id pub-id-type="medline">17443115</pub-id>
        <pub-id pub-id-type="pii">00005650-200705001-00004</pub-id></nlm-citation>
      </ref>
      <ref id="ref42">
        <label>42</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Yen</surname>
            <given-names>WM</given-names>
          </name>
        </person-group>
        <article-title>Scaling performance assessments: strategies for managing local item dependence</article-title>
        <source>J Educ Meas</source>  
        <year>1993</year>  
        <volume>30</volume>  
        <issue>3</issue>  
        <fpage>187</fpage>  
        <lpage>213</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://onlinelibrary.wiley.com/doi/10.1111/j.1745-3984.1993.tb00423.x/abstract"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1111/j.1745-3984.1993.tb00423.x</pub-id></nlm-citation>
      </ref>
      <ref id="ref43">
        <label>43</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Choi</surname>
            <given-names>SW</given-names>
          </name>
          <name name-style="western">
            <surname>Gibbons</surname>
            <given-names>LE</given-names>
          </name>
          <name name-style="western">
            <surname>Crane</surname>
            <given-names>PK</given-names>
          </name>
        </person-group>
        <article-title>Lordif: an R package for detecting differential item functioning using iterative hybrid ordinal logistic regression/item response theory and Monte Carlo</article-title>
        <source>J Stat Softw</source>  
        <year>2011</year>  
        <volume>39</volume>  
        <issue>8</issue>  
        <fpage>1</fpage>  
        <lpage>30</lpage>  
        <pub-id pub-id-type="medline">21572908</pub-id></nlm-citation>
      </ref>
      <ref id="ref44">
        <label>44</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Crane</surname>
            <given-names>PK</given-names>
          </name>
          <name name-style="western">
            <surname>Gibbons</surname>
            <given-names>LE</given-names>
          </name>
          <name name-style="western">
            <surname>Jolley</surname>
            <given-names>L</given-names>
          </name>
          <name name-style="western">
            <surname>van</surname>
            <given-names>BG</given-names>
          </name>
        </person-group>
        <article-title>Differential item functioning analysis with ordinal logistic regression techniques. DIFdetect and difwithpar</article-title>
        <source>Med Care</source>  
        <year>2006</year>  
        <month>11</month>  
        <volume>44</volume>  
        <issue>11 Suppl 3</issue>  
        <fpage>S115</fpage>  
        <lpage>23</lpage>  
        <pub-id pub-id-type="doi">10.1097/01.mlr.0000245183.28384.ed</pub-id>
        <pub-id pub-id-type="medline">17060818</pub-id>
        <pub-id pub-id-type="pii">00005650-200611001-00017</pub-id></nlm-citation>
      </ref>
      <ref id="ref45">
        <label>45</label>
        <nlm-citation citation-type="book">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Zumbo</surname>
            <given-names>BD</given-names>
          </name>
        </person-group>
        <source>A handbook on the theory and methods of differential item functioning (DIF)</source>  
        <year>1999</year>  
        <publisher-loc>Ottawa, Ontario, Canada</publisher-loc>
        <publisher-name>Directorate of Human Resources Research and Evaluation, Department of National Defense</publisher-name></nlm-citation>
      </ref>
      <ref id="ref46">
        <label>46</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Crane</surname>
            <given-names>PK</given-names>
          </name>
          <name name-style="western">
            <surname>Gibbons</surname>
            <given-names>LE</given-names>
          </name>
          <name name-style="western">
            <surname>Ocepek-Welikson</surname>
            <given-names>K</given-names>
          </name>
          <name name-style="western">
            <surname>Cook</surname>
            <given-names>K</given-names>
          </name>
          <name name-style="western">
            <surname>Cella</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Narasimhalu</surname>
            <given-names>K</given-names>
          </name>
          <name name-style="western">
            <surname>Hays</surname>
            <given-names>RD</given-names>
          </name>
          <name name-style="western">
            <surname>Teresi</surname>
            <given-names>JA</given-names>
          </name>
        </person-group>
        <article-title>A comparison of three sets of criteria for determining the presence of differential item functioning using ordinal logistic regression</article-title>
        <source>Qual Life Res</source>  
        <year>2007</year>  
        <volume>16</volume>  
        <issue>1</issue>  
        <fpage>69</fpage>  
        <lpage>84</lpage>  
        <pub-id pub-id-type="medline">17554640</pub-id></nlm-citation>
      </ref>
      <ref id="ref47">
        <label>47</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Cook</surname>
            <given-names>KF</given-names>
          </name>
          <name name-style="western">
            <surname>Bombardier</surname>
            <given-names>CH</given-names>
          </name>
          <name name-style="western">
            <surname>Bamer</surname>
            <given-names>AM</given-names>
          </name>
          <name name-style="western">
            <surname>Choi</surname>
            <given-names>SW</given-names>
          </name>
          <name name-style="western">
            <surname>Kroenke</surname>
            <given-names>K</given-names>
          </name>
          <name name-style="western">
            <surname>Fann</surname>
            <given-names>JR</given-names>
          </name>
        </person-group>
        <article-title>Do somatic and cognitive symptoms of traumatic brain injury confound depression screening?</article-title>
        <source>Arch Phys Med Rehabil</source>  
        <year>2011</year>  
        <month>05</month>  
        <volume>92</volume>  
        <issue>5</issue>  
        <fpage>818</fpage>  
        <lpage>23</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/21530731"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1016/j.apmr.2010.12.008</pub-id>
        <pub-id pub-id-type="medline">21530731</pub-id>
        <pub-id pub-id-type="pii">S0003-9993(10)00978-0</pub-id>
        <pub-id pub-id-type="pmcid">PMC3121102</pub-id></nlm-citation>
      </ref>
      <ref id="ref48">
        <label>48</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Baylor</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Yorkston</surname>
            <given-names>K</given-names>
          </name>
          <name name-style="western">
            <surname>Eadie</surname>
            <given-names>T</given-names>
          </name>
          <name name-style="western">
            <surname>Kim</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Chung</surname>
            <given-names>H</given-names>
          </name>
          <name name-style="western">
            <surname>Amtmann</surname>
            <given-names>D</given-names>
          </name>
        </person-group>
        <article-title>The communicative participation item bank (CPIB): item bank calibration and development of a disorder-generic short form</article-title>
        <source>J Speech Lang Hear Res</source>  
        <year>2013</year>  
        <month>08</month>  
        <volume>56</volume>  
        <issue>4</issue>  
        <fpage>1190</fpage>  
        <lpage>208</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/23816661"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1044/1092-4388(2012/12-0140)</pub-id>
        <pub-id pub-id-type="medline">23816661</pub-id>
        <pub-id pub-id-type="pii">1092-4388_2012_12-0140</pub-id>
        <pub-id pub-id-type="pmcid">PMC4377222</pub-id></nlm-citation>
      </ref>
      <ref id="ref49">
        <label>49</label>
        <nlm-citation citation-type="book">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Lord</surname>
            <given-names>FM</given-names>
          </name>
        </person-group>
        <source>Applications of item response theory to practical testing problems</source>  
        <year>1980</year>  
        <publisher-loc>Mahwah, NJ</publisher-loc>
        <publisher-name>Erlbaum Associates</publisher-name></nlm-citation>
      </ref>
      <ref id="ref50">
        <label>50</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Veerkamp</surname>
            <given-names>WJ</given-names>
          </name>
          <name name-style="western">
            <surname>Berger</surname>
            <given-names>MP</given-names>
          </name>
        </person-group>
        <article-title>Some new item selection criteria for adaptive testing</article-title>
        <source>‎J Educ Behav Stat</source>  
        <year>1997</year>  
        <volume>22</volume>  
        <issue>2</issue>  
        <fpage>203</fpage>  
        <lpage>26</lpage>  
        <pub-id pub-id-type="doi">10.3102/10769986022002203</pub-id></nlm-citation>
      </ref>
      <ref id="ref51">
        <label>51</label>
        <nlm-citation citation-type="book">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Birnbaum</surname>
            <given-names>A</given-names>
          </name>
        </person-group>
        <article-title>Some latent trait models and their use in inferring an examinee’s ability</article-title>
        <source>Statistical theories of mental test scores</source>  
        <year>1968</year>  
        <publisher-loc>Reading, MA</publisher-loc>
        <publisher-name>Addison-Wesley Pub Co</publisher-name>
        <fpage>397</fpage>  
        <lpage>479</lpage> </nlm-citation>
      </ref>
      <ref id="ref52">
        <label>52</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Weiss</surname>
            <given-names>DJ</given-names>
          </name>
        </person-group>
        <article-title>Better data from better measurements using computerized adaptive testing</article-title>
        <source>JMM</source>  
        <year>2011</year>  
        <volume>2</volume>  
        <issue>1</issue>  
        <fpage>1</fpage>  
        <lpage>27</lpage>  
        <pub-id pub-id-type="doi">10.2458/v2i1.12351</pub-id></nlm-citation>
      </ref>
      <ref id="ref53">
        <label>53</label>
        <nlm-citation citation-type="book">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Walter</surname>
            <given-names>OB</given-names>
          </name>
        </person-group>
        <article-title>Adaptive tests for measuring anxiety and depression</article-title>
        <source>Elements of adaptive testing</source>  
        <year>2009</year>  
        <publisher-loc>New York</publisher-loc>
        <publisher-name>Springer</publisher-name>
        <fpage>123</fpage>  
        <lpage>36</lpage> </nlm-citation>
      </ref>
      <ref id="ref54">
        <label>54</label>
        <nlm-citation citation-type="web">
        <person-group person-group-type="author">
          <collab>R Core Team</collab>
        </person-group>
        <source>R-project</source>  
        <year>2016</year>  
        <access-date>2017-08-11</access-date>
        <comment>R: a language and environment for statistical computing 
        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.r-project.org/">http://www.r-project.org/</ext-link>
        <ext-link ext-link-type="webcite" xlink:href="6sdFLbOk1"/></comment> </nlm-citation>
      </ref>
      <ref id="ref55">
        <label>55</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Rosseel</surname>
            <given-names>Y</given-names>
          </name>
        </person-group>
        <article-title>Lavaan: an R package for structural equation modeling</article-title>
        <source>J Stat Softw</source>  
        <year>2012</year>  
        <volume>48</volume>  
        <issue>2</issue>  
        <fpage>1</fpage>  
        <lpage>36</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="https://www.jstatsoft.org/article/view/v048i02"/>
        </comment>  
        <pub-id pub-id-type="doi">10.18637/jss.v048.i02</pub-id></nlm-citation>
      </ref>
      <ref id="ref56">
        <label>56</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Van der Ark</surname>
            <given-names>LA</given-names>
          </name>
        </person-group>
        <article-title>New developments in Mokken scale analysis in R</article-title>
        <source>J Stat Softw</source>  
        <year>2012</year>  
        <volume>48</volume>  
        <issue>5</issue>  
        <fpage>1</fpage>  
        <lpage>27</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.jstatsoft.org/v48/i05/paper"/>
        </comment>  
        <pub-id pub-id-type="doi">10.18637/jss.v048.i05</pub-id></nlm-citation>
      </ref>
      <ref id="ref57">
        <label>57</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Chalmers</surname>
            <given-names>RP</given-names>
          </name>
        </person-group>
        <article-title>mirt: A multidimensional item response theory package for the R environment</article-title>
        <source>J Stat Softw</source>  
        <year>2012</year>  
        <volume>48</volume>  
        <issue>6</issue>  
        <fpage>1</fpage>  
        <lpage>29</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="https://scholar.google.co.uk/scholar?hl=en&#38;q=Chalmers+MIRT&#38;btnG=&#38;as_sdt=1%2C5&#38;as_sdtp=#0"/>
        </comment>  
        <pub-id pub-id-type="doi">10.18637/jss.v048.i06</pub-id></nlm-citation>
      </ref>
      <ref id="ref58">
        <label>58</label>
        <nlm-citation citation-type="book">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Mokken</surname>
            <given-names>RJ</given-names>
          </name>
        </person-group>
        <source>A theory and procedure of scale analysis with applications in political research</source>  
        <year>1971</year>  
        <publisher-loc>Berlin</publisher-loc>
        <publisher-name>Mouton</publisher-name></nlm-citation>
      </ref>
      <ref id="ref59">
        <label>59</label>
        <nlm-citation citation-type="book">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Sijtsma</surname>
            <given-names>K</given-names>
          </name>
          <name name-style="western">
            <surname>Molenaar</surname>
            <given-names>IW</given-names>
          </name>
        </person-group>
        <source>Introduction to Nonparametric Item Response Theory</source>  
        <year>2002</year>  
        <publisher-loc>London</publisher-loc>
        <publisher-name>Sage Publications</publisher-name></nlm-citation>
      </ref>
      <ref id="ref60">
        <label>60</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Maydeu-Olivares</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Joe</surname>
            <given-names>H</given-names>
          </name>
        </person-group>
        <article-title>Limited information goodness-of-fit testing in multidimensional contingency tables</article-title>
        <source>Psychometrika</source>  
        <year>2006</year>  
        <volume>71</volume>  
        <issue>4</issue>  
        <fpage>713</fpage>  
        <lpage>732</lpage> </nlm-citation>
      </ref>
      <ref id="ref61">
        <label>61</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Forkmann</surname>
            <given-names>T</given-names>
          </name>
          <name name-style="western">
            <surname>Boecker</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Norra</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Eberle</surname>
            <given-names>N</given-names>
          </name>
          <name name-style="western">
            <surname>Kircher</surname>
            <given-names>T</given-names>
          </name>
          <name name-style="western">
            <surname>Schauerte</surname>
            <given-names>P</given-names>
          </name>
          <name name-style="western">
            <surname>Mischke</surname>
            <given-names>K</given-names>
          </name>
          <name name-style="western">
            <surname>Westhofen</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Gauggel</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Wirtz</surname>
            <given-names>M</given-names>
          </name>
        </person-group>
        <article-title>Development of an item bank for the assessment of depression in persons with mental illnesses and physical diseases using Rasch analysis</article-title>
        <source>Rehabil Psychol</source>  
        <year>2009</year>  
        <month>05</month>  
        <volume>54</volume>  
        <issue>2</issue>  
        <fpage>186</fpage>  
        <lpage>97</lpage>  
        <pub-id pub-id-type="doi">10.1037/a0015612</pub-id>
        <pub-id pub-id-type="medline">19469609</pub-id>
        <pub-id pub-id-type="pii">2009-07289-009</pub-id></nlm-citation>
      </ref>
      <ref id="ref62">
        <label>62</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Schalet</surname>
            <given-names>BD</given-names>
          </name>
          <name name-style="western">
            <surname>Pilkonis</surname>
            <given-names>PA</given-names>
          </name>
          <name name-style="western">
            <surname>Yu</surname>
            <given-names>L</given-names>
          </name>
          <name name-style="western">
            <surname>Dodds</surname>
            <given-names>N</given-names>
          </name>
          <name name-style="western">
            <surname>Johnston</surname>
            <given-names>KL</given-names>
          </name>
          <name name-style="western">
            <surname>Yount</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Riley</surname>
            <given-names>W</given-names>
          </name>
          <name name-style="western">
            <surname>Cella</surname>
            <given-names>D</given-names>
          </name>
        </person-group>
        <article-title>Clinical validity of PROMIS depression, anxiety, and anger across diverse clinical samples</article-title>
        <source>J Clin Epidemiol</source>  
        <year>2016</year>  
        <volume>73</volume>  
        <fpage>119</fpage>  
        <lpage>27</lpage>  
        <pub-id pub-id-type="medline">26931289</pub-id></nlm-citation>
      </ref>
      <ref id="ref63">
        <label>63</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Williams</surname>
            <given-names>CD</given-names>
          </name>
          <name name-style="western">
            <surname>Taylor</surname>
            <given-names>TR</given-names>
          </name>
          <name name-style="western">
            <surname>Makambi</surname>
            <given-names>K</given-names>
          </name>
          <name name-style="western">
            <surname>Harrell</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Palmer</surname>
            <given-names>JR</given-names>
          </name>
          <name name-style="western">
            <surname>Rosenberg</surname>
            <given-names>L</given-names>
          </name>
          <name name-style="western">
            <surname>Adams-Campbell</surname>
            <given-names>LL</given-names>
          </name>
        </person-group>
        <article-title>CES-D four-factor structure is confirmed, but not invariant, in a large cohort of African American women</article-title>
        <source>Psychiatry Res</source>  
        <year>2007</year>  
        <month>03</month>  
        <day>30</day>  
        <volume>150</volume>  
        <issue>2</issue>  
        <fpage>173</fpage>  
        <lpage>80</lpage>  
        <pub-id pub-id-type="doi">10.1016/j.psychres.2006.02.007</pub-id>
        <pub-id pub-id-type="medline">17291596</pub-id>
        <pub-id pub-id-type="pii">S0165-1781(06)00041-2</pub-id></nlm-citation>
      </ref>
      <ref id="ref64">
        <label>64</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Boisvert</surname>
            <given-names>JA</given-names>
          </name>
          <name name-style="western">
            <surname>McCreary</surname>
            <given-names>DR</given-names>
          </name>
          <name name-style="western">
            <surname>Wright</surname>
            <given-names>KD</given-names>
          </name>
          <name name-style="western">
            <surname>Asmundson</surname>
            <given-names>GJ</given-names>
          </name>
        </person-group>
        <article-title>Factorial validity of the center for epidemiologic studies-depression (CES-D) scale in military peacekeepers</article-title>
        <source>Depress Anxiety</source>  
        <year>2003</year>  
        <volume>17</volume>  
        <issue>1</issue>  
        <fpage>19</fpage>  
        <lpage>25</lpage>  
        <pub-id pub-id-type="doi">10.1002/da.10080</pub-id>
        <pub-id pub-id-type="medline">12577274</pub-id></nlm-citation>
      </ref>
      <ref id="ref65">
        <label>65</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Scalise</surname>
            <given-names>K</given-names>
          </name>
          <name name-style="western">
            <surname>Allen</surname>
            <given-names>DD</given-names>
          </name>
        </person-group>
        <article-title>Use of open-source software for adaptive measurement: Concerto as an R-based computer adaptive development and delivery platform</article-title>
        <source>Br J Math Stat Psychol</source>  
        <year>2015</year>  
        <volume>68</volume>  
        <issue>3</issue>  
        <fpage>478</fpage>  
        <lpage>96</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://doi.wiley.com/10.1111/bmsp.12057"/>
        </comment>  
        <pub-id pub-id-type="medline">26061260</pub-id></nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
