<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMIR</journal-id>
      <journal-id journal-id-type="nlm-ta">J Med Internet Res</journal-id>
      <journal-title>Journal of Medical Internet Research</journal-title>
      <issn pub-type="epub">1438-8871</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v26i1e56874</article-id>
      <article-id pub-id-type="pmid">39626241</article-id>
      <article-id pub-id-type="doi">10.2196/56874</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Predicting and Monitoring Symptoms in Patients Diagnosed With Depression Using Smartphone Data: Observational Study</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>de Azevedo Cardoso</surname>
            <given-names>Taiane</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Zhang</surname>
            <given-names>Ruoyu</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>John</surname>
            <given-names>Anjum Susan</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>AL-Asadi</surname>
            <given-names>Ali</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Kallio</surname>
            <given-names>Johanna</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author" corresp="yes">
          <name name-style="western">
            <surname>Ikäheimonen</surname>
            <given-names>Arsi</given-names>
          </name>
          <degrees>MSc</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <address>
            <institution>Department of Computer Science</institution>
            <institution>Aalto University</institution>
            <addr-line>Konemiehentie 2</addr-line>
            <addr-line>Espoo, 02150</addr-line>
            <country>Finland</country>
            <phone>358 449750110</phone>
            <email>arsi.ikaheimonen@aalto.fi</email>
          </address>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-1617-6911</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author">
          <name name-style="western">
            <surname>Luong</surname>
            <given-names>Nguyen</given-names>
          </name>
          <degrees>MSc</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-0122-0286</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author">
          <name name-style="western">
            <surname>Baryshnikov</surname>
            <given-names>Ilya</given-names>
          </name>
          <degrees>MD, PhD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-6229-6116</ext-link>
        </contrib>
        <contrib id="contrib4" contrib-type="author">
          <name name-style="western">
            <surname>Darst</surname>
            <given-names>Richard</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff4" ref-type="aff">4</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-0402-7994</ext-link>
        </contrib>
        <contrib id="contrib5" contrib-type="author">
          <name name-style="western">
            <surname>Heikkilä</surname>
            <given-names>Roope</given-names>
          </name>
          <degrees>MA</degrees>
          <xref rid="aff5" ref-type="aff">5</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-2125-577X</ext-link>
        </contrib>
        <contrib id="contrib6" contrib-type="author">
          <name name-style="western">
            <surname>Holmen</surname>
            <given-names>Joel</given-names>
          </name>
          <degrees>MD, PhD</degrees>
          <xref rid="aff6" ref-type="aff">6</xref>
          <xref rid="aff7" ref-type="aff">7</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-6598-1810</ext-link>
        </contrib>
        <contrib id="contrib7" contrib-type="author">
          <name name-style="western">
            <surname>Martikkala</surname>
            <given-names>Annasofia</given-names>
          </name>
          <degrees>MD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0009-0003-9523-2700</ext-link>
        </contrib>
        <contrib id="contrib8" contrib-type="author">
          <name name-style="western">
            <surname>Riihimäki</surname>
            <given-names>Kirsi</given-names>
          </name>
          <degrees>MD, PhD</degrees>
          <xref rid="aff3" ref-type="aff">3</xref>
          <xref rid="aff8" ref-type="aff">8</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-3913-5968</ext-link>
        </contrib>
        <contrib id="contrib9" contrib-type="author">
          <name name-style="western">
            <surname>Saleva</surname>
            <given-names>Outi</given-names>
          </name>
          <degrees>MD</degrees>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0009-0005-3454-9282</ext-link>
        </contrib>
        <contrib id="contrib10" contrib-type="author">
          <name name-style="western">
            <surname>Isometsä</surname>
            <given-names>Erkki</given-names>
          </name>
          <degrees>MD, PhD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-5956-2399</ext-link>
        </contrib>
        <contrib id="contrib11" contrib-type="author">
          <name name-style="western">
            <surname>Aledavood</surname>
            <given-names>Talayeh</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-0110-5694</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>Department of Computer Science</institution>
        <institution>Aalto University</institution>
        <addr-line>Espoo</addr-line>
        <country>Finland</country>
      </aff>
      <aff id="aff2">
        <label>2</label>
        <institution>Department of Psychiatry</institution>
        <institution>University of Helsinki</institution>
        <addr-line>Helsinki</addr-line>
        <country>Finland</country>
      </aff>
      <aff id="aff3">
        <label>3</label>
        <institution>Helsinki and Uusimaa Hospital District</institution>
        <addr-line>Helsinki</addr-line>
        <country>Finland</country>
      </aff>
      <aff id="aff4">
        <label>4</label>
        <institution>School of Science</institution>
        <institution>Aalto University</institution>
        <addr-line>Espoo</addr-line>
        <country>Finland</country>
      </aff>
      <aff id="aff5">
        <label>5</label>
        <institution>City of Helsinki Mental Health Services</institution>
        <addr-line>Helsinki</addr-line>
        <country>Finland</country>
      </aff>
      <aff id="aff6">
        <label>6</label>
        <institution>University of Turku</institution>
        <addr-line>Turku</addr-line>
        <country>Finland</country>
      </aff>
      <aff id="aff7">
        <label>7</label>
        <institution>Turku University Central Hospital</institution>
        <addr-line>Turku</addr-line>
        <country>Finland</country>
      </aff>
      <aff id="aff8">
        <label>8</label>
        <institution>Finnish Institute for Health and Welfare</institution>
        <addr-line>Helsinki</addr-line>
        <country>Finland</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Arsi Ikäheimonen <email>arsi.ikaheimonen@aalto.fi</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <year>2024</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>3</day>
        <month>12</month>
        <year>2024</year>
      </pub-date>
      <volume>26</volume>
      <elocation-id>e56874</elocation-id>
      <history>
        <date date-type="received">
          <day>29</day>
          <month>1</month>
          <year>2024</year>
        </date>
        <date date-type="rev-request">
          <day>21</day>
          <month>6</month>
          <year>2024</year>
        </date>
        <date date-type="rev-recd">
          <day>7</day>
          <month>7</month>
          <year>2024</year>
        </date>
        <date date-type="accepted">
          <day>24</day>
          <month>9</month>
          <year>2024</year>
        </date>
      </history>
      <copyright-statement>©Arsi Ikäheimonen, Nguyen Luong, Ilya Baryshnikov, Richard Darst, Roope Heikkilä, Joel Holmen, Annasofia Martikkala, Kirsi Riihimäki, Outi Saleva, Erkki Isometsä, Talayeh Aledavood. Originally published in the Journal of Medical Internet Research (https://www.jmir.org), 03.12.2024.</copyright-statement>
      <copyright-year>2024</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in the Journal of Medical Internet Research (ISSN 1438-8871), is properly cited. The complete bibliographic information, a link to the original publication on https://www.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://www.jmir.org/2024/1/e56874" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>Clinical diagnostic assessments and the outcome monitoring of patients with depression rely predominantly on interviews by professionals and the use of self-report questionnaires. The ubiquity of smartphones and other personal consumer devices has prompted research into the potential of data collected via these devices to serve as digital behavioral markers for indicating the presence and monitoring of the outcome of depression.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>This paper explores the potential of using behavioral data collected with smartphones to detect and monitor depression symptoms in patients diagnosed with depression. Specifically, it investigates whether this data can accurately classify the presence of depression, as well as monitor the changes in depressive states over time.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>In a prospective cohort study, we collected smartphone behavioral data for up to 1 year. The study consists of observations from 164 participants, including healthy controls (n=31) and patients diagnosed with various depressive disorders: major depressive disorder (MDD; n=85), MDD with comorbid borderline personality disorder (n=27), and major depressive episodes with bipolar disorder (n=21). Data were labeled based on depression severity using 9-item Patient Health Questionnaire (PHQ-9) scores. We performed statistical analysis and used supervised machine learning on the data to classify the severity of depression and observe changes in the depression state over time.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>Our correlation analysis revealed 32 behavioral markers associated with the changes in depressive state. Our analysis classified patients who are depressed with an accuracy of 82% (95% CI 80%-84%) and change in the presence of depression with an accuracy of 75% (95% CI 72%-76%). Notably, the most important smartphone features for classifying depression states were screen-off events, battery charge levels, communication patterns, app usage, and location data. Similarly, for predicting changes in depression state, the most important features were related to location, battery level, screen, and accelerometer data patterns.</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>The use of smartphone digital behavioral markers to supplement clinical evaluations may aid in detecting the presence and changes in severity of symptoms of depression, particularly if combined with intermittent use of self-report of symptoms.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>data analysis</kwd>
        <kwd>digital phenotyping</kwd>
        <kwd>digital behavioral data</kwd>
        <kwd>depression symptoms</kwd>
        <kwd>depression monitoring</kwd>
        <kwd>mHealth</kwd>
        <kwd>mobile health</kwd>
        <kwd>smartphone</kwd>
        <kwd>mobile phone</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <p>In recent years, digital tools and algorithms have become indispensable in health care, including mental health. Data-driven technologies have the potential to renew health care, providing new avenues for personalized care, remote monitoring, and improved service access. At the same time, mental health disorders, including depression, have remained a significant concern. Depressive disorders are estimated to be the second-leading cause of life-years lost to disability worldwide [<xref ref-type="bibr" rid="ref1">1</xref>]. Alongside markedly impacting individuals’ quality of life, depressive disorders impose a substantial economic burden, including costs to health care and societies overall due to disability, reduced employment, and impaired work productivity [<xref ref-type="bibr" rid="ref2">2</xref>].</p>
      <p>Psychiatric evaluations are based on clinical interviews, relying on patients’ self-reflections and recollections, which are susceptible to memory biases and subjective inaccuracies [<xref ref-type="bibr" rid="ref3">3</xref>]. Further, the absence of definitive physiological biomarkers for mental disorders complicates accurate diagnoses and treatment [<xref ref-type="bibr" rid="ref4">4</xref>]. Given these challenges, a growing interest has been in data-driven clinical monitoring and decision-making, supplementing subjective evaluations with objective, longitudinal, physiological, and behavioral data collected via digital devices [<xref ref-type="bibr" rid="ref5">5</xref>]. This approach, known as digital phenotyping, involves creating a digital representation of a patient’s clinical phenotype using behavioral, social, and physiological markers. The premise of the data-driven approach lies in the inherent value of continuous monitoring, uncovering valuable insights unattainable through intermittent assessments [<xref ref-type="bibr" rid="ref4">4</xref>].</p>
      <p>Recent data-driven studies using devices like smartphones and activity trackers have effectively used digital behavioral data to monitor and detect participants’ depressive moods [<xref ref-type="bibr" rid="ref6">6</xref>-<xref ref-type="bibr" rid="ref8">8</xref>]. These studies gather sensor data to identify behavioral patterns associated with depressive disorders, such as changes in physical activity, phone usage, and sleep routines. The primary goals include differentiating between patients with depression and healthy controls, classifying mood state transitions, and predicting future mood states. Alongside passively collected data, these studies often use established self-report questionnaires as the reference standard for subjects' severity of depressive symptoms.</p>
      <p>However, some of the studies have used limited data collection, sample sizes of fewer than 50 participants [<xref ref-type="bibr" rid="ref9">9</xref>-<xref ref-type="bibr" rid="ref11">11</xref>], a sample of college students [<xref ref-type="bibr" rid="ref12">12</xref>-<xref ref-type="bibr" rid="ref15">15</xref>], and data collected over only a few weeks [<xref ref-type="bibr" rid="ref9">9</xref>,<xref ref-type="bibr" rid="ref12">12</xref>,<xref ref-type="bibr" rid="ref16">16</xref>]. Due to these limitations, it may be challenging to generalize results to either a broader population or a free-living setting. Regarding methodologies, earlier research has used smartphone sensors and data categorized as smartphone usage [<xref ref-type="bibr" rid="ref9">9</xref>,<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref14">14</xref>,<xref ref-type="bibr" rid="ref15">15</xref>], GPS location data-based features [<xref ref-type="bibr" rid="ref9">9</xref>-<xref ref-type="bibr" rid="ref15">15</xref>,<xref ref-type="bibr" rid="ref17">17</xref>], physical activity data or step counts [<xref ref-type="bibr" rid="ref11">11</xref>-<xref ref-type="bibr" rid="ref17">17</xref>], communication patterns [<xref ref-type="bibr" rid="ref12">12</xref>,<xref ref-type="bibr" rid="ref14">14</xref>,<xref ref-type="bibr" rid="ref17">17</xref>], Bluetooth data [<xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref14">14</xref>], sleep data [<xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref15">15</xref>], metrics for behavior regularity [<xref ref-type="bibr" rid="ref15">15</xref>], and physiological measurements [<xref ref-type="bibr" rid="ref17">17</xref>]. 
Furthermore, studies have used several metrics for depression as the ground truth, including the 9-item Patient Health Questionnaire (PHQ-9) [<xref ref-type="bibr" rid="ref9">9</xref>-<xref ref-type="bibr" rid="ref11">11</xref>,<xref ref-type="bibr" rid="ref17">17</xref>,<xref ref-type="bibr" rid="ref18">18</xref>], a compact version of the 4-item Patient Health Questionnaire (PHQ-4) [<xref ref-type="bibr" rid="ref15">15</xref>,<xref ref-type="bibr" rid="ref19">19</xref>], the Montgomery and Åsberg Depression Rating Scale [<xref ref-type="bibr" rid="ref16">16</xref>,<xref ref-type="bibr" rid="ref20">20</xref>], and the Beck Depression Inventory-II [<xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref14">14</xref>,<xref ref-type="bibr" rid="ref21">21</xref>]. The analysis methods used in these studies vary, encompassing correlation analysis [<xref ref-type="bibr" rid="ref9">9</xref>,<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref12">12</xref>], machine learning [<xref ref-type="bibr" rid="ref11">11</xref>,<xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref14">14</xref>,<xref ref-type="bibr" rid="ref16">16</xref>,<xref ref-type="bibr" rid="ref17">17</xref>], and deep learning [<xref ref-type="bibr" rid="ref15">15</xref>,<xref ref-type="bibr" rid="ref16">16</xref>].</p>
      <p>This paper builds on previous research, exploring the potential of using behavioral data collected with smartphones to detect and monitor depression symptoms in outpatients diagnosed with depression. Our study aims to identify digital behavioral markers indicative of depressive states and assess the accuracy of this data in detecting depression. Key markers extracted from smartphone sensors, such as the accelerometer, app usage, battery status, communication log, screen activations, and GPS location, comprise metrics like screen-on activation count, total distance traveled, average battery level, phone call count, app usage duration, and maximum acceleration. We analyzed a comprehensive dataset, gathered through smartphones, from patients with depression who have a diagnosis of either major depressive disorder (MDD), major depressive episodes with bipolar disorder (MDE&#124;BD), or MDD with comorbid borderline personality disorder (MDD&#124;BPD) and healthy controls. The focus was on distinguishing patients self-reporting moderate or more severe depression symptoms and tracking changes in reported depression levels.</p>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Dataset Description</title>
        <p>We used the data from the Mobile Monitoring of Mood (MoMo-Mood) study, a 1-year multimodal digital phenotyping study of individuals undergoing treatment for mental disorders and healthy controls [<xref ref-type="bibr" rid="ref22">22</xref>,<xref ref-type="bibr" rid="ref23">23</xref>]. The MoMo-Mood study recruited 164 participants from 4 different groups: healthy controls (n=31) and patients with MDD (n=85), MDD&#124;BPD (n=27), and MDE&#124;BD (n=21). Voluntary patients were recruited in Finland from the mood disorder outpatient treatment facilities of the Helsinki University Hospital Mood Disorder Division, Turku University Central Hospital Department of Psychiatry, and City of Espoo Mental Health Services. The patients were diagnosed with structured interviews, namely the Mini-International Neuropsychiatric Interview [<xref ref-type="bibr" rid="ref24">24</xref>] and the Structured Clinical Interview for DSM-IV Axis II Personality Disorders [<xref ref-type="bibr" rid="ref25">25</xref>], as having ongoing major depressive episodes. Healthy controls were collected by contacting, via email, lists of students from the University of Helsinki and Aalto University, users of student health services from these institutions, and recruiting voluntary health care personnel from Helsinki University Hospital.</p>
        <p>Each group had more female individuals than male individuals: (1) control group, 24 female individuals and 7 male individuals; (2) MDD group, 46 female individuals and 31 male individuals; (3) MDE&#124;BD group, 18 female individuals and 3 male individuals; and (4) MDD&#124;BPD group, 23 female individuals and 1 male individual. On average, control group participants were older than patient group participants, with average ages as follows: (1) control group, 41.8 (SD 13.9) years, (2) MDD group, 39.0 (SD 14.2) years, (3) MDE&#124;BD group, 37.1 (SD 10.3) years, and (4) MDD&#124;BPD group, 28.3 (SD 6.0) years. A more detailed description is provided elsewhere [<xref ref-type="bibr" rid="ref22">22</xref>,<xref ref-type="bibr" rid="ref23">23</xref>].</p>
        <p>Study participants were recruited on a rolling basis, allowing them to join and leave the research at various intervals. They were requested to stay involved in the study for 1 year. Data collection was carried out in 2 phases. In the initial 2 weeks, called the <italic>active phase</italic>, participants collected data continuously via personal devices (smartphones running Android operating system), bed sensors, and actigraphs, and they answered daily mood-related questions. The active phase was followed by the <italic>passive phase,</italic> lasting up to 1 year. During the passive phase, data collection via smartphones continued, and participants’ depression was monitored by biweekly PHQ-9 surveys prompted via the smartphone. The PHQ-9 comprises 9 questions, each scored from 0 to 3, based on the frequency of depressive symptoms over the past 2 weeks. Thus, the total score ranges from 0 to 27, with high values representing more severe depression. The passive data originate from various smartphone sensors, including accelerometers, app usage, communication, battery level and screen status logs, and GPS location data. The data were collected through the Niima data collection platform [<xref ref-type="bibr" rid="ref26">26</xref>]. This work exclusively focuses on the passive phase of the study, which uses smartphone data and PHQ-9 survey responses. This phase was selected due to its unobtrusive data collection methods and, thus, the minimal requirement for behavioral adjustment from the participants.</p>
      </sec>
      <sec>
        <title>Data Preprocessing</title>
        <p>We used Python and the <italic>Niimpy</italic> behavioral data analysis toolbox [<xref ref-type="bibr" rid="ref27">27</xref>] for data preprocessing. We extracted 93 behavioral features from the raw data. <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref> provides a detailed description of data sources and extracted features. Furthermore, we segmented the data from the accelerometer, app usage, battery status, communication log, and smartphone screen activations into 6-hour bins (12:00 AM to 6:00 AM, 6:00 AM to 12:00 PM, 12:00 PM to 6:00 PM, and 6:00 PM to 12:00 AM). We extracted 308 additional features, resulting in a total of 401 features. The data from different sensors were resampled and averaged over 14-day periods. The data were merged with the PHQ-9 responses to align data from the preceding biweekly period with the questionnaire responses. Of the 164 participants in the active phase, 99 proceeded to the passive phase. For the analysis, we selected participants who had provided passive data for at least 14 days and had answered a PHQ-9 survey at the end of this period, yielding 83 participants. Each participant provided data for up to 1 year, yielding 26 biweekly data points. Due to missing observations and participant withdrawals from the study, 818 observations (37.9% of the possible 2158 observations) were available for further analysis. <xref rid="figure1" ref-type="fig">Figure 1</xref> details the data collection and preparation for the analysis, while <xref rid="figure2" ref-type="fig">Figure 2</xref> provides additional information on data aggregation and alignment.</p>
        <fig id="figure1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>The MoMo-Mood study data collection and preparation schema. MoMo-Mood: Mobile Monitoring of Mood; PHQ-9: 9-item Patient Health Questionnaire.</p>
          </caption>
          <graphic xlink:href="jmir_v26i1e56874_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <fig id="figure2" position="float">
          <label>Figure 2</label>
          <caption>
            <p>Schematics of data aggregation and alignment. PHQ-9: 9-item Patient Health Questionnaire.</p>
          </caption>
          <graphic xlink:href="jmir_v26i1e56874_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Statistical Analysis</title>
        <sec>
          <title>Distributional Testing</title>
          <p>To examine whether passively collected smartphone sensor data show differences between patient groups and control participants, we used distributional testing using the nonparametric 2-sample Kolmogorov-Smirnov test [<xref ref-type="bibr" rid="ref28">28</xref>]. The test was chosen due to its capability to detect variations across the entire distribution, including the tails. For the test, we averaged the biweekly sampled data by participant, normalized the data, and omitted the missing values. For robustness against the risk of type I errors (false-positive) due to multiple comparisons, we implemented false discovery rate (FDR) correction using the Benjamini-Hochberg procedure [<xref ref-type="bibr" rid="ref29">29</xref>] at a significance level of α=.05.</p>
        </sec>
        <sec>
          <title>Correlation Analysis</title>
          <p>We conducted a correlation analysis to assess the association between passive data features and PHQ-9 scores. We pooled passive data from all participants, omitted missing values, and applied the Spearman rank correlation coefficient to assess the strength of the relationship. Furthermore, we used FDR correction using the Benjamini-Hochberg procedure at a significance level of α=.05 to account for the multiple testing involved, controlling the expected proportion of false discoveries.</p>
        </sec>
      </sec>
      <sec>
        <title>Predictive Modeling</title>
        <p>To achieve the research goal, we deployed supervised machine learning models for predicting both the presence of depression and state transitions of depressive states. We used a cutoff PHQ-9 depression score of 10 for binary classification analyses. Scores of 10 or higher were considered <italic>depressed,</italic> and scores below 10 as <italic>nondepressed.</italic> We chose a cutoff value of 10 because it signifies clinical depression, typically warranting a treatment plan that may include counseling, follow-up sessions, and possibly pharmacotherapy for the individual. For defining the depression state transition, we used the same threshold of 10 and the previous depression state. Each transition is paired with a specific label, used as the target variable for the depression state transition modeling. The transition definitions are presented in <xref ref-type="table" rid="table1">Table 1</xref>.</p>
        <table-wrap position="float" id="table1">
          <label>Table 1</label>
          <caption>
            <p>Overview of depression state transition definitions and corresponding labels.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="500"/>
            <col width="500"/>
            <thead>
              <tr valign="top">
                <td>Transition description</td>
                <td>Label</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Depressed→Depressed</td>
                <td>Remains depressed</td>
              </tr>
              <tr valign="top">
                <td>Depressed→Nondepressed</td>
                <td>Improves</td>
              </tr>
              <tr valign="top">
                <td>Nondepressed→Nondepressed</td>
                <td>Remains nondepressed</td>
              </tr>
              <tr valign="top">
                <td>Nondepressed→Depressed</td>
                <td>Declines</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
        <p>We built a machine learning pipeline using Python (version 3.10.8) and the following libraries: <italic>scikit-learn</italic> (version 1.2.0) [<xref ref-type="bibr" rid="ref30">30</xref>], <italic>extreme gradient boosting</italic> (<italic>XGBoost</italic>; version 1.7.3) [<xref ref-type="bibr" rid="ref31">31</xref>], <italic>OPTUNA</italic> (version 3.1.0) [<xref ref-type="bibr" rid="ref32">32</xref>], <italic>imbalanced-learn</italic> (version 0.11.0) [<xref ref-type="bibr" rid="ref33">33</xref>], and <italic>Shapley additive explanations</italic> (<italic>SHAP</italic>; version 0.41.0) [<xref ref-type="bibr" rid="ref34">34</xref>]. Initially, we partitioned our dataset into a 75%:25% train:test split, preventing data leakage by keeping each participant’s data exclusively in either the training or test set. We conducted feature prefiltering by removing features with no or low variance, many missing observations, and a high correlation with other features. We compared filtering and wrapper-based methods and embedded feature selection methods with XGBoost classifiers for feature selection. We used data missingness, variance, and cross-correlation thresholding-based feature selection for the filtering-based method and the sequential forward selection method for the wrapper-based method. Standard preprocessing was applied to selected features, comprising imputation using median values, scaling transformations, and data normalization. To address the class imbalance and improve the robustness of our classification models against overfitting to the majority class, we used the synthetic minority oversampling technique (SMOTE) [<xref ref-type="bibr" rid="ref35">35</xref>], a method for generating synthetic minority class samples to balance the dataset. We applied SMOTE at 2 stages of the model’s development. First, the training data folds were balanced using SMOTE during the cross-validation process.
We then applied SMOTE to the entire training dataset in preparation for the final model fitting. For pipeline details, refer to <xref ref-type="supplementary-material" rid="app2">Multimedia Appendix 2</xref>.</p>
        <p>In our study, we focused on the prediction task of identifying (1) the presence and (2) the state transitions of depression symptoms using passively sensed smartphone data and supervised machine learning models. <xref rid="figure3" ref-type="fig">Figure 3</xref> outlines how data was used for prediction. Specifically, 3 models were examined, namely k-nearest neighbors, support vector classifier, and XGBoost, all of which are commonly used models in digital phenotyping studies [<xref ref-type="bibr" rid="ref36">36</xref>,<xref ref-type="bibr" rid="ref37">37</xref>]. To fine-tune feature filtering, transformation functions, classification model, and SMOTE hyperparameters, we used stratified grouped 5-fold cross-validation, using the OPTUNA framework [<xref ref-type="bibr" rid="ref32">32</xref>]. The primary objective in the hyperparameter optimization process was to maximize the <italic>F</italic><sub>1</sub>-score, which balances precision and recall, thereby ensuring a more reliable evaluation of model performance. We used a pruning early stopping technique, which ceases training if there is no improvement in the <italic>F</italic><sub>1</sub>-score (our chosen validation metric). Finally, we used the test data and bootstrapping validation (using 10,000 bootstrap samples from training data) to evaluate the model performance, assessing the performances with accuracy, precision, recall, negative predictive value (NPV), and <italic>F</italic><sub>1</sub>-scores, as defined in <xref ref-type="supplementary-material" rid="app3">Multimedia Appendix 3</xref>. <italic>F</italic><sub>1</sub>-score is a valuable metric because maximizing it ensures that both false positives (identifying a participant who is nondepressed as depressed) and false negatives (failing to identify a participant who is depressed) are minimized. High recall reflects low false-negative classification, so we emphasized its importance in model performance evaluation.</p>
        <fig id="figure3" position="float">
          <label>Figure 3</label>
          <caption>
            <p>Schema for depression presence and transition prediction using passive behavioral data. An asterisk (*) depicts a model using the PHQ-9 measurement from the preceding biweekly period as a predictor. Time point t0 on the analysis timeline represents the active phase, and points from t1 to t26 represent the passive phase. PHQ-9: 9-item Patient Health Questionnaire.</p>
          </caption>
          <graphic xlink:href="jmir_v26i1e56874_fig3.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Measuring Feature Importance</title>
        <p>For the final part, focusing on model interpretation, we assessed the importance of features (behavioral markers) for the best-performing XGBoost models to gain insight into the underlying classification mechanisms of the model. We evaluated the importance of each feature for depression presence and the state transition classifications using SHAP values [<xref ref-type="bibr" rid="ref34">34</xref>]. SHAP values measure each feature’s contribution to the model prediction, their relative importance compared with other features, and the significance of feature interactions.</p>
      </sec>
      <sec>
        <title>Ethical Considerations</title>
        <p>The Helsinki and Uusimaa Hospital District’s Ethics Committee approved the research protocol for the MoMo-Mood study (approval number § 125/2018). A research permit was granted by Helsinki and Uusimaa Hospital District Psychiatry. This covered data streams, data collection platform security, and participants’ consent information. All data in transit were encrypted, and participant privacy was a key design value. Local IT support and the research ethics committee approved the written data security statement. Study participants were presented with full information about the study and the data to be collected before providing written consent. The participants were allowed to withdraw whenever they chose. As remuneration for their participation, participants received 4 movie tickets at the end of the initial phase of the study.</p>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>Descriptive Statistics</title>
        <p>The raw data from the passive collection phase contained over 67 million data points, and 819 biweekly PHQ-9 surveys gathered data from 99 participants from 4 subgroups: 25 healthy controls, 46 patients with MDD, 16 patients with MDD&#124;BPD, and 12 patients with MDE&#124;BD. Participant selection, filtering, and preprocessing reduced the raw data to 327,200 data points (818 observations with 401 data features) and PHQ-9 scores to 818 observations. The resulting dataset had 83 participants, comprising 20 healthy controls, 41 patients with MDD, 12 patients with MDD&#124;BPD, and 10 patients with MDE&#124;BD.</p>
      </sec>
      <sec>
        <title>PHQ-9 Scores</title>
        <p>Most of the patients’ PHQ-9 scores during the passive data collection phase remained within the range of 5-19, representing mild to moderately severe clinical depression, while most control scores remained within the range of 0-4, representing no depression. The group-wise mean scores over the passive phase were as follows: control group, 1.2 (SD 1.8); MDD group, 11.9 (SD 6.7); MDE&#124;BD group, 13.7 (SD 6.5); and MDD&#124;BPD group, 13.8 (SD 6.6). It is noteworthy that the patient group scores predominantly represent mild to moderately severe clinical depression. <xref rid="figure4" ref-type="fig">Figure 4</xref> [<xref ref-type="bibr" rid="ref38">38</xref>] presents these differences and the distribution of PHQ-9 scores across the various groups.</p>
        <p>On average, PHQ-9 scores remained at similar levels within patient groups throughout the study, although all patient groups exhibited a slightly decreasing trend at the beginning of the study. At the group level, MDE&#124;BD and MDD&#124;BPD groups exhibited more fluctuation in the scores toward the end of the study period as the number of participants within those groups decreased. Control group scores exhibited a slightly decreasing trend. <xref rid="figure5" ref-type="fig">Figure 5</xref> shows the overall trends in PHQ-9 scores, averaged over each group throughout the study. It is worth noting that the number of participants decreased over time, leading to increased fluctuations in average scores.</p>
        <fig id="figure4" position="float">
          <label>Figure 4</label>
          <caption>
            <p>PHQ-9 score distributions for control and patient groups. To assess differences in PHQ-9 scores across various groups, we used a generalized estimating equations approach. We chose the method due to its effectiveness in dealing with correlated response data and its ability to provide robust SEs. The analysis revealed statistically significant differences in PHQ-9 scores between the control group and each of the patient groups. The significance of these differences was high, with <italic>P</italic>&#60;.001 for each comparison. MDD: major depressive disorder; MDD&#124;BPD: major depressive disorder with comorbid borderline personality disorder; MDE&#124;BD: major depressive episodes with bipolar disorder; PHQ-9: 9-item Patient Health Questionnaire.</p>
          </caption>
          <graphic xlink:href="jmir_v26i1e56874_fig4.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <fig id="figure5" position="float">
          <label>Figure 5</label>
          <caption>
            <p>Averaged PHQ-9 score trends for controls and patient groups (standard deviations depicted by shaded regions). MDD: major depressive disorder; MDD&#124;BPD: major depressive disorder with comorbid borderline personality disorder; MDE&#124;BD: major depressive episodes with bipolar disorder; PHQ-9: 9-item Patient Health Questionnaire.</p>
          </caption>
          <graphic xlink:href="jmir_v26i1e56874_fig5.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <p>We compared the groups by depression severity by categorizing participants using a cutoff PHQ-9 score threshold of 10. Participants with a PHQ-9 score of 10 or higher were categorized as “Depressed,” and those below 10 were categorized as “Nondepressed.” <xref ref-type="table" rid="table2">Table 2</xref> shows the prevalence of depression severity across different patient groups.</p>
        <p>We categorized the 818 data points into 2 groups: 347 (42.4%) observations classified as depressed and 471 (57.6%) observations classified as nondepressed, resulting in mildly imbalanced classes considering the classification tasks. We assessed biweekly depression state transitions for each group, as described in <xref ref-type="table" rid="table1">Table 1</xref>. <xref ref-type="table" rid="table3">Table 3</xref> summarizes these transitions. Notably, the number of transitions for “Declines” and “Improves” was significantly lower than those for “Remains depressed” and “Remains nondepressed.”</p>
        <p>These results show that in the data, the state changes in depression are infrequent compared with the occurrences where the state remains the same. Here, we noticed that transition classes have a significant imbalance, as only 119 (14.5%) of the 818 observations were state changes, whereas 699 (85.5%) were stationary. This pronounced imbalance could bias classification algorithms toward the majority class, necessitating corrective measures for reliable analysis in subsequent stages.</p>
        <table-wrap position="float" id="table2">
          <label>Table 2</label>
          <caption>
            <p>Distribution of PHQ-9<sup>a</sup> scores by severity and group (n=818).</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="270"/>
            <col width="140"/>
            <col width="140"/>
            <col width="140"/>
            <col width="140"/>
            <col width="140"/>
            <thead>
              <tr valign="top">
                <td colspan="2">Group</td>
                <td>Control</td>
                <td>MDE&#124;BD<sup>b</sup></td>
                <td>MDD&#124;BPD<sup>c</sup></td>
                <td>MDD<sup>d</sup></td>
                <td>Total</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="7">
                  Depression severity, n (%)
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Depressed</td>
                <td>1 (0.1)</td>
                <td>65 (7.9)</td>
                <td>50 (6.1)</td>
                <td>231 (28.2)</td>
                <td>347 (42.4)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Nondepressed</td>
                <td>204 (24.9)</td>
                <td>36 (4.4)</td>
                <td>24 (2.9)</td>
                <td>207 (25.3)</td>
                <td>471 (57.6)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Total</td>
                <td>205 (25.1)</td>
                <td>101 (12.3)</td>
                <td>74 (9)</td>
                <td>438 (53.5)</td>
                <td>818 (100)</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table2fn1">
              <p><sup>a</sup>PHQ-9: 9-Item Patient Health Questionnaire.</p>
            </fn>
            <fn id="table2fn2">
              <p><sup>b</sup>MDE&#124;BD: major depressive episodes with bipolar disorder.</p>
            </fn>
            <fn id="table2fn3">
              <p><sup>c</sup>MDD&#124;BPD: major depressive disorder with comorbid borderline personality disorder.</p>
            </fn>
            <fn id="table2fn4">
              <p><sup>d</sup>MDD: major depressive disorder.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <table-wrap position="float" id="table3">
          <label>Table 3</label>
          <caption>
            <p>Depression state transition counts for the control group and each patient group.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="280"/>
            <col width="0"/>
            <col width="140"/>
            <col width="0"/>
            <col width="140"/>
            <col width="0"/>
            <col width="140"/>
            <col width="0"/>
            <col width="140"/>
            <col width="0"/>
            <col width="130"/>
            <thead>
              <tr valign="top">
                <td colspan="3">Group</td>
                <td colspan="2">Control</td>
                <td colspan="2">MDE&#124;BD<sup>a</sup></td>
                <td colspan="2">MDD&#124;BPD<sup>b</sup></td>
                <td colspan="2">MDD<sup>c</sup></td>
                <td>Total</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="12">
                  Transition, n
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Declines</td>
                <td colspan="2">1</td>
                <td colspan="2">9</td>
                <td colspan="2">5</td>
                <td colspan="2">34</td>
                <td colspan="2">49</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Improves</td>
                <td colspan="2">1</td>
                <td colspan="2">15</td>
                <td colspan="2">11</td>
                <td colspan="2">43</td>
                <td colspan="2">70</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Remains depressed</td>
                <td colspan="2">0</td>
                <td colspan="2">57</td>
                <td colspan="2">42</td>
                <td colspan="2">222</td>
                <td colspan="2">320</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Remains nondepressed</td>
                <td colspan="2">203</td>
                <td colspan="2">20</td>
                <td colspan="2">17</td>
                <td colspan="2">139</td>
                <td colspan="2">379</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Total</td>
                <td colspan="2">205</td>
                <td colspan="2">101</td>
                <td colspan="2">74</td>
                <td colspan="2">438</td>
                <td colspan="2">818</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table3fn1">
              <p><sup>a</sup>MDE&#124;BD: major depressive episodes with bipolar disorder.</p>
            </fn>
            <fn id="table3fn2">
              <p><sup>b</sup>MDD&#124;BPD: major depressive disorder with comorbid borderline personality disorder.</p>
            </fn>
            <fn id="table3fn3">
              <p><sup>c</sup>MDD: major depressive disorder.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
      <sec>
        <title>Data Completeness</title>
        <p>Participant compliance and, thus, data completeness decreased as the study’s passive phase progressed. PHQ-9 survey answer compliance dropped below 70% after 6 weeks (3 biweekly periods) had passed, and after that, it continued to decline steadily. For further details, refer to <xref ref-type="supplementary-material" rid="app4">Multimedia Appendix 4</xref>. Passive data collection compliance shows a pattern similar to answering the PHQ-9 survey. Most of the missing data occurred due to the participant dropping out of the study, while some participants had gaps in data collection. Notably, only a few participants remained in the study for the entire year. Also, the data collection for participants was incomplete due to missing features.</p>
      </sec>
      <sec>
        <title>Statistical Analysis</title>
        <p>Distributional testing using a 2-sample Kolmogorov-Smirnov test identified 20 significant features (5%), with <italic>P</italic> values ranging from .0045 to .0497. However, after applying the FDR correction for multiple comparisons at a significance level α=.05, none of these features were statistically significant; thus, we found no evidence for patient group behavioral data differing from control data. For further details, see Table S1 in <xref ref-type="supplementary-material" rid="app5">Multimedia Appendix 5</xref>.</p>
        <p>Correlation analysis between the behavioral features and PHQ-9 scores using Spearman ranked correlation and FDR correction for multiple comparisons at significance level α=.05 resulted in 32 (8%) out of 401 features exhibiting statistically significant correlations. The majority (18/32, 56%) of the correlations were very weak (absolute value from 0 to 0.19), and the rest (14/32, 44%) were weak (absolute value from 0.2 to 0.39). For more information, refer to Table S2 in <xref ref-type="supplementary-material" rid="app5">Multimedia Appendix 5</xref>.</p>
      </sec>
      <sec>
        <title>Depression Presence Classification</title>
        <p>We used 2 distinct approaches for classifying the presence of depression. The initial approach treated all biweekly aggregated passive data features (aligned with corresponding biweekly PHQ-9 scores) as independent observations. Using the XGBoost classifier with filter-based feature selection, we achieved the highest accuracy of 66% (95% CI 56%-70%) and an <italic>F</italic><sub>1</sub>-score of 0.66 (95% CI 0.5-0.7). The performance comparison of various classifiers and feature selection methods is detailed in Table S1 in <xref ref-type="supplementary-material" rid="app6">Multimedia Appendix 6</xref>, while Table S2 in <xref ref-type="supplementary-material" rid="app6">Multimedia Appendix 6</xref> provides a comprehensive summary of the model’s performance.</p>
        <p>For the second modeling approach, we included the measured PHQ-9 score from the previous biweekly period as a predictor in the model. Model performance improves notably after adding the predictor. XGBoost classifier with a filtering-based feature selection method achieved the best accuracy of 82% (95% CI 80%-84%) and a corresponding <italic>F</italic><sub>1</sub>-score of 0.82 (95% CI 0.80-0.85) across the test data of 208 samples.</p>
        <p>This classifier outperformed the other classifiers (k-nearest neighbor and support vector classifier) by a small margin. The “Nondepressed” class (99 samples) achieved a precision of 0.80 and recall of 0.83, with an NPV of 0.84 and an <italic>F</italic><sub>1</sub>-score of 0.81, reflecting balanced performance. The “Depressed” class (109 samples) had a slightly higher precision of 0.84, a recall of 0.81, an NPV of 0.80, and an <italic>F</italic><sub>1</sub>-score of 0.82, indicating a similar level of predictive accuracy to the “Nondepressed” class. Both macro- and weighted averages across precision, recall, <italic>F</italic><sub>1</sub>-score, and NPV are 0.82, demonstrating consistent performance in detecting both the presence and absence of depression. Table S3 in <xref ref-type="supplementary-material" rid="app6">Multimedia Appendix 6</xref> summarizes the performance of selected classifiers and feature selection methods. <xref ref-type="table" rid="table4">Table 4</xref> summarizes the XGBoost classifier's performance, and Figure S1 in <xref ref-type="supplementary-material" rid="app6">Multimedia Appendix 6</xref> presents the receiver operating characteristic curve for the classifier.</p>
        <table-wrap position="float" id="table4">
          <label>Table 4</label>
          <caption>
            <p>XGBoost<sup>a</sup> model performance metrics for depression presence classification (using previous PHQ-9<sup>b</sup> score as a predictor).</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="260"/>
            <col width="0"/>
            <col width="150"/>
            <col width="0"/>
            <col width="140"/>
            <col width="0"/>
            <col width="140"/>
            <col width="0"/>
            <col width="140"/>
            <col width="0"/>
            <col width="140"/>
            <thead>
              <tr valign="top">
                <td colspan="3">Metric</td>
                <td colspan="2">Precision</td>
                <td colspan="2">Recall</td>
                <td colspan="2">NPV<sup>c</sup></td>
                <td colspan="2"><italic>F</italic><sub>1</sub>-score</td>
                <td>Support, n</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="12">
                  Class
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Nondepressed</td>
                <td colspan="2">0.80</td>
                <td colspan="2">0.83</td>
                <td colspan="2">0.84</td>
                <td colspan="2">0.81</td>
                <td colspan="2">99</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Depressed</td>
                <td colspan="2">0.84</td>
                <td colspan="2">0.81</td>
                <td colspan="2">0.80</td>
                <td colspan="2">0.82</td>
                <td colspan="2">109</td>
              </tr>
              <tr valign="top">
                <td colspan="12">
                  Averages
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Macroaverage</td>
                <td colspan="2">0.82</td>
                <td colspan="2">0.82</td>
                <td colspan="2">0.82</td>
                <td colspan="2">0.82</td>
                <td colspan="2">208</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Weighted average</td>
                <td colspan="2">0.82</td>
                <td colspan="2">0.82</td>
                <td colspan="2">0.82</td>
                <td colspan="2">0.82</td>
                <td colspan="2">208</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table4fn1">
              <p><sup>a</sup>XGBoost: extreme gradient boosting.</p>
            </fn>
            <fn id="table4fn2">
              <p><sup>b</sup>PHQ-9: 9-item Patient Health Questionnaire.</p>
            </fn>
            <fn id="table4fn3">
              <p><sup>c</sup>NPV: negative predictive value.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
      <sec>
        <title>Depression State Transition Classification</title>
        <p>For depression state transition classification, we used the XGBoost classifier with feature filtering since it performed best in the depression presence classification. The model was able to classify relatively well the cases where a participant’s state remains the same, while the accuracy is considerably lower for cases where the state changes. Applying SMOTE’s synthetic oversampling technique to alleviate class imbalance significantly increased the recall of the minority classes (depression transitions for “Declines” and “Increases”). The model achieved an accuracy of 75% (95% CI 72%-76%) and a corresponding <italic>F</italic><sub>1</sub>-score of 0.67 (95% CI 0.63-0.69). <xref ref-type="table" rid="table5">Table 5</xref> summarizes the model validation results for each transition type. For the transition of “Declines,” the model shows high NPV (0.98) but lower precision (0.34). This indicates that while the model reliably identifies cases where the state will not decline, it is less accurate at correctly identifying the cases where it declines. The recall is 0.76, leading to an <italic>F</italic><sub>1</sub>-score of 0.47, signifying unbalanced classification performance. “Increases” shows a similar pattern with high NPV (0.96) and moderate recall (0.74) but lower precision (0.46), resulting in an <italic>F</italic><sub>1</sub>-score of 0.57, also indicating unbalanced classification performance. For the “Remains depressed” and “Remains nondepressed” states, the model exhibits higher precision (0.93 and 0.95, respectively) and NPV (0.86 and 0.83, respectively), along with recall rates of 0.72 and 0.77, leading to a more balanced performance with <italic>F</italic><sub>1</sub>-scores of 0.81 and 0.85. The macroaverage <italic>F</italic><sub>1</sub>-score of 0.67, compared with the overall accuracy of 0.75, reflects the effect of class imbalance on the model’s performance. Further, Figures S2 and S3 in <xref ref-type="supplementary-material" rid="app6">Multimedia Appendix 6</xref> display classification outcomes for the test data and a multiclass receiver operating characteristic curve for the XGBoost classifier.</p>
        <p>The results show the model’s ability to classify most cases correctly. With an overall accuracy of 75%, the model effectively balances precision across different cases. These findings demonstrate the model’s potential for predicting depression state transitions, leveraging smartphone-sensed behavioral data and self-reported PHQ-9 scores.</p>
        <table-wrap position="float" id="table5">
          <label>Table 5</label>
          <caption>
            <p>XGBoost<sup>a</sup> model performance metrics for depression state transition classification (using previous PHQ-9<sup>b</sup> score as a predictor).</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="290"/>
            <col width="0"/>
            <col width="130"/>
            <col width="0"/>
            <col width="130"/>
            <col width="0"/>
            <col width="140"/>
            <col width="0"/>
            <col width="140"/>
            <col width="0"/>
            <col width="140"/>
            <thead>
              <tr valign="top">
                <td colspan="3">Metric</td>
                <td colspan="2">Precision</td>
                <td colspan="2">Recall</td>
                <td colspan="2">NPV<sup>c</sup></td>
                <td colspan="2"><italic>F</italic><sub>1</sub>-score</td>
                <td>Support, n</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="12">
                  Transition
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Declines</td>
                <td colspan="2">0.34</td>
                <td colspan="2">0.76</td>
                <td colspan="2">0.98</td>
                <td colspan="2">0.47</td>
                <td colspan="2">17</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Increases</td>
                <td colspan="2">0.46</td>
                <td colspan="2">0.74</td>
                <td colspan="2">0.96</td>
                <td colspan="2">0.57</td>
                <td colspan="2">23</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Remains depressed</td>
                <td colspan="2">0.93</td>
                <td colspan="2">0.72</td>
                <td colspan="2">0.86</td>
                <td colspan="2">0.81</td>
                <td colspan="2">74</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Remains nondepressed</td>
                <td colspan="2">0.95</td>
                <td colspan="2">0.77</td>
                <td colspan="2">0.83</td>
                <td colspan="2">0.85</td>
                <td colspan="2">94</td>
              </tr>
              <tr valign="top">
                <td colspan="12">
                  Averages
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Macroaverage</td>
                <td colspan="2">0.67</td>
                <td colspan="2">0.75</td>
                <td colspan="2">0.91</td>
                <td colspan="2">0.67</td>
                <td colspan="2">208</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Weighted average</td>
                <td colspan="2">0.84</td>
                <td colspan="2">0.75</td>
                <td colspan="2">0.87</td>
                <td colspan="2">0.77</td>
                <td colspan="2">208</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table5fn1">
              <p><sup>a</sup>XGBoost: extreme gradient boosting.</p>
            </fn>
            <fn id="table5fn2">
              <p><sup>b</sup>PHQ-9: 9-Item Patient Health Questionnaire.</p>
            </fn>
            <fn id="table5fn3">
              <p><sup>c</sup>NPV: negative predictive value.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
      <sec>
        <title>Feature Importance Analysis Using SHAP Values</title>
        <p>In our analysis of feature importance for classification of the presence of depression and depression state transition, we evaluated the relative significance of different features by examining the SHAP values in the best-performing XGBoost models. In summary, our findings highlight the previous PHQ-9 score as the most impactful feature when included in the model. For depression presence classification, additional significant features include smartphone screen status, app usage, battery level, phone call, and location–related information. In addition to the previous PHQ-9 score for state transition classification, screen status, location–, battery level– and accelerometer–related features stand out as the most important. Conversely, app usage and communication–related features had a limited impact on the models.</p>
        <p>The importance of the previous PHQ-9 score implies that the depression scores are autocorrelated, thus reflecting future depression levels. Smartphone screen status (e.g., screen on and off event counts) reveals users' interaction with the device, showing usage frequency and patterns. Similarly, battery level indicates phone usage, reflecting battery drains and charges. App usage features (especially apps labeled as leisure, sports, and social media) suggest behavioral patterns related to such activities as watching movies or listening to music, exercising, and communicating via social media. Finally, accelerometer-related features reveal physical activity and mobility patterns.</p>
        <p>Figures S1-S3 in <xref ref-type="supplementary-material" rid="app7">Multimedia Appendix 7</xref> present the most important features of these classifications. Specifically, Figure S1 in <xref ref-type="supplementary-material" rid="app7">Multimedia Appendix 7</xref> illustrates the important features of depression presence classification without considering the previous biweekly PHQ-9 scores. Conversely, Figure S2 in <xref ref-type="supplementary-material" rid="app7">Multimedia Appendix 7</xref> shows the results for the model that includes these scores as a predictor. Finally, Figure S3 in <xref ref-type="supplementary-material" rid="app7">Multimedia Appendix 7</xref> explores features pertinent to depression state transition classification.</p>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Principal Findings</title>
        <p>Our analysis encompassed passively sensed digital behavioral data, which we compared against actively collected PHQ-9 survey data. Using the generalized estimating equation approach, we discovered a statistically significant difference in PHQ-9 score distributions between the control and patient groups. It is important to note that some patients likely experienced recovery after recruitment for the study, potentially lessening the severity of symptoms reflected in their PHQ-9 scores. Consequently, our data could underrepresent the depression severity spectrum, particularly among patients with more severe depression.</p>
        <p>After adjusting for multiple comparisons, distributional testing on behavioral features revealed no significant differences between control and patient groups. This finding suggests that the differences in behavioral data at the group level are minimal. Therefore, our study implies that detecting these subtle differences might require larger sample sizes or alternative statistical methodologies that can leverage hierarchical structures and temporal correlations.</p>
        <p>Correlation analysis identified 32 behavioral features with weak or very weak correlations with PHQ-9 scores, predominantly involving smartphone screen interaction (18 features) and accelerometer data (14 features). Despite most features showing no significant correlation with PHQ-9 scores, their potential value in classification tasks remains, especially considering possible nonlinear relationships or interactions with other features.</p>
        <p>For the depression prediction tasks, we found that the XGBoost classifier with filtering-based feature selection performed the best in discriminating between participants who are depressed and nondepressed, achieving 66% accuracy. The accuracy increased to 82% when we added the PHQ-9 score from the previous biweekly period as a predictor. The difference implies the importance of the temporal structure of the data. Therefore, we propose to include temporal information in future analyses to improve the accuracy. Further, for clinical monitoring applications, information about participants’ depression histories should be available, providing the temporal context necessary to enhance the model's predictive accuracy.</p>
        <p>Furthermore, our results show that the XGBoost classifier, combined with filter-based feature selection and PHQ-9 measurement from the previous biweekly monitoring period as a predictor, can differentiate mood state transitions with a classification accuracy of 75%. While promising, this accuracy level suggests room for further improvement in the model’s performance. As with the depression presence classification, we suggest using more comprehensive methods, personalized models, and temporal information. Additionally, we suspect that the data’s limited sample size and sparsity of transition events hinder the classification performance. Therefore, model development should benefit from a larger sample.</p>
        <p>Finally, feature importance analysis revealed insights into the key features of depression prediction models. The most significant predictor for detecting and classifying depression presence was previous biweekly PHQ-9 scores, complemented by features related to accelerometer, app usage, battery level, location, and screen events. The results emphasize the significance of daily behavioral patterns and time-of-day distinctions (morning, afternoon, evening, and nighttime) in accurately predicting depression. Interestingly, some features were identified by both the correlation and feature importance analyses for classifier models. While the methods and objectives of these analyses differ, the consistency in identifying the same key features across both approaches implies their potential relevance in depression prediction.</p>
      </sec>
      <sec>
        <title>Comparison With Previous Studies</title>
        <p>Our study aligns methodologically with previous research using validated depression assessments and analyzing passively collected smartphone behavioral features. Also, it focuses on statistical inference and machine learning techniques to classify depression among participants and distinguish participants based on behavioral data. Additionally, the identified important features are consistent with earlier research reporting features related to phone usage [<xref ref-type="bibr" rid="ref9">9</xref>,<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref14">14</xref>,<xref ref-type="bibr" rid="ref15">15</xref>], physical activity [<xref ref-type="bibr" rid="ref11">11</xref>-<xref ref-type="bibr" rid="ref17">17</xref>], and location data [<xref ref-type="bibr" rid="ref9">9</xref>-<xref ref-type="bibr" rid="ref15">15</xref>,<xref ref-type="bibr" rid="ref17">17</xref>]. By contrast, the importance of features related to communication [<xref ref-type="bibr" rid="ref12">12</xref>,<xref ref-type="bibr" rid="ref14">14</xref>,<xref ref-type="bibr" rid="ref17">17</xref>] was slightly underrepresented in our analysis.</p>
        <p>Our classification results are numerically comparable to previous studies using machine learning methods with smartphone data for depression detection. Using a cohort of college students, Chikersal et al [<xref ref-type="bibr" rid="ref14">14</xref>] achieved an 85% accuracy and an <italic>F</italic><sub>1</sub>-score of 0.82 in the postsemester depression detection task. They also achieved an 85% accuracy and an <italic>F</italic><sub>1</sub>-score of 0.80 in detecting a change in the depression state task. Similarly, Wang et al [<xref ref-type="bibr" rid="ref15">15</xref>] used machine learning and deep learning models to detect depression using a subset of smartphones, also from a cohort of college students, achieving an <italic>F</italic><sub>1</sub>-score of 0.65 using a machine learning model and an <italic>F</italic><sub>1</sub>-score of 0.7 using deep learning.</p>
        <p>However, our study differentiates itself by including a diverse cohort of real outpatients, clinically diagnosed with structured interviews, alongside control participants, thereby offering a broader perspective on depression. Additionally, the data are collected over an extended period in a naturalistic setting, enhancing the reliability of the findings. Unlike other studies that often focus on student populations, it demonstrates the feasibility of digital behavioral monitoring in real outpatients. Furthermore, it excludes certain data features like physiological measurements and social engagement metrics. Lastly, the study does not aim to predict future depressive states, setting it apart from other predictive modeling efforts in the field.</p>
      </sec>
      <sec>
        <title>Limitations</title>
        <p>While this research yields insightful outcomes, it is crucial to acknowledge certain limitations. First, dropouts and missing data increased substantially after the first 3 biweekly periods. Some participants provided data only for 1 biweekly period, limiting our model’s ability to capture patient symptom fluctuations. Second, our analysis does not fully account for the hierarchical and autocorrelational structure of the data. We rely on simplified analysis, using aggregated features and pooled participants, resulting in the loss of available information. Finally, our study does not accommodate external factors that might impact the participants’ behavior patterns and mood states. Given that the data collection partially took place during the COVID-19 era, factors such as social isolation could have played a role in changing the behavior patterns and emotional states of participants.</p>
      </sec>
      <sec>
        <title>Recommendations for Future Work</title>
        <p>This study lays the groundwork for multiple future research endeavors. A direct expansion of our work would be the implementation of personalized models designed to predict the depression state of individuals. These personalized models, which incorporate both group and participant variations and sample-level information, have demonstrated improved accuracy in depression classification tasks [<xref ref-type="bibr" rid="ref39">39</xref>]. Furthermore, we recommend fully using the temporal structure of the data in classification tasks. Given the inherent variability in symptomatic periods among patients with depression, analyzing temporal patterns and trends from longitudinal data could offer a more accurate representation of their evolving mental states than single-point estimates. We also encourage the exploration of deep learning models in future studies, as these models tend to surpass conventional machine learning methods in predictive accuracy [<xref ref-type="bibr" rid="ref15">15</xref>,<xref ref-type="bibr" rid="ref16">16</xref>]. However, due to their complexity and less clear interpretability relative to more traditional methods, we suggest not starting with these models at the outset, instead gradually incorporating them into the analysis. Lastly, to address the challenges posed by the unbalanced dataset in our study, we suggest collecting additional data to enhance the robustness and generalizability of future research findings.</p>
      </sec>
      <sec>
        <title>Conclusions</title>
        <p>In summary, this study demonstrates the potential of using smartphone-sensed behavioral data for monitoring depression symptoms, thereby paving the way for personalized and more effective mental health care. The results contribute to an expanding body of evidence supporting the integration of data-driven methods into mental health services. These insights may complement and enhance clinical practices, supplementing conventional diagnostic and monitoring approaches.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group>
      <supplementary-material id="app1">
        <label>Multimedia Appendix 1</label>
        <p>Summary of data sources and extracted features for each sensor.</p>
        <media xlink:href="jmir_v26i1e56874_app1.docx" xlink:title="DOCX File , 8 KB"/>
      </supplementary-material>
      <supplementary-material id="app2">
        <label>Multimedia Appendix 2</label>
        <p>The machine learning pipeline for depression presence and state transition classification.</p>
        <media xlink:href="jmir_v26i1e56874_app2.docx" xlink:title="DOCX File , 114 KB"/>
      </supplementary-material>
      <supplementary-material id="app3">
        <label>Multimedia Appendix 3</label>
        <p>Definitions for key performance metrics: accuracy, precision, recall, negative predictive value, and F1-score.</p>
        <media xlink:href="jmir_v26i1e56874_app3.docx" xlink:title="DOCX File , 9 KB"/>
      </supplementary-material>
      <supplementary-material id="app4">
        <label>Multimedia Appendix 4</label>
        <p>The percentage of participants providing PHQ-9 data over time by group. PHQ-9: 9-item Patient Health Questionnaire.</p>
        <media xlink:href="jmir_v26i1e56874_app4.docx" xlink:title="DOCX File , 11 KB"/>
      </supplementary-material>
      <supplementary-material id="app5">
        <label>Multimedia Appendix 5</label>
        <p>Kolmogorov-Smirnov test results for behavioral data distribution differences and Spearman rank correlation test results between behavioral data features and PHQ-9 scores. PHQ-9: 9-item Patient Health Questionnaire.</p>
        <media xlink:href="jmir_v26i1e56874_app5.docx" xlink:title="DOCX File , 14 KB"/>
      </supplementary-material>
      <supplementary-material id="app6">
        <label>Multimedia Appendix 6</label>
        <p>Performance comparison of depression presence classification models. Performance metrics for depression presence classification: nondepressed versus depressed. Comparative performance of depression presence classification models with biweekly PHQ-9 score as a predictor. ROC curves for depression presence classification and different depression transition classifications. Confusion matrix for depression state transition classification. PHQ-9: 9-item Patient Health Questionnaire; ROC: receiver operating characteristic.</p>
        <media xlink:href="jmir_v26i1e56874_app6.docx" xlink:title="DOCX File , 371 KB"/>
      </supplementary-material>
      <supplementary-material id="app7">
        <label>Multimedia Appendix 7</label>
        <p>Key features in depression presence XGBoost classification model based on SHAP values. Key features in depression presence classification XGBoost model with preceding biweekly PHQ-9 score as a predictor. Key features in depression state transition classification XGBoost model with previous PHQ-9 score. PHQ-9: 9-item Patient Health Questionnaire; SHAP: Shapley additive explanations; XGBoost: extreme gradient boosting.</p>
        <media xlink:href="jmir_v26i1e56874_app7.docx" xlink:title="DOCX File , 175 KB"/>
      </supplementary-material>
    </app-group>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">FDR</term>
          <def>
            <p>false discovery rate</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">MDD</term>
          <def>
            <p>major depressive disorder</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">MDD&#124;BPD</term>
          <def>
            <p>major depressive disorder with comorbid borderline personality disorder</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">MDE&#124;BD</term>
          <def>
            <p>major depressive episodes with bipolar disorder</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">MoMo-Mood</term>
          <def>
            <p>Mobile Monitoring of Mood</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb6">NPV</term>
          <def>
            <p>negative predictive value</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb7">PHQ-4</term>
          <def>
            <p>4-item Patient Health Questionnaire</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb8">PHQ-9</term>
          <def>
            <p>9-item Patient Health Questionnaire</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb9">SMOTE</term>
          <def>
            <p>synthetic minority over-sampling technique</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb10">SHAP</term>
          <def>
            <p>Shapley additive explanations</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb11">XGBoost</term>
          <def>
            <p>extreme gradient boosting</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>We acknowledge the support and input from Jesper Ekelund regarding the study design and data collection. The computational resources provided by the Aalto Science-IT project are gratefully acknowledged. We thank Yunhao Yuan for providing support and feedback for the visualizations.</p>
    </ack>
    <notes>
      <title>Data Availability</title>
      <p>Because the data are highly sensitive, the collected data cannot be shared with researchers outside of our consortium. Our research permit does not allow the free availability of these data.</p>
    </notes>
    <fn-group>
      <fn fn-type="con">
        <p>AI contributed to writing – original draft, writing – review &#38; editing, visualization, methodology, formal analysis, validation, data curation, and conceptualization. NL contributed to writing – original draft, writing – review &#38; editing, methodology, and data curation. IB contributed to investigation, methodology, and writing – review &#38; editing. RD contributed to investigation, data collection software, data curation, and writing – review &#38; editing. RH contributed to investigation and methodology. JH contributed to investigation. AM contributed to investigation and writing – review &#38; editing. KR contributed to investigation and methodology. OS contributed to investigation. EI contributed to writing – review &#38; editing, investigation, project administration, methodology, supervision, funding acquisition, and conceptualization. TA contributed to writing – review &#38; editing, supervision, project administration, investigation, methodology, funding acquisition, and conceptualization.</p>
      </fn>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="web">
          <article-title>World mental health report: transforming mental health for all</article-title>
          <source>World Health Organization</source>
          <year>2022</year>
          <month>6</month>
          <day>16</day>
          <access-date>2024-01-26</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.who.int/publications/i/item/9789240049338">https://www.who.int/publications/i/item/9789240049338</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <collab>The Lancet Global Health</collab>
          </person-group>
          <article-title>Mental health matters</article-title>
          <source>Lancet Glob Health</source>
          <year>2020</year>
          <volume>8</volume>
          <issue>11</issue>
          <fpage>e1352</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S2214-109X(20)30432-0"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/S2214-109X(20)30432-0</pub-id>
          <pub-id pub-id-type="medline">33069297</pub-id>
          <pub-id pub-id-type="pii">S2214-109X(20)30432-0</pub-id>
          <pub-id pub-id-type="pmcid">PMC7561290</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Nelson</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>McGorry</surname>
              <given-names>PD</given-names>
            </name>
            <name name-style="western">
              <surname>Wichers</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Wigman</surname>
              <given-names>JTW</given-names>
            </name>
            <name name-style="western">
              <surname>Hartmann</surname>
              <given-names>JA</given-names>
            </name>
          </person-group>
          <article-title>Moving from static to dynamic models of the onset of mental disorder: a review</article-title>
          <source>JAMA Psychiatry</source>
          <year>2017</year>
          <volume>74</volume>
          <issue>5</issue>
          <fpage>528</fpage>
          <lpage>534</lpage>
          <pub-id pub-id-type="doi">10.1001/jamapsychiatry.2017.0001</pub-id>
          <pub-id pub-id-type="medline">28355471</pub-id>
          <pub-id pub-id-type="pii">2612446</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Torous</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Kiang</surname>
              <given-names>MV</given-names>
            </name>
            <name name-style="western">
              <surname>Lorme</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Onnela</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>New tools for new research in psychiatry: a scalable and customizable platform to empower data driven smartphone research</article-title>
          <source>JMIR Ment Health</source>
          <year>2016</year>
          <volume>3</volume>
          <issue>2</issue>
          <fpage>e16</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://mental.jmir.org/2016/2/e16/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/mental.5165</pub-id>
          <pub-id pub-id-type="medline">27150677</pub-id>
          <pub-id pub-id-type="pii">v3i2e16</pub-id>
          <pub-id pub-id-type="pmcid">PMC4873624</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hsin</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Fromer</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Peterson</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Walter</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Fleck</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Campbell</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Varghese</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Califf</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Transforming psychiatry into data-driven medicine with digital measurement tools</article-title>
          <source>NPJ Digit Med</source>
          <year>2018</year>
          <volume>1</volume>
          <fpage>37</fpage>
          <pub-id pub-id-type="doi">10.1038/s41746-018-0046-0</pub-id>
          <pub-id pub-id-type="medline">31304319</pub-id>
          <pub-id pub-id-type="pii">46</pub-id>
          <pub-id pub-id-type="pmcid">PMC6550182</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Maatoug</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Oudin</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Adrien</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Saudreau</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Bonnot</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Millet</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Ferreri</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Mouchabac</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Bourla</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Digital phenotype of mood disorders: a conceptual and critical review</article-title>
          <source>Front Psychiatry</source>
          <year>2022</year>
          <month>7</month>
          <day>26</day>
          <volume>13</volume>
          <fpage>895860</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/35958638"/>
          </comment>
          <pub-id pub-id-type="doi">10.3389/fpsyt.2022.895860</pub-id>
          <pub-id pub-id-type="medline">35958638</pub-id>
          <pub-id pub-id-type="pmcid">PMC9360315</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Leaning</surname>
              <given-names>IE</given-names>
            </name>
            <name name-style="western">
              <surname>Ikani</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Savage</surname>
              <given-names>HS</given-names>
            </name>
            <name name-style="western">
              <surname>Leow</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Beckmann</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Ruhé</surname>
              <given-names>HG</given-names>
            </name>
            <name name-style="western">
              <surname>Marquand</surname>
              <given-names>AF</given-names>
            </name>
          </person-group>
          <article-title>From smartphone data to clinically relevant predictions: a systematic review of digital phenotyping methods in depression</article-title>
          <source>Neurosci Biobehav Rev</source>
          <year>2024</year>
          <volume>158</volume>
          <fpage>105541</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S0149-7634(24)00009-5"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.neubiorev.2024.105541</pub-id>
          <pub-id pub-id-type="medline">38215802</pub-id>
          <pub-id pub-id-type="pii">S0149-7634(24)00009-5</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bufano</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Laurino</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Said</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Tognetti</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Menicucci</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Digital phenotyping for monitoring mental disorders: systematic review</article-title>
          <source>J Med Internet Res</source>
          <year>2023</year>
          <volume>25</volume>
          <fpage>e46778</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2023/1/e46778/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/46778</pub-id>
          <pub-id pub-id-type="medline">38090800</pub-id>
          <pub-id pub-id-type="pii">v25i1e46778</pub-id>
          <pub-id pub-id-type="pmcid">PMC10753422</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Saeb</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Kwasny</surname>
              <given-names>MM</given-names>
            </name>
            <name name-style="western">
              <surname>Karr</surname>
              <given-names>CJ</given-names>
            </name>
            <name name-style="western">
              <surname>Kording</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Mohr</surname>
              <given-names>DC</given-names>
            </name>
          </person-group>
          <article-title>The relationship between clinical, momentary, and sensor-based assessment of depression</article-title>
          <source>Int Conf Pervasive Comput Technol Healthc</source>
          <year>2015</year>
          <volume>2015</volume>
          <fpage>e4273</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/26640739"/>
          </comment>
          <pub-id pub-id-type="doi">10.4108/icst.pervasivehealth.2015.259034</pub-id>
          <pub-id pub-id-type="medline">26640739</pub-id>
          <pub-id pub-id-type="pmcid">PMC4667797</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Saeb</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Lattie</surname>
              <given-names>EG</given-names>
            </name>
            <name name-style="western">
              <surname>Schueller</surname>
              <given-names>SM</given-names>
            </name>
            <name name-style="western">
              <surname>Kording</surname>
              <given-names>KP</given-names>
            </name>
            <name name-style="western">
              <surname>Mohr</surname>
              <given-names>DC</given-names>
            </name>
          </person-group>
          <article-title>The relationship between mobile phone location sensor data and depressive symptom severity</article-title>
          <source>PeerJ</source>
          <year>2016</year>
          <volume>4</volume>
          <fpage>e2537</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/28344895"/>
          </comment>
          <pub-id pub-id-type="doi">10.7717/peerj.2537</pub-id>
          <pub-id pub-id-type="medline">28344895</pub-id>
          <pub-id pub-id-type="pii">2537</pub-id>
          <pub-id pub-id-type="pmcid">PMC5361882</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Masud</surname>
              <given-names>MT</given-names>
            </name>
            <name name-style="western">
              <surname>Mamun</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>Thapa</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>DH</given-names>
            </name>
            <name name-style="western">
              <surname>Griffiths</surname>
              <given-names>MD</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>SH</given-names>
            </name>
          </person-group>
          <article-title>Unobtrusive monitoring of behavior and movement patterns to detect clinical depression severity level via smartphone</article-title>
          <source>J Biomed Inform</source>
          <year>2020</year>
          <volume>103</volume>
          <fpage>103371</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1532-0464(19)30291-6"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2019.103371</pub-id>
          <pub-id pub-id-type="medline">31935462</pub-id>
          <pub-id pub-id-type="pii">S1532-0464(19)30291-6</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Boukhechba</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Daros</surname>
              <given-names>AR</given-names>
            </name>
            <name name-style="western">
              <surname>Fua</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Chow</surname>
              <given-names>PI</given-names>
            </name>
            <name name-style="western">
              <surname>Teachman</surname>
              <given-names>BA</given-names>
            </name>
            <name name-style="western">
              <surname>Barnes</surname>
              <given-names>LE</given-names>
            </name>
          </person-group>
          <article-title>DemonicSalmon: monitoring mental health and social interactions of college students using smartphones</article-title>
          <source>Smart Health</source>
          <year>2018</year>
          <volume>9-10</volume>
          <fpage>192</fpage>
          <lpage>203</lpage>
          <pub-id pub-id-type="doi">10.1016/j.smhl.2018.07.005</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Chikersal</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Dutcher</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Sefidgar</surname>
              <given-names>YS</given-names>
            </name>
            <name name-style="western">
              <surname>Seo</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Tumminia</surname>
              <given-names>MJ</given-names>
            </name>
            <name name-style="western">
              <surname>Villalba</surname>
              <given-names>DK</given-names>
            </name>
            <name name-style="western">
              <surname>Cohen</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Creswell</surname>
              <given-names>KG</given-names>
            </name>
            <name name-style="western">
              <surname>Creswell</surname>
              <given-names>JD</given-names>
            </name>
            <name name-style="western">
              <surname>Doryab</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Nurius</surname>
              <given-names>PS</given-names>
            </name>
            <name name-style="western">
              <surname>Riskin</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Dey</surname>
              <given-names>AK</given-names>
            </name>
            <name name-style="western">
              <surname>Mankoff</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Leveraging collaborative-filtering for personalized behavior modeling</article-title>
          <source>Proc ACM Interact Mob Wearable Ubiquitous Technol</source>
          <year>2021</year>
          <volume>5</volume>
          <issue>1</issue>
          <fpage>1</fpage>
          <lpage>27</lpage>
          <pub-id pub-id-type="doi">10.1145/3448107</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chikersal</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Doryab</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Tumminia</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Villalba</surname>
              <given-names>DK</given-names>
            </name>
            <name name-style="western">
              <surname>Dutcher</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Cohen</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Creswell</surname>
              <given-names>KG</given-names>
            </name>
            <name name-style="western">
              <surname>Mankoff</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Creswell</surname>
              <given-names>JD</given-names>
            </name>
            <name name-style="western">
              <surname>Goel</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Dey</surname>
              <given-names>AK</given-names>
            </name>
          </person-group>
          <article-title>Detecting depression and predicting its onset using longitudinal symptoms captured by passive sensing</article-title>
          <source>ACM Trans Comput Hum Interact</source>
          <year>2021</year>
          <volume>28</volume>
          <issue>1</issue>
          <fpage>1</fpage>
          <lpage>41</lpage>
          <pub-id pub-id-type="doi">10.1145/3422821</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Nepal</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Huckins</surname>
              <given-names>JF</given-names>
            </name>
            <name name-style="western">
              <surname>Hernandez</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Vojdanovski</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Mack</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Plomp</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Pillai</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Obuchi</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Dasilva</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Murphy</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Hedlund</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Rogers</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Meyer</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Campbell</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>First-gen lens: assessing mental health of first-generation students across their first year at college using mobile sensing</article-title>
          <source>Proc ACM Interact Mob Wearable Ubiquitous Technol</source>
          <year>2022</year>
          <volume>6</volume>
          <issue>2</issue>
          <fpage>1</fpage>
          <lpage>32</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/36561350"/>
          </comment>
          <pub-id pub-id-type="doi">10.1145/3543194</pub-id>
          <pub-id pub-id-type="medline">36561350</pub-id>
          <pub-id pub-id-type="pii">95</pub-id>
          <pub-id pub-id-type="pmcid">PMC9770714</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Jakobsen</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Garcia-Ceja</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Riegler</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Stabell</surname>
              <given-names>LA</given-names>
            </name>
            <name name-style="western">
              <surname>Nordgreen</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Torresen</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Fasmer</surname>
              <given-names>OB</given-names>
            </name>
            <name name-style="western">
              <surname>Oedegaard</surname>
              <given-names>KJ</given-names>
            </name>
          </person-group>
          <article-title>Applying machine learning in motor activity time series of depressed bipolar and unipolar patients compared to healthy controls</article-title>
          <source>PLoS One</source>
          <year>2020</year>
          <volume>15</volume>
          <issue>8</issue>
          <fpage>e0231995</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dx.plos.org/10.1371/journal.pone.0231995"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pone.0231995</pub-id>
          <pub-id pub-id-type="medline">32833958</pub-id>
          <pub-id pub-id-type="pii">PONE-D-20-09443</pub-id>
          <pub-id pub-id-type="pmcid">PMC7446864</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mullick</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Radovic</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Shaaban</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Doryab</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Predicting depression in adolescents using mobile and wearable sensors: multimodal machine learning-based exploratory study</article-title>
          <source>JMIR Form Res</source>
          <year>2022</year>
          <volume>6</volume>
          <issue>6</issue>
          <fpage>e35807</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://formative.jmir.org/2022/6/e35807/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/35807</pub-id>
          <pub-id pub-id-type="medline">35749157</pub-id>
          <pub-id pub-id-type="pii">v6i6e35807</pub-id>
          <pub-id pub-id-type="pmcid">PMC9270714</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kroenke</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Spitzer</surname>
              <given-names>RL</given-names>
            </name>
            <name name-style="western">
              <surname>Williams</surname>
              <given-names>JBW</given-names>
            </name>
          </person-group>
          <article-title>The PHQ-9: validity of a brief depression severity measure</article-title>
          <source>J Gen Intern Med</source>
          <year>2001</year>
          <volume>16</volume>
          <issue>9</issue>
          <fpage>606</fpage>
          <lpage>613</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/11556941"/>
          </comment>
          <pub-id pub-id-type="doi">10.1046/j.1525-1497.2001.016009606.x</pub-id>
          <pub-id pub-id-type="medline">11556941</pub-id>
          <pub-id pub-id-type="pii">jgi01114</pub-id>
          <pub-id pub-id-type="pmcid">PMC1495268</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kroenke</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Spitzer</surname>
              <given-names>RL</given-names>
            </name>
            <name name-style="western">
              <surname>Williams</surname>
              <given-names>JBW</given-names>
            </name>
            <name name-style="western">
              <surname>Löwe</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>An ultra-brief screening scale for anxiety and depression: the PHQ–4</article-title>
          <source>Psychosomatics</source>
          <year>2009</year>
          <volume>50</volume>
          <issue>6</issue>
          <fpage>613</fpage>
          <lpage>621</lpage>
          <pub-id pub-id-type="doi">10.1016/s0033-3182(09)70864-3</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Müller</surname>
              <given-names>MJ</given-names>
            </name>
            <name name-style="western">
              <surname>Himmerich</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Kienzle</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Szegedi</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Differentiating moderate and severe depression using the Montgomery-Asberg depression rating scale (MADRS)</article-title>
          <source>J Affect Disord</source>
          <year>2003</year>
          <volume>77</volume>
          <issue>3</issue>
          <fpage>255</fpage>
          <lpage>260</lpage>
          <pub-id pub-id-type="doi">10.1016/s0165-0327(02)00120-9</pub-id>
          <pub-id pub-id-type="medline">14612225</pub-id>
          <pub-id pub-id-type="pii">S0165032702001209</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Beck</surname>
              <given-names>AT</given-names>
            </name>
            <name name-style="western">
              <surname>Steer</surname>
              <given-names>RA</given-names>
            </name>
            <name name-style="western">
              <surname>Ball</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Ranieri</surname>
              <given-names>W</given-names>
            </name>
          </person-group>
          <article-title>Comparison of Beck Depression Inventories -IA and -II in psychiatric outpatients</article-title>
          <source>J Pers Assess</source>
          <year>1996</year>
          <volume>67</volume>
          <issue>3</issue>
          <fpage>588</fpage>
          <lpage>597</lpage>
          <pub-id pub-id-type="doi">10.1207/s15327752jpa6703_13</pub-id>
          <pub-id pub-id-type="medline">8991972</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Baryshnikov</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Aledavood</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Rosenström</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Heikkilä</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Darst</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Riihimäki</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Saleva</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Ekelund</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Isometsä</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>Relationship between daily rated depression symptom severity and the retrospective self-report on PHQ-9: a prospective ecological momentary assessment study on 80 psychiatric outpatients</article-title>
          <source>J Affect Disord</source>
          <year>2023</year>
          <volume>324</volume>
          <fpage>170</fpage>
          <lpage>174</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S0165-0327(22)01490-2"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jad.2022.12.127</pub-id>
          <pub-id pub-id-type="medline">36586594</pub-id>
          <pub-id pub-id-type="pii">S0165-0327(22)01490-2</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Aledavood</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Luong</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Baryshnikov</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Darst</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Heikkilä</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Holmén</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Ikäheimonen</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Mobile monitoring of mood (MoMo-Mood): a multimodal digital phenotyping study with major depressive patients and healthy controls</article-title>
          <source>JMIR Preprints</source>
          <comment>Preprint posted online on June 26, 2024</comment>
          <pub-id pub-id-type="doi">10.2196/preprints.63622</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sheehan</surname>
              <given-names>DV</given-names>
            </name>
            <name name-style="western">
              <surname>Lecrubier</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Sheehan</surname>
              <given-names>KH</given-names>
            </name>
            <name name-style="western">
              <surname>Amorim</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Janavs</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Weiller</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Hergueta</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Baker</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Dunbar</surname>
              <given-names>GC</given-names>
            </name>
          </person-group>
          <article-title>The Mini-International Neuropsychiatric Interview (M.I.N.I.): the development and validation of a structured diagnostic psychiatric interview for DSM-IV and ICD-10</article-title>
          <source>J Clin Psychiatry</source>
          <year>1998</year>
          <volume>59</volume>
          <issue>Suppl 20</issue>
          <fpage>22</fpage>
          <lpage>33</lpage>
          <comment>quiz 34-57</comment>
          <pub-id pub-id-type="medline">9881538</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>First</surname>
              <given-names>MB</given-names>
            </name>
            <name name-style="western">
              <surname>Benjamin</surname>
              <given-names>LS</given-names>
            </name>
            <name name-style="western">
              <surname>Gibbon</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Spitzer</surname>
              <given-names>RL</given-names>
            </name>
            <name name-style="western">
              <surname>Williams</surname>
              <given-names>JB</given-names>
            </name>
          </person-group>
          <source>Structured Clinical Interview for DSM-IV Axis II Personality Disorders</source>
          <year>1997</year>
          <publisher-loc>Washington, DC</publisher-loc>
          <publisher-name>American Psychiatric Press</publisher-name>
          <fpage>1919</fpage>
          <lpage>1920</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Aledavood</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Hoyos</surname>
              <given-names>AMT</given-names>
            </name>
            <name name-style="western">
              <surname>Alakörkkö</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Kaski</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Saramäki</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Isometsä</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Darst</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Data collection for mental health studies through digital platforms: requirements and design of a prototype</article-title>
          <source>JMIR Res Protoc</source>
          <year>2017</year>
          <volume>6</volume>
          <issue>6</issue>
          <fpage>e110</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.researchprotocols.org/2017/6/e110/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/resprot.6919</pub-id>
          <pub-id pub-id-type="medline">28600276</pub-id>
          <pub-id pub-id-type="pii">v6i6e110</pub-id>
          <pub-id pub-id-type="pmcid">PMC5483244</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ikäheimonen</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Triana</surname>
              <given-names>AM</given-names>
            </name>
            <name name-style="western">
              <surname>Luong</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Ziaei</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Rantaharju</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Darst</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Aledavood</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>Niimpy: a toolbox for behavioral data analysis</article-title>
          <source>SoftwareX</source>
          <year>2023</year>
          <volume>23</volume>
          <fpage>101472</fpage>
          <pub-id pub-id-type="doi">10.1016/j.softx.2023.101472</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Berger</surname>
              <given-names>VW</given-names>
            </name>
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Kolmogorov-Smirnov test: overview</article-title>
          <source>Wiley StatsRef: Statistics Reference Online</source>
          <year>2014</year>
          <publisher-loc>New York, NY</publisher-loc>
          <publisher-name>John Wiley &#38; Sons, Ltd</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Benjamini</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Hochberg</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Controlling the false discovery rate: a practical and powerful approach to multiple testing</article-title>
          <source>J R Stat Soc Series B Stat Methodol</source>
          <year>1995</year>
          <volume>57</volume>
          <issue>1</issue>
          <fpage>289</fpage>
          <lpage>300</lpage>
          <pub-id pub-id-type="doi">10.1111/j.2517-6161.1995.tb02031.x</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pedregosa</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Varoquaux</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Gramfort</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Scikit-learn: machine learning in Python</article-title>
          <source>J Mach Learn Res</source>
          <year>2011</year>
          <volume>12</volume>
          <fpage>2825</fpage>
          <lpage>2830</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmlr.org/papers/volume12/pedregosa11a/pedregosa11a.pdf"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Guestrin</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>XGBoost: a scalable tree boosting system</article-title>
          <year>2016</year>
          <conf-name>22nd ACM SIGKDD International Conference on Knowledge Discovery and Data Mining. KDD '16. Association for Computing Machinery</conf-name>
          <conf-date>August 13, 2016</conf-date>
          <conf-loc>San Francisco, CA</conf-loc>
          <fpage>785</fpage>
          <lpage>794</lpage>
          <pub-id pub-id-type="doi">10.1145/2939672.2939785</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Akiba</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Sano</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Yanase</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Ohta</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Koyama</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Optuna: a next-generation hyperparameter optimization framework</article-title>
          <year>2019</year>
          <conf-name>25th ACM SIGKDD International Conference on Knowledge Discovery &#38; Data Mining</conf-name>
          <conf-date>July 25, 2019</conf-date>
          <conf-loc>Anchorage, AK</conf-loc>
          <fpage>2623</fpage>
          <lpage>2631</lpage>
          <pub-id pub-id-type="doi">10.1145/3292500.3330701</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lemaître</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Nogueira</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Aridas</surname>
              <given-names>CK</given-names>
            </name>
          </person-group>
          <article-title>Imbalanced-learn: a Python toolbox to tackle the curse of imbalanced datasets in machine learning</article-title>
          <source>J Mach Learn Res</source>
          <year>2017</year>
          <volume>18</volume>
          <issue>17</issue>
          <fpage>1</fpage>
          <lpage>5</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://jmlr.org/papers/v18/16-365.html"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref34">
        <label>34</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lundberg</surname>
              <given-names>SM</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>SI</given-names>
            </name>
          </person-group>
          <article-title>A unified approach to interpreting model predictions</article-title>
          <source>Adv Neural Inf Process Syst</source>
          <year>2017</year>
          <volume>30</volume>
        </nlm-citation>
      </ref>
      <ref id="ref35">
        <label>35</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chawla</surname>
              <given-names>NV</given-names>
            </name>
            <name name-style="western">
              <surname>Bowyer</surname>
              <given-names>KW</given-names>
            </name>
            <name name-style="western">
              <surname>Hall</surname>
              <given-names>LO</given-names>
            </name>
            <name name-style="western">
              <surname>Kegelmeyer</surname>
              <given-names>WP</given-names>
            </name>
          </person-group>
          <article-title>SMOTE: synthetic minority over-sampling technique</article-title>
          <source>J Artif Intell Res</source>
          <year>2002</year>
          <volume>16</volume>
          <fpage>321</fpage>
          <lpage>357</lpage>
          <pub-id pub-id-type="doi">10.1613/jair.953</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref36">
        <label>36</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Benoit</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Onyeaka</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Keshavan</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Torous</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Systematic review of digital phenotyping and machine learning in psychosis spectrum illnesses</article-title>
          <source>Harv Rev Psychiatry</source>
          <year>2020</year>
          <volume>28</volume>
          <issue>5</issue>
          <fpage>296</fpage>
          <lpage>304</lpage>
          <pub-id pub-id-type="doi">10.1097/hrp.0000000000000268</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref37">
        <label>37</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Jacobson</surname>
              <given-names>NC</given-names>
            </name>
            <name name-style="western">
              <surname>Summers</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Wilhelm</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Digital biomarkers of social anxiety severity: digital phenotyping using passive smartphone sensors</article-title>
          <source>J Med Internet Res</source>
          <year>2020</year>
          <volume>22</volume>
          <issue>5</issue>
          <fpage>e16875</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2020/5/e16875/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/16875</pub-id>
          <pub-id pub-id-type="medline">32348284</pub-id>
          <pub-id pub-id-type="pii">v22i5e16875</pub-id>
          <pub-id pub-id-type="pmcid">PMC7293055</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref38">
        <label>38</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hardin</surname>
              <given-names>JW</given-names>
            </name>
            <name name-style="western">
              <surname>Hilbe</surname>
              <given-names>JM</given-names>
            </name>
          </person-group>
          <source>Generalized Estimating Equations: GEE. 2nd ed</source>
          <year>2013</year>
          <publisher-loc>New York, NY</publisher-loc>
          <publisher-name>Chapman &#38; Hall/CRC</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref39">
        <label>39</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Palmius</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Saunders</surname>
              <given-names>KEA</given-names>
            </name>
            <name name-style="western">
              <surname>Carr</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Geddes</surname>
              <given-names>JR</given-names>
            </name>
            <name name-style="western">
              <surname>Goodwin</surname>
              <given-names>GM</given-names>
            </name>
            <name name-style="western">
              <surname>de Vos</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Group-personalized regression models for predicting mental health scores from objective mobile phone data streams: observational study</article-title>
          <source>J Med Internet Res</source>
          <year>2018</year>
          <volume>20</volume>
          <issue>10</issue>
          <fpage>e10194</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2018/10/e10194/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/10194</pub-id>
          <pub-id pub-id-type="medline">30348626</pub-id>
          <pub-id pub-id-type="pii">v20i10e10194</pub-id>
          <pub-id pub-id-type="pmcid">PMC6231780</pub-id>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
