<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article article-type="research-article" dtd-version="2.0" xmlns:xlink="http://www.w3.org/1999/xlink">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JFR</journal-id>
      <journal-id journal-id-type="nlm-ta">JMIR Form Res</journal-id>
      <journal-title>JMIR Formative Research</journal-title>
      <issn pub-type="epub">2561-326X</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v7i1e28848</article-id>
      <article-id pub-id-type="pmid">37561568</article-id>
      <article-id pub-id-type="doi">10.2196/28848</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>A Fast and Minimal System to Identify Depression Using Smartphones: Explainable Machine Learning–Based Approach</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Mavragani</surname>
            <given-names>Amaryllis</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Mullick</surname>
            <given-names>Tahsin</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Lee</surname>
            <given-names>Uichin</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author" corresp="yes">
          <name name-style="western">
            <surname>Ahmed</surname>
            <given-names>Md Sabbir</given-names>
          </name>
          <degrees>BSc</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <address>
            <institution>Design Inclusion and Access Lab</institution>
            <institution>North South University</institution>
            <addr-line>Plot #15, Block #B, Bashundhara</addr-line>
            <addr-line>Dhaka, 1229</addr-line>
            <country>Bangladesh</country>
            <phone>880 1781920068</phone>
            <email>msg2sabbir@gmail.com</email>
          </address>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-8668-0120</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author">
          <name name-style="western">
            <surname>Ahmed</surname>
            <given-names>Nova</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-7715-1742</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>Design Inclusion and Access Lab</institution>
        <institution>North South University</institution>
        <addr-line>Dhaka</addr-line>
        <country>Bangladesh</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Md Sabbir Ahmed <email>msg2sabbir@gmail.com</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <year>2023</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>10</day>
        <month>8</month>
        <year>2023</year>
      </pub-date>
      <volume>7</volume>
      <elocation-id>e28848</elocation-id>
      <history>
        <date date-type="received">
          <day>26</day>
          <month>12</month>
          <year>2022</year>
        </date>
        <date date-type="rev-request">
          <day>27</day>
          <month>2</month>
          <year>2023</year>
        </date>
        <date date-type="rev-recd">
          <day>17</day>
          <month>3</month>
          <year>2023</year>
        </date>
        <date date-type="accepted">
          <day>19</day>
          <month>3</month>
          <year>2023</year>
        </date>
      </history>
      <copyright-statement>©Md Sabbir Ahmed, Nova Ahmed. Originally published in JMIR Formative Research (https://formative.jmir.org), 10.08.2023.</copyright-statement>
      <copyright-year>2023</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Formative Research, is properly cited. The complete bibliographic information, a link to the original publication on https://formative.jmir.org, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://formative.jmir.org/2023/1/e28848" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>Existing robust, pervasive device-based systems developed in recent years to detect depression require data collected over a long period and may not be effective in cases where early detection is crucial. Additionally, due to the requirement of running systems in the background for prolonged periods, existing systems can be resource inefficient. As a result, these systems can be infeasible in low-resource settings.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>Our main objective was to develop a minimalistic system to identify depression using data retrieved in the fastest possible time. Another objective was to explain the machine learning (ML) models that were best for identifying depression.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>We developed a fast tool that retrieves the past 7 days’ app usage data in 1 second (mean 0.31, SD 1.10 seconds). A total of 100 students from Bangladesh participated in our study, and our tool collected their app usage data and responses to the Patient Health Questionnaire-9. To identify depressed and nondepressed students, we developed a diverse set of ML models: linear, tree-based, and neural network–based models. We selected important features using the stable approach, along with 3 main types of feature selection (FS) approaches: filter, wrapper, and embedded methods. We developed and validated the models using the nested cross-validation method. Additionally, we explained the best ML models through the Shapley additive explanations (SHAP) method.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>Leveraging only the app usage data retrieved in 1 second, our light gradient boosting machine model used the important features selected by the stable FS approach and correctly identified 82.4% (n=42) of depressed students (precision=75%, F1-score=78.5%). Moreover, after comprehensive exploration, we presented a parsimonious stacking model where around 5 features selected by the all-relevant FS approach Boruta were used in each iteration of validation and showed a maximum precision of 77.4% (balanced accuracy=77.9%). Feature importance analysis suggested app usage behavioral markers containing diurnal usage patterns as being more important than aggregated data-based markers. In addition, a SHAP analysis of our best models presented behavioral markers that were related to depression. For instance, students who were not depressed spent more time on education apps on weekdays, whereas those who were depressed used a higher number of photo and video apps and also had a higher deviation in using photo and video apps over the morning, afternoon, evening, and night time periods of the weekend.</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>Due to our system’s fast and minimalistic nature, it may make a worthwhile contribution to identifying depression in underdeveloped and developing regions. In addition, our detailed discussion about the implication of our findings can facilitate the development of less resource-intensive systems to better understand students who are depressed and take steps for intervention.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>smartphone</kwd>
        <kwd>depression</kwd>
        <kwd>explainable machine learning</kwd>
        <kwd>low-resource settings</kwd>
        <kwd>real-time system</kwd>
        <kwd>students</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <sec>
        <title>Background</title>
        <p>Depression is found in around 280 million people worldwide [<xref ref-type="bibr" rid="ref1">1</xref>]. Although it is a common mental disorder, 80% of its burden is found in people from low- and middle-income countries (LMICs) [<xref ref-type="bibr" rid="ref2">2</xref>]. It is the most prevalent mental disorder among adults in Bangladesh [<xref ref-type="bibr" rid="ref3">3</xref>]. Moreover, the depression rate among Bangladeshi university students is higher than in other groups [<xref ref-type="bibr" rid="ref4">4</xref>]. It is linked with physical illness [<xref ref-type="bibr" rid="ref5">5</xref>] and also with psychological problems, such as anxiety disorder [<xref ref-type="bibr" rid="ref6">6</xref>]. However, 75% of people living in LMICs do not receive any treatment for mental disorders [<xref ref-type="bibr" rid="ref7">7</xref>]. In this case, social stigma is a barrier [<xref ref-type="bibr" rid="ref7">7</xref>], which highlights the need for an unobtrusive way to identify depression. In contrast, there are people with psychological problems who seek support from primary care providers (PCPs). However, in more than 50% of cases, PCPs fail to recognize depression [<xref ref-type="bibr" rid="ref8">8</xref>,<xref ref-type="bibr" rid="ref9">9</xref>]. Failing to identify depressed individuals at an early stage may have devastating consequences as this increases the risk of suicide [<xref ref-type="bibr" rid="ref10">10</xref>]. Recent research has shown that 60% of people who committed suicide struggled with major depression [<xref ref-type="bibr" rid="ref11">11</xref>]. Therefore, there is a need to identify depression faster, which may make a significant contribution to mitigating depression through early intervention [<xref ref-type="bibr" rid="ref12">12</xref>].</p>
        <p>With the advent of computational models, extensive research has been conducted on the development of machine learning (ML) models for depression identification. There are subjective data–based studies in which, to develop models, researchers used demographic characteristics [<xref ref-type="bibr" rid="ref13">13</xref>-<xref ref-type="bibr" rid="ref16">16</xref>], information about the family [<xref ref-type="bibr" rid="ref14">14</xref>,<xref ref-type="bibr" rid="ref15">15</xref>], lifestyle [<xref ref-type="bibr" rid="ref15">15</xref>], mental health [<xref ref-type="bibr" rid="ref13">13</xref>-<xref ref-type="bibr" rid="ref17">17</xref>], etc, and their findings demonstrated good accuracy of the models. For instance, an ML model correctly identified 64% of depressed participants [<xref ref-type="bibr" rid="ref14">14</xref>]. However, the main limitation of subjective studies is the use of self-reported data-based features for models, which makes the process obtrusive. Additionally, due to using features such as gender [<xref ref-type="bibr" rid="ref14">14</xref>,<xref ref-type="bibr" rid="ref15">15</xref>], which remains constant, the models may not be able to capture changes in depression over time, which in turn may not work for remote monitoring and faster diagnosis. Furthermore, since manual input is required, these approaches can have fewer implications in resource-constrained clinical settings.</p>
        <p>To overcome these problems, researchers have explored pervasive devices leveraging behavioral data to improve mental health. Using Fitbit- and smartphone-sensed data, researchers [<xref ref-type="bibr" rid="ref18">18</xref>] explored the behavioral patterns linked with loneliness and identified students with loneliness with an accuracy of 80.2%. A previous study [<xref ref-type="bibr" rid="ref19">19</xref>] constructed 2 different data sets with behavioral data for over 100 days and predicted depression with an <italic>F</italic><sub>1</sub>-score of over 80%. Another study [<xref ref-type="bibr" rid="ref20">20</xref>] presented a personal behavioral model to predict depression that correctly identified over 80% of depressed students using data from 10 and 16 weeks. Although wearable technology shows promising performance, these systems need to run for the whole period of data collection (eg, for over 100 days [<xref ref-type="bibr" rid="ref19">19</xref>,<xref ref-type="bibr" rid="ref21">21</xref>]). Thus, the need for a long data collection period may not facilitate early intervention. In addition, the high price of wearable devices can make them unaffordable for people of low income [<xref ref-type="bibr" rid="ref22">22</xref>], which in turn may make the approaches infeasible for low-resource settings, where usage of wearable devices, such as Fitbit, is low.</p>
        <p>Smartphones have become affordable [<xref ref-type="bibr" rid="ref23">23</xref>] and are available to the majority of adults in emerging and developing countries [<xref ref-type="bibr" rid="ref24">24</xref>]. Smartphone usage has a significant relationship with depression [<xref ref-type="bibr" rid="ref25">25</xref>-<xref ref-type="bibr" rid="ref28">28</xref>] and loneliness [<xref ref-type="bibr" rid="ref29">29</xref>-<xref ref-type="bibr" rid="ref31">31</xref>]. Moreover, there remain significantly different use patterns between depressed and nondepressed individuals in terms of communication [<xref ref-type="bibr" rid="ref25">25</xref>] and social media [<xref ref-type="bibr" rid="ref26">26</xref>] app categories, which indicates that app usage data can be important predictors for identifying depression. Based on only phone usage data, an ML model in previous research [<xref ref-type="bibr" rid="ref21">21</xref>] showed a sensitivity of 45% in predicting postsemester depression, whereas another study [<xref ref-type="bibr" rid="ref27">27</xref>] achieved a sensitivity of 55.7% in identifying participants with depressive symptoms. To develop ML models, some studies have used sensed data [<xref ref-type="bibr" rid="ref19">19</xref>,<xref ref-type="bibr" rid="ref21">21</xref>,<xref ref-type="bibr" rid="ref27">27</xref>,<xref ref-type="bibr" rid="ref32">32</xref>,<xref ref-type="bibr" rid="ref33">33</xref>], along with smartphone usage data. In other studies [<xref ref-type="bibr" rid="ref34">34</xref>-<xref ref-type="bibr" rid="ref36">36</xref>], researchers have used smartphone-sensed data incorporating self-reported data to extract features for ML models. Studies have also relied solely on smartphone-sensed location data [<xref ref-type="bibr" rid="ref37">37</xref>-<xref ref-type="bibr" rid="ref40">40</xref>]. 
However, like studies based on wearables, in existing smartphone data–based studies, systems (ie, apps) need to run in the background for the whole data collection period, which may cause several problems. For example, due to running in the background for a long time (eg, 12 weeks [<xref ref-type="bibr" rid="ref28">28</xref>], 16 weeks [<xref ref-type="bibr" rid="ref19">19</xref>-<xref ref-type="bibr" rid="ref21">21</xref>]) as well as sensors consuming too much battery power [<xref ref-type="bibr" rid="ref41">41</xref>], these smartphone-sensed data-based systems may not be energy efficient, which can be a barrier to obtaining quality data from low-resource settings. Although some studies (eg, [<xref ref-type="bibr" rid="ref40">40</xref>]) were conducted to develop energy-efficient systems for depression identification, the systems may still not facilitate early intervention since a long data collection period is required. In addition, due to having a system tracking data continuously from the phone, users may feel reluctant, which may introduce research reactivity problems (eg, the Hawthorne effect [<xref ref-type="bibr" rid="ref42">42</xref>]), causing biases in app usage data.</p>
      </sec>
      <sec>
        <title>Objective</title>
        <p>To overcome the aforementioned limitations, such as the high price of wearables, the need to run the system in the background, and the need for long-term data, our primary objective was to develop a system, named <italic>Mon Majhi</italic> (in English, <italic>Mind Navigator</italic>), that can identify depression unobtrusively following a minimalistic approach and in real time. Another objective was to explain the best ML models that can facilitate a better understanding of depressed students among mental health care professionals and help them take steps in intervention.</p>
      </sec>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>A Tool to Retrieve App Usage Data Instantly</title>
        <sec>
          <title>Development of a Data Collection Tool</title>
          <p>Self-reported app usage data do not represent actual behavior [<xref ref-type="bibr" rid="ref43">43</xref>]. In reporting app usage, users overestimate or underestimate data, which varies by type [<xref ref-type="bibr" rid="ref44">44</xref>]. For instance, Facebook usage duration is overestimated, while the frequency of launching Facebook is underestimated [<xref ref-type="bibr" rid="ref44">44</xref>]. Therefore, to obtain the exact app usage behavioral data of users, we developed an app [<xref ref-type="bibr" rid="ref45">45</xref>] for the Android platform, which is used by 95.9% of smartphone users in Bangladesh [<xref ref-type="bibr" rid="ref46">46</xref>]. To instantly (see the <italic>Time Required to Retrieve App Usage Data</italic> section) obtain raw app usage data (foreground and background events), we used some functions of the Java class <italic>UsageStatsManager</italic>. However, app usage events are kept for a few days in Android [<xref ref-type="bibr" rid="ref47">47</xref>], and thus, our tool can instantly retrieve app usage data for the previous 7 days, while aggregated app usage data (eg, total time spent on an app over 14 days) for longer than 7 days can be accessed by a Java application programming interface (API). Although the list of used apps can be accurately retrieved through the Java function <italic>queryUsageStats (intervalType, beginTime, endTime)</italic>, the usage duration data when the data collection period exceeded 7 days were not accurate, as we found by testing Mon Majhi in multiple ways. We tested the app by setting different values (eg, INTERVAL_WEEKLY, INTERVAL_MONTHLY) of the parameter <italic>intervalType</italic> as well as by properly changing the values of other parameters. By experimenting through the trial-and-error method, we found inaccuracy in the app usage duration when compared to the manually calculated app usage duration. 
In addition, while testing other phones, the users of the phones marked the data as inaccurate based on their best guess. Furthermore, except for usage duration, other data, such as frequency of launching, as well as raw data cannot be retrieved through the API, which hinders the extraction of more informative features, as presented in the <italic>Pipeline of ML Models</italic> section. Therefore, in this study, we used 7 days’ app usage data as we found it to be accurate.</p>
          <p>Once Mon Majhi (Figure A1 of <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>) is installed, with the user’s consent, the app retrieves the past 7 days’ app usage data. We chose to use Google Firebase as a database since it is secure and easy to integrate with mobile apps. We released the app [<xref ref-type="bibr" rid="ref45">45</xref>] on the Google Play Store; since this platform is known to Android users, participants may feel more comfortable installing apps from there.</p>
        </sec>
        <sec>
          <title>Testing the Data Collection Tool</title>
          <p>To check whether our app can accurately retrieve app usage data, we tested the app using the following 3 steps. We found that in each step, our app can accurately calculate the past 7 days’ app usage data, such as duration and frequency of launch.</p>
          <list list-type="bullet">
            <list-item>
              <p>Step 1: We manually calculated the core app usage data (duration and frequency of launch). We compared the manually calculated data with the app usage data retrieved by our data collection tool.</p>
            </list-item>
            <list-item>
              <p>Step 2: We compared the data retrieved by our app with the data from the available apps [<xref ref-type="bibr" rid="ref48">48</xref>,<xref ref-type="bibr" rid="ref49">49</xref>] in Google Play that are required to be run in the background to calculate app usage data.</p>
            </list-item>
            <list-item>
              <p>Step 3: Smartphones function differently depending on various conditions, including the manufacturer and smartphone model. To determine the generalizable performance of our app, we tested it on 9 different smartphones.</p>
            </list-item>
          </list>
        </sec>
        <sec>
          <title>Time Required to Retrieve App Usage Data</title>
          <p>To estimate the time required by our app to retrieve the past 7 days’ app usage data, we calculated the time difference between the start and the end of programs that were written to retrieve app usage data. To estimate a generalizable required time, we tested our app on 20 smartphones of 19 different models, with 8 different versions of Android operating systems and 7 different smartphone manufacturers. Our app retrieved the past 7 days’ app usage data 500 times from each of those phones. In total, it calculated the required time 10,000 (500×20) times. On average, it retrieved 7447.61 (SD 4986.62, median 6641, minimum=306, maximum=24,297) foreground and background app usage events (<xref rid="figure1" ref-type="fig">Figure 1</xref>a). The average time required was 307.94 ms (SD 1103.91, median 211, minimum=13, maximum=61,087 ms; <xref rid="figure1" ref-type="fig">Figure 1</xref>b). We found that among the 10,000 instances, only 97 had a retrieval time above 1 second (Table A1 of <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>).</p>
          <p>In retrieving data, there may be some factors affecting the time required. We explored the possible factors by performing a correlation of the required time with the 20 phones’ API level and the number of retrieved events. We did not find any significant correlation between the Android API level and the time required (<italic>r</italic><sub>s</sub>=0.18, <italic>P</italic>=.44; <xref rid="figure1" ref-type="fig">Figure 1</xref>c). In exploring the relationship with the number of events, we used the average number of events and the average time required for each phone; within each phone, there was almost no variation in the number of retrieved events (<xref rid="figure1" ref-type="fig">Figure 1</xref>a). We found the number of events had a significant positive relationship with the time required to retrieve data (<italic>r</italic><sub>s</sub>=0.56, <italic>P</italic>=.009; <xref rid="figure1" ref-type="fig">Figure 1</xref>d). Next, to estimate the plausible number of events in a student’s phone, we used the data set that was constructed for this research. On average, there were 8174.04 events (SD 4972.50) retrieved from each of the 100 students’ phones. Of the 10,000 times data were retrieved, the number of retrieved app usage events was more than 8000 in 4500 instances. To retrieve this large number of events, our app needed an average of 430.31 ms (SD 1596.46). This reveals that, on average, our app can retrieve the past 7 days’ app usage data in less than 1 second.</p>
          <fig id="figure1" position="float">
            <label>Figure 1</label>
            <caption>
              <p>Performance of Mon Majhi in retrieving data. (a) Number of retrieved foreground and background events, (b) time required to retrieve data. Kernel density estimation shows the relationship of time with (c) API level and (d) number of foreground and background events. API: application programming interface.</p>
            </caption>
            <graphic xlink:href="formative_v7i1e28848_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
        </sec>
      </sec>
      <sec>
        <title>Ethical Considerations</title>
        <p>The study was approved by the Center for Research &amp; Development at Eastern University. In our app, there was a consent form where we mentioned study details, and all participants provided their consent before their voluntary data donation. Except for the app usage data, our app does not collect any other data, such as messages. All data were kept anonymous, and access to the database was limited to the researchers of this project only.</p>
        <p>The Center for Research &amp; Development (CRD) at Eastern University is the only section at Eastern University that deals with research, and it takes care of everything needed for research. There is no other separate section, such as an ethics board, to review research.</p>
      </sec>
      <sec>
        <title>Data Collection and Participants’ Demographic Characteristics</title>
        <p>Considering the high prevalence of depression (ie, 69.5% [<xref ref-type="bibr" rid="ref50">50</xref>]) among university students in Bangladesh as well as their high adoption of smartphones (86.6% use smartphones [<xref ref-type="bibr" rid="ref51">51</xref>]), we decided to use them as samples in this study. We collected data from July to October 2020 and reached participants through the snowball sampling method. Several participants were recruited through university teachers, and others were recruited through researchers’ close connections. To ensure the participants’ comfort, we arranged a discussion session, where we described the study objective, types of data collected, etc. Since the study was conducted during the COVID-19 pandemic, we conducted the meeting mostly using virtual platforms based on participants’ preferences and availability. To provide data, participants installed the app via Google Play. In total, 100 students from 12 different institutes of higher education and 7 different departments, including arts, law, medical science, and engineering faculties, participated.</p>
        <p>The participants were from 36 districts and 7 divisions, which covered 56.3% of districts and 87.5% of divisions in Bangladesh (<xref rid="figure2" ref-type="fig">Figure 2</xref>a). There were 87 (87%) male participants and 13 (13%) female participants (<xref rid="figure2" ref-type="fig">Figure 2</xref>b). The participants’ age varied from 19 to 30 years, and most participants’ age was below 25 years (<xref rid="figure2" ref-type="fig">Figure 2</xref>c). Although a few participants had a family income of more than 100,000 Bangladeshi Taka (BDT) (US $942.32), most participants reported a family income of up to BDT 50,000 (US $471.16; <xref rid="figure2" ref-type="fig">Figure 2</xref>d).</p>
        <fig id="figure2" position="float">
          <label>Figure 2</label>
          <caption>
            <p>Participants’ demographic characteristics. (a) Pushpins present the location of districts, and bold text presents the division name. Participants’ (b) gender, (c) age, and (d) monthly family income. BDT: Bangladeshi Taka.</p>
          </caption>
          <graphic xlink:href="formative_v7i1e28848_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Categorization of Depressed and Nondepressed Individuals</title>
        <p>To assess depression among participants, different versions of the clinically validated Patient Health Questionnaire have been widely used [<xref ref-type="bibr" rid="ref25">25</xref>,<xref ref-type="bibr" rid="ref27">27</xref>,<xref ref-type="bibr" rid="ref28">28</xref>,<xref ref-type="bibr" rid="ref32">32</xref>,<xref ref-type="bibr" rid="ref33">33</xref>,<xref ref-type="bibr" rid="ref40">40</xref>,<xref ref-type="bibr" rid="ref52">52</xref>]. We used the Patient Health Questionnaire-9 (PHQ-9) [<xref ref-type="bibr" rid="ref53">53</xref>] in this study. In our app, the scale was available in English and in the native language Bengali (details about scale translation are available in section B of <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). The PHQ-9 contains 9 items. Based on each participant’s experiences in the past 14 days, they responded to each item using 1 of 4 options: not at all (0), several days (1), more than half of the days (2), and nearly every day (3). A PHQ-9 score of 10 or more showed a sensitivity and specificity of 88% for measuring major depression [<xref ref-type="bibr" rid="ref53">53</xref>]. Therefore, following previous studies [<xref ref-type="bibr" rid="ref25">25</xref>,<xref ref-type="bibr" rid="ref26">26</xref>,<xref ref-type="bibr" rid="ref28">28</xref>,<xref ref-type="bibr" rid="ref53">53</xref>], we grouped participants who had a PHQ-9 score of at least 10 into the depressed group and those with a PHQ-9 score of &lt;10 into the nondepressed group.</p>
      </sec>
      <sec>
        <title>Pipeline of ML Models</title>
        <sec>
          <title>Feature Extraction</title>
          <p>From the 100 students’ smartphones, our app retrieved 817,404 foreground and background events carried out in 1129 unique apps. The mean number of retrieved events from each phone was 8174.04 (SD 4972.53; median 7849; minimum=70, maximum=29,113). Using the retrieved data on foreground and background events, we extracted the frequency of launching apps, usage duration, and the following behavioral markers to use as features in the ML models: number of used unique apps, diurnal usage, app usage sessions, entropy, Hamming distance, data of app categories, and number of extracted features.</p>
        </sec>
        <sec>
          <title>Number of Unique Apps Used</title>
          <p>To count the number of unique apps used, we counted the number of app package names. The main motivation for using package names instead of app names was that among the 1129 apps (details are available in the <italic>Usage Data of App Categories</italic> section), 127 (11.2%) had duplicate names. For example, among the 8 apps in the Weather category, 7 (87.5%) app names were “Weather” and 1 (12.5%) app was named “Windy.” However, each app’s package name was unique.</p>
        </sec>
        <sec>
          <title>Diurnal Usage Data</title>
          <p>The depressed and nondepressed groups had significantly different diurnal usage patterns [<xref ref-type="bibr" rid="ref25">25</xref>,<xref ref-type="bibr" rid="ref26">26</xref>]. Hence, we divided a day into 4 equal periods following previous studies [<xref ref-type="bibr" rid="ref25">25</xref>,<xref ref-type="bibr" rid="ref26">26</xref>]. During the calculation of app usage data, we found foreground and background events of several apps that occurred in different periods, and we added the duration in the respective period through the use of a delimiter. For example, if an app is opened at 11:30 AM (morning) but closed at 12:20 PM (afternoon), then by setting 12:00 PM (noon) as a delimiter, we added 30 minutes to the morning period and 20 minutes to the afternoon period. Moreover, following a previous study [<xref ref-type="bibr" rid="ref54">54</xref>], in such cases, we counted the frequency of launch in the time range (eg, morning in this example) during which the app was opened:</p>
          <list list-type="bullet">
            <list-item>
              <p>Night: 12:01 AM to 06:00 AM</p>
            </list-item>
            <list-item>
              <p>Morning: 06:01 AM to 12:00 PM</p>
            </list-item>
            <list-item>
              <p>Afternoon: 12:01 PM to 06:00 PM</p>
            </list-item>
            <list-item>
              <p>Evening: 06:01 PM to 12:00 AM</p>
            </list-item>
          </list>
        </sec>
        <sec>
          <title>App Usage Sessions</title>
          <p>The Java function we used to retrieve the past 7 days’ app usage data does not provide the phone lock and unlock data (eg, the time when the phone was locked or unlocked), which makes it difficult to identify a session. Hence, we followed previous studies to define a session. Wang and Mark [<xref ref-type="bibr" rid="ref55">55</xref>] used the median break length of 40 seconds for grouping visits to Facebook into a single session. Other studies [<xref ref-type="bibr" rid="ref56">56</xref>,<xref ref-type="bibr" rid="ref57">57</xref>] have used a threshold of 60 seconds to identify a session of Facebook use. A threshold of 30 seconds has also been used to define the sequence of app usage into a single session [<xref ref-type="bibr" rid="ref58">58</xref>-<xref ref-type="bibr" rid="ref60">60</xref>]. However, using 30 seconds can identify sessions with less accuracy [<xref ref-type="bibr" rid="ref61">61</xref>]. Instead, van Berkel et al [<xref ref-type="bibr" rid="ref61">61</xref>] suggested using a threshold of 45 seconds, which was found to be more accurate. Therefore, in our study, we grouped app usage into a single session if there was no more than a 45-second gap between the last used app and the newly opened app. After that, depending on the time spent in each session, we defined 3 different types of sessions following previous studies [<xref ref-type="bibr" rid="ref62">62</xref>,<xref ref-type="bibr" rid="ref63">63</xref>]:</p>
          <list list-type="bullet">
            <list-item>
              <p>Microsession: A session was defined as a microsession if a participant spent a maximum of 15 seconds on an app [<xref ref-type="bibr" rid="ref63">63</xref>].</p>
            </list-item>
            <list-item>
              <p>Review session: A session was defined as a review session if a participant interacted with an app for up to 60 seconds [<xref ref-type="bibr" rid="ref62">62</xref>]. However, due to the concept of microuse, we counted a session as a review session if a participant was found to spend between 15 seconds and 60 seconds on an app.</p>
            </list-item>
            <list-item>
              <p>Engage session: Following Banovic et al [<xref ref-type="bibr" rid="ref62">62</xref>], we counted this session if the participant spent more than 60 seconds using apps on a smartphone.</p>
            </list-item>
          </list>
        </sec>
        <sec>
          <title>Entropy</title>
          <p>Using Shannon’s entropy formula [<xref ref-type="bibr" rid="ref64">64</xref>], we calculated the entropy of every participant’s app usage, which presents the app usage pattern:</p>
          <disp-formula>
            <graphic xlink:href="formative_v7i1e28848_fig10.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </disp-formula>
          <p>where <italic>p</italic>(<italic>j</italic>) indicates the probability of use of the <italic>j</italic>-th app by the <italic>i</italic>-th participant and</p>
          <disp-formula>
            <graphic xlink:href="formative_v7i1e28848_fig11.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </disp-formula>
          <p>where <italic>usage_duration</italic>(<italic>j</italic>) presents the <italic>i</italic>-th participant’s usage duration on the <italic>j</italic>-th app. Having an unequal usage duration on each app will result in lower entropy, <italic>E</italic>. In that case, the pattern of app usage will be skewed, and from that, we can infer that the participant has a preference for certain apps. If a participant uses a single app, the entropy (<italic>E</italic>) will be 0. Having an equal usage duration for every app will result in higher entropy.</p>
        </sec>
        <sec>
          <title>Hamming Distance Ratio</title>
          <p>App signatures vary according to the group of people studied (eg, female vs male [<xref ref-type="bibr" rid="ref65">65</xref>]). Depressed and nondepressed students have different app signatures, which makes them uniquely reidentifiable [<xref ref-type="bibr" rid="ref26">26</xref>]. This difference is seen in app category as well [<xref ref-type="bibr" rid="ref26">26</xref>]. Accordingly, we believe that uniqueness in terms of apps as measured by the hamming distance [<xref ref-type="bibr" rid="ref66">66</xref>] can be a good metric to classify depressed and nondepressed students. For participant <italic>i</italic>, first, we calculated the distance from all the depressed participants:</p>
          <disp-formula>
            <graphic xlink:href="formative_v7i1e28848_fig12.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </disp-formula>
          <p>where <italic>D<sub>ij</sub></italic> denotes the distance of the <italic>i</italic>-th participant from the <italic>j</italic>-th depressed participant and <italic>AP<sub>i</sub></italic> and <italic>AP<sub>j</sub></italic> denote the set of apps used by the <italic>i</italic>-th and <italic>j</italic>-th participants, respectively. Next, we found the minimum distance of participant <italic>i</italic> from all (<italic>n</italic>) depressed participants: <italic>D<sub>i</sub></italic>=<italic>min</italic>{<italic>D<sub>i1</sub>, D<sub>i2</sub>, D<sub>i3</sub></italic>, . . . , <italic>D<sub>in</sub></italic>}. Similarly, we calculated the minimum distance of participant <italic>i</italic> in the nondepressed group, <italic>ND<sub>i</sub></italic>. After that, instead of using the distances (<italic>D<sub>i</sub></italic>, <italic>ND<sub>i</sub></italic>) separately as features, we used the ratio of the distances <inline-graphic xlink:href="formative_v7i1e28848_fig13.png" xlink:type="simple" mimetype="image"/>. The motivation behind using the ratio is that it would provide us with information about how much more or less unique a participant is among the depressed group compared to the nondepressed group, and intuitively, this is more informative. Considering application in the real-world scenario where we have only app usage data, we did not use the information about the participant’s (ie, participant <italic>i</italic>) category (depressed or nondepressed) during the calculation of the hamming distance ratio, which makes the feature unbiased.</p>
        </sec>
        <sec>
          <title>Usage Data of App Categories</title>
          <p>To calculate the usage data of an app category, we summed up the usage data of each app in that category. We took several steps while categorizing the apps. For instance, in Google Play, developers set the category of their app. For the apps used by the participants of our study, we retrieved the developers’ referred category by using the app package name and an HTML parser. However, there were apps used by the participants that were not available in Google Play. To categorize those apps, we explored the app features from the online app stores (eg, APKMonk, APKMirror) and the developers’ websites. For instance, participants used the Photo Editor app, available in the Samsung Galaxy Store, which we verified by matching the app’s unique package name. After exploring the app, we found features (eg, adding effects on photos) regarding photography, and this directed us to keep the app in the Photo and Video app category. To categorize the apps, we also followed the app categorization process in previous studies [<xref ref-type="bibr" rid="ref58">58</xref>,<xref ref-type="bibr" rid="ref67">67</xref>]. In addition, we discussed this with 2 students who graduated from the computer science and engineering department. In the case of apps where there was disagreement among the categorizers, we discussed with 2 more students and used the majority rule to select a category. Due to having a small number of participants in each subcategory of the Games category, we grouped all the subcategories (eg, arcade, puzzle) into the Games category. In addition, since during the COVID-19 pandemic, students attended classes through apps, such as Zoom and Google Meet [<xref ref-type="bibr" rid="ref68">68</xref>], we kept such apps in the Education category as all participants were students. 
After categorizing the 1129 apps the students used, we found that most (n=359, 31.8%) apps were in the Tools category and the least number of apps was in the Art and Design category (Table C1 of <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). Moreover, we found more than 50 apps in the Games, Photo and Video, Books and Reference, Communication, and Productivity categories (Table C1 of <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>).</p>
        </sec>
        <sec>
          <title>Calculation of the Number of Extracted Features</title>
          <p>To simply show the calculation, we kept the data in different sets. A set of data presents the total smartphone usage (regardless of the app category) and 27 app categories: <italic>app_category = {arts and design, . . . , weather, smartphone}</italic>.</p>
          <p>Since app usage behavior varies by weekdays and weekends [<xref ref-type="bibr" rid="ref26">26</xref>,<xref ref-type="bibr" rid="ref65">65</xref>], instead of using aggregated 7 days’ (weekday + weekend) data, we used the weekday and weekend data separately as a feature. The set of the days was <italic>days = {Weekdays, Weekends}</italic>.</p>
          <p>The sets of core data and session data were <italic>core_data = {duration, launch, number of apps, entropy, hamming distance}</italic> and <italic>session_data = {total number of sessions, microsession, review session, engage session}</italic>. We calculated the data for the whole day. In addition, we calculated the mean and SD for diurnal usage data consisting of morning, afternoon, evening, and night periods. We denoted these by the set of data characteristics: <italic>data_characteristics = {mean, SD, total data}</italic>.</p>
          <p>In total, we extracted 864 features: (28 items in <italic>app_category</italic> × 2 items in <italic>days</italic> × 5 items in <italic>core_data</italic> × 3 items in <italic>data_characteristics</italic>) + (regardless of the app category: 2 items in <italic>days</italic> × 4 items in <italic>session_data</italic> × 3 items in <italic>data_characteristics</italic>). There were several app categories (eg, Art and Design, Auto and Vehicles) where the number of users was low. Having a nonuser creates a sparse matrix that may not demonstrate enough variance. We excluded all such features where the percentage of users was less than 50%. This resulted in 219 features (Table C2 of <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>) going through the feature selection (FS) step.</p>
        </sec>
        <sec>
          <title>Feature Selection</title>
          <p>Broadly, FS approaches are categorized into 3 groups: (1) wrapper, (2) filter, and (3) embedded methods [<xref ref-type="bibr" rid="ref69">69</xref>]. We explored all 3 approaches. Moreover, we used the stable FS algorithm [<xref ref-type="bibr" rid="ref70">70</xref>] as described later. In addition, to make the models unbiased to the features having larger values, we scaled the features where we performed standard scaling as some of the data contained outliers and standardization is less sensitive to outliers than min-max scaling [<xref ref-type="bibr" rid="ref71">71</xref>].</p>
        </sec>
        <sec>
          <title>The Filter Method</title>
          <p>We used the information gain (IG) algorithm as the filter method. Unlike the Boruta algorithm, the IG algorithm does not inform a fixed set of features that can be optimal for classification. Hence, to select a set of top-scoring features, we set the lower bound by using the 1-in-10 rule [<xref ref-type="bibr" rid="ref72">72</xref>] approach where the top 5 features were selected due to there being 51 depressed participants (see the <italic>Depression Among Participants</italic> section) in our study. Gradually, we increased the number of features to 20 to avoid the possibility of having an overfitted model with a large number of features.</p>
        </sec>
        <sec>
          <title>The Wrapper Method</title>
          <p>Unlike minimal-optimal methods, all-relevant features are selected in Boruta [<xref ref-type="bibr" rid="ref73">73</xref>], where the random forest (RF) algorithm is wrapped. To implement this, we used the <italic>BorutaPy</italic> package [<xref ref-type="bibr" rid="ref74">74</xref>], which works by correcting the <italic>P</italic> values in 2 steps rather than the 1-step Bonferroni correction, which is conservative. We changed the maximum depth of the RF from 3 to 7 [<xref ref-type="bibr" rid="ref74">74</xref>], as suggested by the authors of the package.</p>
        </sec>
        <sec>
          <title>The Embedded Method</title>
          <p>The embedded method combines the strategies of the filter and wrapper methods. We used the RF as the embedded method. In selecting the number of features based on the score of feature importance, we used the same approach as we did for the filter method.</p>
        </sec>
        <sec>
          <title>The Stable Method</title>
          <p>In our study, we extracted 219 features from each of the 100 participants’ app usage data. Due to a small number of participants, there may be unstable features where features may vary across different samples. The stable FS approach [<xref ref-type="bibr" rid="ref70">70</xref>] was found to perform well in this scenario as many bootstrapped samples are created and the final set of features is selected based on a threshold (π<sub>th</sub>), which presents the percentage of subsamples containing a feature. We created 1000 bootstrapped subsamples and used a logistic regression (Logit) classifier as the base estimator that fit on the bootstrapped subsamples. In previous studies of depression identification, researchers have used random thresholds (eg, 0.25 [<xref ref-type="bibr" rid="ref75">75</xref>], 0.75 [<xref ref-type="bibr" rid="ref76">76</xref>]) to select features. Since there is no evidence of getting optimal performance using only those thresholds, we performed an empirical investigation to present the optimal threshold. We started from a threshold of 0.5, which indicates that 50% of the bootstrapped subsamples contain a particular feature. Gradually, we increased the threshold by 0.01 up to a threshold where no more features were selected.</p>
        </sec>
        <sec>
          <title>Development and Validation of the Models</title>
          <p>As there is no one-model-fits-all solution, we used a diverse set of ML algorithms, including those that are widely used in the medical informatics field, as shown in previous systematic reviews: decision tree (DT) [<xref ref-type="bibr" rid="ref77">77</xref>], RF, support vector machine (SVM) [<xref ref-type="bibr" rid="ref77">77</xref>-<xref ref-type="bibr" rid="ref79">79</xref>], and Logit [<xref ref-type="bibr" rid="ref78">78</xref>,<xref ref-type="bibr" rid="ref79">79</xref>] algorithms. Moreover, we used other ML algorithms to increase the diversity of the models: Gaussian Naive Bayes, K-nearest neighbor (KNN), XGBoost (XGB), AdaBoost, extra tree, multilayer perceptron (MLP) [<xref ref-type="bibr" rid="ref71">71</xref>], light gradient boosting machine (LGBM) [<xref ref-type="bibr" rid="ref80">80</xref>], CatBoost [<xref ref-type="bibr" rid="ref81">81</xref>], and gradient boost (GB) [<xref ref-type="bibr" rid="ref82">82</xref>]. As the baseline classifier, we used a dummy classifier. To develop and validate the ML models, we used the nested cross-validation (CV) method. In the outer loop was the leave-one-participant-out cross-validation (LOPOCV), and in the inner loop was a 20-fold CV, where 19 folds were used for tuning the hyperparameters and the remaining 1 fold was used for validation. LOPOCV maximizes the number of samples in training, where in each iteration, (N – 1) samples are used for training and 1 sample is used for testing (<xref rid="figure3" ref-type="fig">Figure 3</xref>). We took steps to prevent the possibility of overfitting the models. We used the nested CV method, which shows unbiased performance [<xref ref-type="bibr" rid="ref83">83</xref>] and is used as the state-of-the-art method to restrain models from overfitting and overestimation [<xref ref-type="bibr" rid="ref35">35</xref>]. 
Additionally, in the outer loop of nested CV, we used LOPOCV, which has a lower variance [<xref ref-type="bibr" rid="ref84">84</xref>] and is used to minimize overfitting [<xref ref-type="bibr" rid="ref21">21</xref>].</p>
          <p>Hyperparameters in ML models play a role in enhancing performance. To tune the hyperparameters (the list of explored hyperparameters for the 13 ML algorithms is available in Table D1 of <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>), we used the Bayesian search optimization technique, which uses an informed search technique and works faster than the uninformed search technique (eg, grid search CV). It is worthwhile to mention that to develop unbiased ML models (<xref rid="figure3" ref-type="fig">Figure 3</xref>), the sample used in the testing was neither present in FS nor in the hyperparameter tuning steps. During model development, we maximized the <italic>F</italic><sub>1</sub>-score as it is based on the sensitivity and precision score, where sensitivity informed how many of the depressed participants were correctly classified and precision informed how many of the predicted depressed participants were truly depressed. After finding the best-performing models, we selected the top 5 algorithms as the base estimators to develop a stacking model, which works based on the wisdom of the crowd concept. To train the meta-learner Logit model of the stacking classifier, we used 10-fold CV. It is worthwhile to mention that in the case of each CV, we used the stratified technique so that the proportion of participants in each group remained the same in the training and testing parts, which ensured the unbiasedness of the model toward a particular group. For ML model development, we used Python packages, including <italic>hyperopt</italic> [<xref ref-type="bibr" rid="ref85">85</xref>] and <italic>sklearn</italic> [<xref ref-type="bibr" rid="ref86">86</xref>].</p>
          <p>To evaluate the performance of the classification models, we used the evaluation metrics precision, <italic>F</italic><sub>1</sub>-score, and accuracy. However, an overfitted model can predict only a single class without being able to predict the other class. At that time, we will obtain ~50% accuracy in our data set as there was almost an equal number of participants in each group. Therefore, in addition to other evaluation metrics, to understand the performance in classifying the students in each group, we also calculated the sensitivity and specificity. Specificity informed us how many of the nondepressed participants were accurately classified.</p>
          <fig id="figure3" position="float">
            <label>Figure 3</label>
            <caption>
              <p>Pipeline of Mon Majhi in identifying the depressed and nondepressed participants. DT: decision tree; GB: gradient boost; KNN: K-nearest neighbor; LGBM: light gradient boosting machine; LOPOCV: leave-one-participant-out cross-validation; MLP: multilayer perceptron; PHQ-9: Patient Health Questionnaire-9; RF: random forest; SVM: support vector machine; XGB: XGBoost.</p>
            </caption>
            <graphic xlink:href="formative_v7i1e28848_fig3.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
        </sec>
        <sec>
          <title>Explanation of the Models</title>
          <p>Explaining the models can be insightful for mental health professionals to understand depressed students. Additionally, this can help in the reproducibility of ML models. To understand how different features affect the probability of remaining in a particular group, we used the Shapley additive explanations (SHAP) [<xref ref-type="bibr" rid="ref87">87</xref>] approach.</p>
        </sec>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>Depression Among Participants</title>
        <p>Of the 100 participants in our study, 51 (51%) had depression and 49 (49%) did not. The PHQ-9 score of the depressed group ranged from 10 to 27, whereas that of the nondepressed group varied from 1 to 9 (<xref rid="figure4" ref-type="fig">Figure 4</xref>a). After exploring differences in the 9 symptoms of the PHQ-9, we found that, on average, depressed students were bothered by each symptom for around more than half of the days in the past 14 days (score=2; <xref rid="figure4" ref-type="fig">Figure 4</xref>b). However, nondepressed students were not bothered by the symptoms at all, except symptom 1 (little interest or pleasure in doing things), where the average score was around 1 (several days; <xref rid="figure4" ref-type="fig">Figure 4</xref>b).</p>
        <fig id="figure4" position="float">
          <label>Figure 4</label>
          <caption>
            <p>Depression score of the participants. (a) PHQ-9 score of the depressed and nondepressed participants. (b) Symptoms 1-9 of the PHQ-9 scale. Scores of 0, 1, 2, and 3 correspond to "not at all," "several days," "more than half of the days," and "nearly every day," respectively. PHQ-9: Patient Health Questionnaire-9.</p>
          </caption>
          <graphic xlink:href="formative_v7i1e28848_fig4.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Performance of the Models in Identifying Depression</title>
        <p>In this section, we present the performance of ML models that are promising for identifying depressed and nondepressed participants. In Tables E1 to E4 of <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>, we present all 13 classifiers’ performance in detail for models based on important features selected by the filter (IG), wrapper (Boruta), embedded (RF), and stable FS methods, respectively.</p>
        <sec>
          <title>Performance of ML Models in the Stable Feature Selection Approach</title>
          <p>In finding the optimal threshold for the stable FS approach, we started from a threshold of 0.5 where a feature was selected if it was present in at least 50% of the 1000 bootstrapped subsamples. At a threshold of 0.5, on average, 61.9 features (SD 2.6) were selected in each iteration of LOPOCV (<xref rid="figure5" ref-type="fig">Figure 5</xref>a). We found the AdaBoost classifier performed the best in the selected features at this threshold, where precision, sensitivity, and specificity were 72.5%, 72.5%, and 71.4%, respectively (<xref rid="figure5" ref-type="fig">Figure 5</xref>b). When we increased the threshold by 0.01, gradually, the number of selected features decreased and reached 0 at a threshold of 0.98. At a threshold of 0.6, the number of selected features was 28.6, which was less than half of the number of features selected at a threshold of 0.5 (<xref rid="figure5" ref-type="fig">Figure 5</xref>a). However, from a threshold of 0.5 to 0.6, the models’ performance did not vary largely (<xref rid="figure5" ref-type="fig">Figure 5</xref>b). In fact, the precision of the best models at each threshold was above 70%. In terms of precision, we found the best model at a threshold of 0.65, where the LGBM model–predicted depressed group was correct in 78% (n=39) of cases, and the sensitivity of 76.5% and specificity of 77.6% were also higher. Although an average of only 11.1 (SD 0.9) features were selected at a threshold of 0.77, in terms of sensitivity (82.4%) and the <italic>F</italic><sub>1</sub>-score (78.5%), the best performance was found at this threshold. 
However, the least number of features was selected at a threshold of 0.97, where in each iteration of LOPOCV, an average of 1.3 (SD 0.5) features were selected (<xref rid="figure5" ref-type="fig">Figure 5</xref>a) and the LGBM model’s predictions were the most accurate (precision=63.3%, sensitivity=60.8%, specificity=63.3%; <xref rid="figure5" ref-type="fig">Figure 5</xref>b) at this threshold.</p>
          <fig id="figure5" position="float">
            <label>Figure 5</label>
            <caption>
              <p>(a) Number of selected features and (b) performance of the best models at each threshold of the stable FS approach. The text at the end of the dotted lines presents the best models. FS: feature selection; Light GBM: light gradient boosting machine; LOPOCV: leave-one-participant-out cross-validation; ML: machine learning; MLP: multilayer perceptron.</p>
            </caption>
            <graphic xlink:href="formative_v7i1e28848_fig5.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
        </sec>
        <sec>
          <title>Performance of ML Models in the Boruta Feature Selection Approach</title>
          <p>Unlike all other FS approaches, in the wrapper method Boruta, we found all-relevant features showing higher performance for prediction tasks. To find the optimal performance of the models, we tuned the base estimator RF’s maximum depth, which is wrapped in Boruta. On average, around 5 features were selected by Boruta when we varied the maximum depth from 3 to 7 (<xref rid="figure6" ref-type="fig">Figure 6</xref>a). Although the number of features did not vary, the set of selected features varied (Table F1 of <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>), which was reflected in the performance of the ML models (<xref rid="figure6" ref-type="fig">Figure 6</xref>b). We found the maximum sensitivity and <italic>F</italic><sub>1</sub>-score when depth was 4, where the KNN algorithm–based model showed a sensitivity of 82.4% and an <italic>F</italic><sub>1</sub>-score of 76.4%. However, the specificity (65.3%) of the model was below 70%. We found a better-performing model at a maximum depth of 6, where the GB algorithm model accurately identified 74.5% (n=38) of the depressed participants (sensitivity=74.5%), and the predicted depressed group was also correct in 73.1% (n=38) cases (precision=73.1%), with a specificity of 71.4% (<xref rid="figure6" ref-type="fig">Figure 6</xref>b).</p>
          <fig id="figure6" position="float">
            <label>Figure 6</label>
            <caption>
              <p>(a) Number of selected features and (b) ML models’ performance at different depths of the estimator of the Boruta algorithm. GB: gradient boost; KNN: K-nearest neighbor; LOPOCV: leave-one-participant-out cross-validation; ML: machine learning.</p>
            </caption>
            <graphic xlink:href="formative_v7i1e28848_fig6.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
        </sec>
        <sec>
          <title>Comparison of the Feature Selection Approaches</title>
          <p>We compared the performance of the FS approaches by selecting the same number of features in each approach. In the filter method IG and the embedded method RF, we selected a subset of top-scoring features, where the lower and upper bounds were set following a process as described in the <italic>Feature Selection</italic> section. Unlike the filter and embedded methods, in the stable and also in the wrapper method Boruta, there was a variation in the number of selected features in each iteration of LOPOCV. Thus, for those 2 methods, we selected the best model by rounding the average number of selected features in LOPOCV so that the number of features becomes comparable. We found that using 5 features selected by the IG, the DT model performed better than the other 12 ML classifiers, where the precision, sensitivity, and specificity were 65.5%, 74.5%, and 59.2%, respectively (<xref ref-type="table" rid="table1">Table 1</xref>). Using the 5 features selected by the embedded and stable methods, CatBoost’s (precision=64.9%, sensitivity=72.5%, specificity=59.2%) and the RF’s (precision=69.1%, sensitivity=74.5%, specificity=65.3%) performance was higher, respectively (<xref ref-type="table" rid="table2">Table 2</xref>). However, the models based on the 5 features selected by Boruta outperformed the models based on the 5 features selected by the other 3 FS approaches (<xref ref-type="table" rid="table1">Tables 1</xref> and <xref ref-type="table" rid="table2">2</xref>). As mentioned previously, the GB model using 5 features selected by Boruta had a sensitivity, specificity, and <italic>F</italic><sub>1</sub>-score of 74.5%, 71.4%, and 73.8%, respectively (<xref ref-type="table" rid="table1">Table 1</xref>). 
In addition, it was interesting to observe that the same performance was found when using 6 and 7 features selected by the IG, 9 and 10 features selected by the RF, and 14 features selected by the stable FS approach (<xref ref-type="table" rid="table1">Tables 1</xref> and <xref ref-type="table" rid="table2">2</xref>). Thus, the GB model, developed by the 5 selected features of the all-relevant FS method, can be called the parsimonious model due to having a better predictive ability with a smaller number of features.</p>
          <p>The optimal performance of the ML models varied by the number of selected features, as shown in <xref ref-type="table" rid="table1">Tables 1</xref> and <xref ref-type="table" rid="table2">2</xref>. For example, in the IG, the best performance was found using 9 features (DT: precision=76.6%, sensitivity=70.6%, specificity=77.6%), while in the RF FS approach, we found the best performance using 15 features (GB: precision=74.1%, sensitivity=78.4%, specificity=71.4%). Considering the performance of all models of all FS approaches, a model with the maximum <italic>F</italic><sub>1</sub>-score and sensitivity was found by using around 11 features of the stable FS approach (LGBM: precision=75%, sensitivity=82.4%, <italic>F</italic><sub>1</sub>-score=78.5%, specificity=71.4%). However, although the models’ performance varied by the number of features, it appeared that in up to 10 features that were selected by each FS approach, there were several sets of features based on which the models’ scores were around 70% when the sensitivity, specificity, precision, and <italic>F</italic><sub>1</sub>-score were calculated (<xref ref-type="table" rid="table1">Tables 1</xref> and <xref ref-type="table" rid="table2">2</xref>).</p>
          <table-wrap position="float" id="table1">
            <label>Table 1</label>
            <caption>
              <p>Performance of the best models while selecting n features in the filter and wrapper FS<sup>a</sup> approaches.</p>
            </caption>
            <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
              <col width="100"/>
              <col width="90"/>
              <col width="90"/>
              <col width="90"/>
              <col width="90"/>
              <col width="90"/>
              <col width="0"/>
              <col width="90"/>
              <col width="90"/>
              <col width="90"/>
              <col width="90"/>
              <col width="90"/>
              <thead>
                <tr valign="top">
                  <td>Features, n</td>
                  <td colspan="6">Filter method (IG<sup>b</sup>)</td>
                  <td colspan="5">Wrapper method (Boruta<sup>c</sup>)</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Best model</td>
                  <td>Precision</td>
                  <td>Sensitivity</td>
                  <td><italic>F</italic><sub>1</sub>-score</td>
                  <td>Specificity</td>
                  <td colspan="2">Best model</td>
                  <td>Precision</td>
                  <td>Sensitivity</td>
                  <td><italic>F</italic><sub>1</sub>-score</td>
                  <td>Specificity</td>
                </tr>
              </thead>
              <tbody>
                <tr valign="top">
                  <td>5</td>
                  <td>DT<sup>d</sup></td>
                  <td>0.655</td>
                  <td>0.745</td>
                  <td>0.697</td>
                  <td>0.592</td>
                  <td colspan="2">GB<sup>e</sup></td>
                  <td>0.731<sup>f</sup></td>
                  <td>0.745<sup>f</sup></td>
                  <td>0.738<sup>f</sup></td>
                  <td>0.714<sup>f</sup></td>
                </tr>
                <tr valign="top">
                  <td>6</td>
                  <td>XGB<sup>g</sup></td>
                  <td>0.731<sup>f</sup></td>
                  <td>0.745<sup>f</sup></td>
                  <td>0.738<sup>f</sup></td>
                  <td>0.714<sup>f</sup></td>
                  <td colspan="2">KNN<sup>h</sup></td>
                  <td>0.690</td>
                  <td>0.784</td>
                  <td>0.734</td>
                  <td>0.633</td>
                </tr>
                <tr valign="top">
                  <td>7</td>
                  <td>CatBoost</td>
                  <td>0.731<sup>f</sup></td>
                  <td>0.745<sup>f</sup></td>
                  <td>0.738<sup>f</sup></td>
                  <td>0.714<sup>f</sup></td>
                  <td colspan="2">—<sup>i,j</sup></td>
                  <td>—</td>
                  <td>—</td>
                  <td>—</td>
                  <td>—</td>
                </tr>
                <tr valign="top">
                  <td>8</td>
                  <td>DT</td>
                  <td>0.750<sup>k</sup></td>
                  <td>0.706<sup>k</sup></td>
                  <td>0.727<sup>k</sup></td>
                  <td>0.755<sup>k</sup></td>
                  <td colspan="2">—</td>
                  <td>—</td>
                  <td>—</td>
                  <td>—</td>
                  <td>—</td>
                </tr>
                <tr valign="top">
                  <td>9</td>
                  <td>DT</td>
                  <td>0.766<sup>l</sup></td>
                  <td>0.706<sup>l</sup></td>
                  <td>0.735<sup>l</sup></td>
                  <td>0.776<sup>l</sup></td>
                  <td colspan="2">—</td>
                  <td>—</td>
                  <td>—</td>
                  <td>—</td>
                  <td>—</td>
                </tr>
                <tr valign="top">
                  <td>10</td>
                  <td>LGBM<sup>m</sup></td>
                  <td>0.695</td>
                  <td>0.804</td>
                  <td>0.745</td>
                  <td>0.633</td>
                  <td colspan="2">—</td>
                  <td>—</td>
                  <td>—</td>
                  <td>—</td>
                  <td>—</td>
                </tr>
                <tr valign="top">
                  <td>11</td>
                  <td>LGBM</td>
                  <td>0.712</td>
                  <td>0.725</td>
                  <td>0.718</td>
                  <td>0.694</td>
                  <td colspan="2">—</td>
                  <td>—</td>
                  <td>—</td>
                  <td>—</td>
                  <td>—</td>
                </tr>
                <tr valign="top">
                  <td>12</td>
                  <td>XGB</td>
                  <td>0.691</td>
                  <td>0.745</td>
                  <td>0.717</td>
                  <td>0.653</td>
                  <td colspan="2">—</td>
                  <td>—</td>
                  <td>—</td>
                  <td>—</td>
                  <td>—</td>
                </tr>
                <tr valign="top">
                  <td>13</td>
                  <td>XGB</td>
                  <td>0.702</td>
                  <td>0.784</td>
                  <td>0.741</td>
                  <td>0.653</td>
                  <td colspan="2">—</td>
                  <td>—</td>
                  <td>—</td>
                  <td>—</td>
                  <td>—</td>
                </tr>
                <tr valign="top">
                  <td>14</td>
                  <td>GB</td>
                  <td>0.698</td>
                  <td>0.725</td>
                  <td>0.712</td>
                  <td>0.673</td>
                  <td colspan="2">—</td>
                  <td>—</td>
                  <td>—</td>
                  <td>—</td>
                  <td>—</td>
                </tr>
                <tr valign="top">
                  <td>15</td>
                  <td>LGBM</td>
                  <td>0.714</td>
                  <td>0.686</td>
                  <td>0.700</td>
                  <td>0.714</td>
                  <td colspan="2">—</td>
                  <td>—</td>
                  <td>—</td>
                  <td>—</td>
                  <td>—</td>
                </tr>
                <tr valign="top">
                  <td>16</td>
                  <td>GB</td>
                  <td>0.700</td>
                  <td>0.686</td>
                  <td>0.693</td>
                  <td>0.694</td>
                  <td colspan="2">—</td>
                  <td>—</td>
                  <td>—</td>
                  <td>—</td>
                  <td>—</td>
                </tr>
                <tr valign="top">
                  <td>17</td>
                  <td>DT</td>
                  <td>0.778</td>
                  <td>0.686</td>
                  <td>0.729</td>
                  <td>0.796</td>
                  <td colspan="2">—</td>
                  <td>—</td>
                  <td>—</td>
                  <td>—</td>
                  <td>—</td>
                </tr>
                <tr valign="top">
                  <td>18</td>
                  <td>LGBM</td>
                  <td>0.704</td>
                  <td>0.745</td>
                  <td>0.724</td>
                  <td>0.673</td>
                  <td colspan="2">—</td>
                  <td>—</td>
                  <td>—</td>
                  <td>—</td>
                  <td>—</td>
                </tr>
                <tr valign="top">
                  <td>19</td>
                  <td>XGB</td>
                  <td>0.712</td>
                  <td>0.725</td>
                  <td>0.718</td>
                  <td>0.694</td>
                  <td colspan="2">—</td>
                  <td>—</td>
                  <td>—</td>
                  <td>—</td>
                  <td>—</td>
                </tr>
                <tr valign="top">
                  <td>20</td>
                  <td>XGB</td>
                  <td>0.720</td>
                  <td>0.706</td>
                  <td>0.713</td>
                  <td>0.714</td>
                  <td colspan="2">—</td>
                  <td>—</td>
                  <td>—</td>
                  <td>—</td>
                  <td>—</td>
                </tr>
              </tbody>
            </table>
            <table-wrap-foot>
              <fn id="table1fn1">
                <p><sup>a</sup>FS: feature selection.</p>
              </fn>
              <fn id="table1fn2">
                <p><sup>b</sup>IG: information gain.</p>
              </fn>
              <fn id="table1fn3">
                <p><sup>c</sup>The number of features selected by Boruta and stable FS was rounded to make it comparable to the other FS approaches.</p>
              </fn>
              <fn id="table1fn4">
                <p><sup>d</sup>DT: decision tree.</p>
              </fn>
              <fn id="table1fn5">
                <p><sup>e</sup>GB: gradient boost.</p>
              </fn>
              <fn id="table1fn6">
                <p><sup>f</sup>Low-performing (rank 3) classifiers in each approach.</p>
              </fn>
              <fn id="table1fn7">
                <p><sup>g</sup>XGB: XGBoost.</p>
              </fn>
              <fn id="table1fn8">
                <p><sup>h</sup>KNN: K-nearest neighbor.</p>
              </fn>
              <fn id="table1fn9">
                <p><sup>i</sup>N/A: not applicable.</p>
              </fn>
              <fn id="table1fn10">
                <p><sup>j</sup>In the Boruta method, the number of maximum important selected features was 5.5, so we set all values for 7-20 selected features as N/A.</p>
              </fn>
              <fn id="table1fn11">
                <p><sup>k</sup>Medium-performing (rank 2) classifiers in each approach.</p>
              </fn>
              <fn id="table1fn12">
                <p><sup>l</sup>High-performing (rank 1) classifiers in each approach.</p>
              </fn>
              <fn id="table1fn13">
                <p><sup>m</sup>LGBM: light gradient boosting machine.</p>
              </fn>
            </table-wrap-foot>
          </table-wrap>
          <table-wrap position="float" id="table2">
            <label>Table 2</label>
            <caption>
              <p>Performance of the best models while selecting n features in the embedded and stable FS<sup>a</sup> approaches.</p>
            </caption>
            <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
              <col width="100"/>
              <col width="90"/>
              <col width="90"/>
              <col width="90"/>
              <col width="90"/>
              <col width="90"/>
              <col width="0"/>
              <col width="90"/>
              <col width="90"/>
              <col width="90"/>
              <col width="90"/>
              <col width="90"/>
              <thead>
                <tr valign="top">
                  <td>Features, n</td>
                  <td colspan="6">Embedded method (RF<sup>b</sup>)</td>
                  <td colspan="5">Stable method<sup>c</sup></td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Best model</td>
                  <td>Precision</td>
                  <td>Sensitivity</td>
                  <td><italic>F</italic><sub>1</sub>-score</td>
                  <td>Specificity</td>
                  <td colspan="2">Best model</td>
                  <td>Precision</td>
                  <td>Sensitivity</td>
                  <td><italic>F</italic><sub>1</sub>-score</td>
                  <td>Specificity</td>
                </tr>
              </thead>
              <tbody>
                <tr valign="top">
                  <td>5</td>
                  <td>CatBoost</td>
                  <td>0.649</td>
                  <td>0.725</td>
                  <td>0.685</td>
                  <td>0.592</td>
                  <td colspan="2">RF</td>
                  <td>0.691</td>
                  <td>0.745</td>
                  <td>0.717</td>
                  <td>0.653</td>
                </tr>
                <tr valign="top">
                  <td>6</td>
                  <td>XGB<sup>d</sup></td>
                  <td>0.679</td>
                  <td>0.706</td>
                  <td>0.692</td>
                  <td>0.653</td>
                  <td colspan="2">LGBM<sup>e</sup></td>
                  <td>0.773</td>
                  <td>0.667</td>
                  <td>0.716</td>
                  <td>0.796</td>
                </tr>
                <tr valign="top">
                  <td>7</td>
                  <td>GB<sup>f</sup></td>
                  <td>0.707</td>
                  <td>0.804</td>
                  <td>0.752</td>
                  <td>0.653</td>
                  <td colspan="2">LGBM</td>
                  <td>0.760</td>
                  <td>0.745</td>
                  <td>0.752</td>
                  <td>0.755</td>
                </tr>
                <tr valign="top">
                  <td>8</td>
                  <td>DT<sup>g</sup></td>
                  <td>0.735</td>
                  <td>0.706</td>
                  <td>0.720</td>
                  <td>0.735</td>
                  <td colspan="2">LGBM</td>
                  <td>0.704</td>
                  <td>0.745</td>
                  <td>0.724</td>
                  <td>0.673</td>
                </tr>
                <tr valign="top">
                  <td>9</td>
                  <td>LGBM</td>
                  <td>0.731<sup>h</sup></td>
                  <td>0.745<sup>h</sup></td>
                  <td>0.738<sup>h</sup></td>
                  <td>0.714<sup>h</sup></td>
                  <td colspan="2">LGBM</td>
                  <td>0.690</td>
                  <td>0.784</td>
                  <td>0.734</td>
                  <td>0.633</td>
                </tr>
                <tr valign="top">
                  <td>10</td>
                  <td>LGBM</td>
                  <td>0.731<sup>h</sup></td>
                  <td>0.745<sup>h</sup></td>
                  <td>0.738<sup>h</sup></td>
                  <td>0.714<sup>h</sup></td>
                  <td colspan="2">LGBM</td>
                  <td>0.737</td>
                  <td>0.824</td>
                  <td>0.778</td>
                  <td>0.694</td>
                </tr>
                <tr valign="top">
                  <td>11</td>
                  <td>LGBM</td>
                  <td>0.755<sup>i</sup></td>
                  <td>0.725<sup>i</sup></td>
                  <td>0.740<sup>i</sup></td>
                  <td>0.755<sup>i</sup></td>
                  <td colspan="2">LGBM</td>
                  <td>0.750<sup>j</sup></td>
                  <td>0.824<sup>j</sup></td>
                  <td>0.785<sup>j</sup></td>
                  <td>0.714<sup>j</sup></td>
                </tr>
                <tr valign="top">
                  <td>12</td>
                  <td>LGBM</td>
                  <td>0.755<sup>i</sup></td>
                  <td>0.725<sup>i</sup></td>
                  <td>0.740<sup>i</sup></td>
                  <td>0.755<sup>i</sup></td>
                  <td colspan="2">LGBM</td>
                  <td>0.750<sup>h</sup></td>
                  <td>0.765<sup>h</sup></td>
                  <td>0.757<sup>h</sup></td>
                  <td>0.735<sup>h</sup></td>
                </tr>
                <tr valign="top">
                  <td>13</td>
                  <td>DT</td>
                  <td>0.735</td>
                  <td>0.706</td>
                  <td>0.720</td>
                  <td>0.735</td>
                  <td colspan="2">LGBM</td>
                  <td>0.750<sup>h</sup></td>
                  <td>0.765<sup>h</sup></td>
                  <td>0.757<sup>h</sup></td>
                  <td>0.735<sup>h</sup></td>
                </tr>
                <tr valign="top">
                  <td>14</td>
                  <td>KNN<sup>k</sup></td>
                  <td>0.720</td>
                  <td>0.706</td>
                  <td>0.713</td>
                  <td>0.714</td>
                  <td colspan="2">LGBM</td>
                  <td>0.731</td>
                  <td>0.745</td>
                  <td>0.738</td>
                  <td>0.714</td>
                </tr>
                <tr valign="top">
                  <td>15</td>
                  <td>GB</td>
                  <td>0.741<sup>j</sup></td>
                  <td>0.784<sup>j</sup></td>
                  <td>0.762<sup>j</sup></td>
                  <td>0.714<sup>j</sup></td>
                  <td colspan="2">LGBM</td>
                  <td>0.740</td>
                  <td>0.725</td>
                  <td>0.733</td>
                  <td>0.735</td>
                </tr>
                <tr valign="top">
                  <td>16</td>
                  <td>LGBM</td>
                  <td>0.712</td>
                  <td>0.725</td>
                  <td>0.718</td>
                  <td>0.694</td>
                  <td colspan="2">LGBM</td>
                  <td>0.765<sup>i</sup></td>
                  <td>0.765<sup>i</sup></td>
                  <td>0.765<sup>i</sup></td>
                  <td>0.755<sup>i</sup></td>
                </tr>
                <tr valign="top">
                  <td>17</td>
                  <td>RF</td>
                  <td>0.696</td>
                  <td>0.765</td>
                  <td>0.729</td>
                  <td>0.653</td>
                  <td colspan="2">LGBM</td>
                  <td>0.680</td>
                  <td>0.667</td>
                  <td>0.673</td>
                  <td>0.673</td>
                </tr>
                <tr valign="top">
                  <td>18</td>
                  <td>DT</td>
                  <td>0.660</td>
                  <td>0.686</td>
                  <td>0.673</td>
                  <td>0.633</td>
                  <td colspan="2">DT</td>
                  <td>0.700</td>
                  <td>0.686</td>
                  <td>0.693</td>
                  <td>0.694</td>
                </tr>
                <tr valign="top">
                  <td>19</td>
                  <td>LGBM</td>
                  <td>0.729</td>
                  <td>0.686</td>
                  <td>0.707</td>
                  <td>0.735</td>
                  <td colspan="2">LGBM</td>
                  <td>0.698</td>
                  <td>0.725</td>
                  <td>0.712</td>
                  <td>0.673</td>
                </tr>
                <tr valign="top">
                  <td>20</td>
                  <td>GB</td>
                  <td>0.712</td>
                  <td>0.725</td>
                  <td>0.718</td>
                  <td>0.694</td>
                  <td colspan="2">LGBM</td>
                  <td>0.725</td>
                  <td>0.725</td>
                  <td>0.725</td>
                  <td>0.714</td>
                </tr>
              </tbody>
            </table>
            <table-wrap-foot>
              <fn id="table2fn1">
                <p><sup>a</sup>FS: feature selection.</p>
              </fn>
              <fn id="table2fn2">
                <p><sup>b</sup>RF: random forest.</p>
              </fn>
              <fn id="table2fn3">
                <p><sup>c</sup>The number of features selected by Boruta and stable FS was rounded to make it comparable to the other FS approaches.</p>
              </fn>
              <fn id="table2fn4">
                <p><sup>d</sup>XGB: XGBoost.</p>
              </fn>
              <fn id="table2fn5">
                <p><sup>e</sup>LGBM: light gradient boosting machine.</p>
              </fn>
              <fn id="table2fn6">
                <p><sup>f</sup>GB: gradient boost.</p>
              </fn>
              <fn id="table2fn7">
                <p><sup>g</sup>DT: decision tree.</p>
              </fn>
              <fn id="table2fn8">
                <p><sup>h</sup>Low-performing (rank 3) classifiers in each approach.</p>
              </fn>
              <fn id="table2fn9">
                <p><sup>i</sup>Medium-performing (rank 2) classifiers in each approach.</p>
              </fn>
              <fn id="table2fn10">
                <p><sup>j</sup>High-performing (rank 1) classifiers in each approach.</p>
              </fn>
              <fn id="table2fn11">
                <p><sup>k</sup>KNN: K-nearest neighbor.</p>
              </fn>
            </table-wrap-foot>
          </table-wrap>
        </sec>
        <sec>
          <title>Performance of the Stacking Models</title>
          <p>After finding the optimal set of features for each FS approach, we built stacking models based on the top 5 classifiers. While selecting classifiers based on the embedded method’s features, we found that although a model based on 15 features demonstrated the maximum <italic>F</italic><sub>1</sub>-score (<xref ref-type="table" rid="table1">Tables 1</xref> and <xref ref-type="table" rid="table2">2</xref>), most classifiers’ performance remained higher while using 12 features (see <xref ref-type="table" rid="table3">Table 3</xref>; for comparison, see Table E3 of <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). However, in the IG, Boruta, and stable methods, the best set of top 5 classifiers was found in 9 features, at the base estimator’s maximum depth of 6, and at a threshold of 0.77, respectively (for details, see Tables E1, E2, and E4 of <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>).</p>
          <p>Interestingly, from the top 5 classifiers of each FS approach, it was apparent that boosting models can find important behavioral patterns that make their predictions more accurate, keeping most of them in the top 5 classifiers list (<xref ref-type="table" rid="table3">Table 3</xref>), although we used a baseline dummy classifier and 13 different ML algorithms where linear and nonlinear algorithms were present. We found at least one variation of the GB models remained as one of the top 2 classifiers. The LGBM model in particular performed better across different sets of features. The LGBM model showed good performance consistently on most feature sets selected by the stable FS approach (<xref ref-type="table" rid="table1">Tables 1</xref> and <xref ref-type="table" rid="table2">2</xref>). Even when the number of features remained constant, the LGBM model remained one of the top 5 classifiers in each FS approach (<xref ref-type="table" rid="table3">Table 3</xref>).</p>
          <p>The stacking models based on features selected by the filter, wrapper, and embedded methods had precision, sensitivity, specificity, and <italic>F</italic><sub>1</sub>-score values of more than 70%. The stacking model based on the features selected by the wrapper method Boruta correctly identified 80.4% (n=41; sensitivity=80.4%) of depressed participants. The predicted depressed group was also accurate in 77.4% (n=41) of cases (precision=77.4%), making this the most accurate model among all 4 stacking classifiers, as presented in <xref ref-type="table" rid="table4">Table 4</xref>. However, it was surprising to see that the stable method–selected feature-based stacking model had a precision and specificity lower than 70% (<xref ref-type="table" rid="table4">Table 4</xref>), although this method’s selected feature set at a threshold of 0.77 produced the LGBM model with a higher sensitivity (82.4%) and <italic>F</italic><sub>1</sub>-score (78.5%) than any other individual model (<xref ref-type="table" rid="table3">Table 3</xref>). Additionally, we found the LGBM model had a relatively lower balanced accuracy—(sensitivity + specificity)/2—than the best stacking model: (82.4% + 71.4%)/2 = 76.9% for the LGBM model (<xref ref-type="table" rid="table3">Table 3</xref>) versus (80.4% + 75.5%)/2 = 77.9% for the Boruta-selected feature-based stacking model (<xref ref-type="table" rid="table4">Table 4</xref>).</p>
          <table-wrap position="float" id="table3">
            <label>Table 3</label>
            <caption>
              <p>Top 5 classifiers and the baseline classifier’s performance based on the performance of the best set of features of each FS<sup>a</sup> approach.</p>
            </caption>
            <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
              <col width="30"/>
              <col width="540"/>
              <col width="0"/>
              <col width="120"/>
              <col width="0"/>
              <col width="120"/>
              <col width="0"/>
              <col width="100"/>
              <col width="0"/>
              <col width="90"/>
              <thead>
                <tr valign="top">
                  <td colspan="3">Method and model name</td>
                  <td colspan="2">Precision</td>
                  <td colspan="2">Sensitivity</td>
                  <td colspan="2"><italic>F</italic><sub>1</sub>-score</td>
                  <td>Specificity</td>
                </tr>
              </thead>
              <tbody>
                <tr valign="top">
                  <td colspan="3">
                    <bold>Filter method (IG<sup>b</sup>; n=9 features)</bold>
                  </td>
                  <td colspan="2">
                    <break/>
                  </td>
                  <td colspan="2">
                    <break/>
                  </td>
                  <td colspan="2">
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>DT<sup>c</sup></td>
                  <td colspan="2">0.766</td>
                  <td colspan="2">0.706</td>
                  <td colspan="2">0.735</td>
                  <td colspan="2">0.776</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>GB<sup>d</sup></td>
                  <td colspan="2">0.717</td>
                  <td colspan="2">0.745</td>
                  <td colspan="2">0.731</td>
                  <td colspan="2">0.694</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>AdaBoost</td>
                  <td colspan="2">0.729</td>
                  <td colspan="2">0.686</td>
                  <td colspan="2">0.707</td>
                  <td colspan="2">0.735</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>LGBM<sup>e</sup></td>
                  <td colspan="2">0.704</td>
                  <td colspan="2">0.745</td>
                  <td colspan="2">0.724</td>
                  <td colspan="2">0.673</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>XGB<sup>f</sup></td>
                  <td colspan="2">0.692</td>
                  <td colspan="2">0.706</td>
                  <td colspan="2">0.699</td>
                  <td colspan="2">0.673</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Baseline (dummy)</td>
                  <td colspan="2">0.510</td>
                  <td colspan="2">1.000</td>
                  <td colspan="2">0.675</td>
                  <td colspan="2">0</td>
                </tr>
                <tr valign="top">
                  <td colspan="3">
                    <bold>Wrapper method (Boruta; base estimator’s maximum depth=6)</bold>
                  </td>
                  <td colspan="2">
                    <break/>
                  </td>
                  <td colspan="2">
                    <break/>
                  </td>
                  <td colspan="2">
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>GB</td>
                  <td colspan="2">0.731</td>
                  <td colspan="2">0.745</td>
                  <td colspan="2">0.738</td>
                  <td colspan="2">0.714</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>KNN<sup>g</sup></td>
                  <td colspan="2">0.707</td>
                  <td colspan="2">0.804</td>
                  <td colspan="2">0.752</td>
                  <td colspan="2">0.653</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>XGB</td>
                  <td colspan="2">0.725</td>
                  <td colspan="2">0.725</td>
                  <td colspan="2">0.725</td>
                  <td colspan="2">0.714</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>AdaBoost</td>
                  <td colspan="2">0.696</td>
                  <td colspan="2">0.765</td>
                  <td colspan="2">0.729</td>
                  <td colspan="2">0.653</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>LGBM</td>
                  <td colspan="2">0.714</td>
                  <td colspan="2">0.686</td>
                  <td colspan="2">0.700</td>
                  <td colspan="2">0.714</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Baseline (dummy)</td>
                  <td colspan="2">0.510</td>
                  <td colspan="2">1.000</td>
                  <td colspan="2">0.675</td>
                  <td colspan="2">0</td>
                </tr>
                <tr valign="top">
                  <td colspan="3">
                    <bold>Embedded method (RF<sup>h</sup>; n=12 features)</bold>
                  </td>
                  <td colspan="2">
                    <break/>
                  </td>
                  <td colspan="2">
                    <break/>
                  </td>
                  <td colspan="2">
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>GB</td>
                  <td colspan="2">0.732</td>
                  <td colspan="2">0.804</td>
                  <td colspan="2">0.766</td>
                  <td colspan="2">0.694</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>LGBM</td>
                  <td colspan="2">0.755</td>
                  <td colspan="2">0.725</td>
                  <td colspan="2">0.740</td>
                  <td colspan="2">0.755</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Logit<sup>i</sup></td>
                  <td colspan="2">0.750</td>
                  <td colspan="2">0.706</td>
                  <td colspan="2">0.727</td>
                  <td colspan="2">0.755</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>DT</td>
                  <td colspan="2">0.729</td>
                  <td colspan="2">0.686</td>
                  <td colspan="2">0.707</td>
                  <td colspan="2">0.735</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>KNN</td>
                  <td colspan="2">0.706</td>
                  <td colspan="2">0.706</td>
                  <td colspan="2">0.706</td>
                  <td colspan="2">0.694</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Baseline (dummy)</td>
                  <td colspan="2">0.510</td>
                  <td colspan="2">1.000</td>
                  <td colspan="2">0.675</td>
                  <td colspan="2">0</td>
                </tr>
                <tr valign="top">
                  <td colspan="3">
                    <bold>Stable method (threshold=0.77)</bold>
                  </td>
                  <td colspan="2">
                    <break/>
                  </td>
                  <td colspan="2">
                    <break/>
                  </td>
                  <td colspan="2">
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>LGBM</td>
                  <td colspan="2">0.750</td>
                  <td colspan="2">0.824</td>
                  <td colspan="2">0.785</td>
                  <td colspan="2">0.714</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>XGB</td>
                  <td colspan="2">0.745</td>
                  <td colspan="2">0.745</td>
                  <td colspan="2">0.745</td>
                  <td colspan="2">0.735</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>DT</td>
                  <td colspan="2">0.706</td>
                  <td colspan="2">0.706</td>
                  <td colspan="2">0.706</td>
                  <td colspan="2">0.694</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>GB</td>
                  <td colspan="2">0.706</td>
                  <td colspan="2">0.706</td>
                  <td colspan="2">0.706</td>
                  <td colspan="2">0.694</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>CatBoost</td>
                  <td colspan="2">0.691</td>
                  <td colspan="2">0.745</td>
                  <td colspan="2">0.717</td>
                  <td colspan="2">0.653</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Baseline (dummy)</td>
                  <td colspan="2">0.510</td>
                  <td colspan="2">1.000</td>
                  <td colspan="2">0.675</td>
                  <td colspan="2">0</td>
                </tr>
              </tbody>
            </table>
            <table-wrap-foot>
              <fn id="table3fn1">
                <p><sup>a</sup>FS: feature selection.</p>
              </fn>
              <fn id="table3fn2">
                <p><sup>b</sup>IG: information gain.</p>
              </fn>
              <fn id="table3fn3">
                <p><sup>c</sup>DT: decision tree.</p>
              </fn>
              <fn id="table3fn4">
                <p><sup>d</sup>GB: gradient boost.</p>
              </fn>
              <fn id="table3fn5">
                <p><sup>e</sup>LGBM: light gradient boosting machine.</p>
              </fn>
              <fn id="table3fn6">
                <p><sup>f</sup>XGB: XGBoost.</p>
              </fn>
              <fn id="table3fn7">
                <p><sup>g</sup>KNN: K-nearest neighbor.</p>
              </fn>
              <fn id="table3fn8">
                <p><sup>h</sup>RF: random forest.</p>
              </fn>
              <fn id="table3fn9">
                <p><sup>i</sup>Logit: logistic regression.</p>
              </fn>
            </table-wrap-foot>
          </table-wrap>
          <table-wrap position="float" id="table4">
            <label>Table 4</label>
            <caption>
              <p>Performance of the stacking classifiers based on the top 5 classifiers of the best set of features of each FS<sup>a</sup> method.</p>
            </caption>
            <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
              <col width="380"/>
              <col width="100"/>
              <col width="100"/>
              <col width="100"/>
              <col width="100"/>
              <col width="110"/>
              <col width="110"/>
              <thead>
                <tr valign="top">
                  <td>FS method</td>
                  <td>Precision</td>
                  <td>Sensitivity</td>
                  <td><italic>F</italic><sub>1</sub>-score</td>
                  <td>Specificity</td>
                  <td>AUC<sup>b</sup> score</td>
                  <td>Accuracy</td>
                </tr>
              </thead>
              <tbody>
                <tr valign="top">
                  <td>Filter method (IG<sup>c</sup>; n=9 features)</td>
                  <td>0.735</td>
                  <td>0.706</td>
                  <td>0.72</td>
                  <td>0.735</td>
                  <td>0.72</td>
                  <td>0.72</td>
                </tr>
                <tr valign="top">
                  <td>Wrapper method (Boruta; maximum depth=6)</td>
                  <td>0.774</td>
                  <td>0.804</td>
                  <td>0.788</td>
                  <td>0.755</td>
                  <td>0.78</td>
                  <td>0.78</td>
                </tr>
                <tr valign="top">
                  <td>Embedded method (RF<sup>d</sup>; n=12 features)</td>
                  <td>0.725</td>
                  <td>0.725</td>
                  <td>0.725</td>
                  <td>0.714</td>
                  <td>0.72</td>
                  <td>0.72</td>
                </tr>
                <tr valign="top">
                  <td>Stable method (threshold=0.77)</td>
                  <td>0.65</td>
                  <td>0.765</td>
                  <td>0.703</td>
                  <td>0.571</td>
                  <td>0.668</td>
                  <td>0.67</td>
                </tr>
              </tbody>
            </table>
            <table-wrap-foot>
              <fn id="table4fn1">
                <p><sup>a</sup>FS: feature selection.</p>
              </fn>
              <fn id="table4fn2">
                <p><sup>b</sup>AUC: area under the curve.</p>
              </fn>
              <fn id="table4fn3">
                <p><sup>c</sup>IG: information gain.</p>
              </fn>
              <fn id="table4fn4">
                <p><sup>d</sup>RF: random forest.</p>
              </fn>
            </table-wrap-foot>
          </table-wrap>
        </sec>
      </sec>
      <sec>
        <title>Important Features and Explanation of the Models</title>
        <p>Although each FS approach works differently, we found several common features as being important (<xref rid="figure7" ref-type="fig">Figure 7</xref>). There were 3 entropy-based features that were used more than 80% of the time among all iterations of LOPOCV in each of the 4 FS approaches. These features included two that measure the entropy based on the app usage of weekdays and weekends spanning a 24-hour period, as well as the feature that calculated the average entropy of weekdays during 4 time intervals (morning, afternoon, evening, and night; <xref rid="figure7" ref-type="fig">Figure 7</xref>). Although we used 12 different types of data, 40% (n=14) of the top 35 important features (all features are presented in Table F2 of <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>) were based on entropy, hamming distance, and session data (<xref rid="figure7" ref-type="fig">Figure 7</xref>). In fact, at a threshold of 0.97 of the stable FS approach, 98% of iterations of LOPOCV contained the <italic>Weekday_Communication_Ratio_of_Hamming_6_Hour_Mean</italic> feature (Table F3 of <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>), which is also based on hamming distance data. The hamming distance presents the app usage uniqueness, whereas entropy presents the app usage pattern, which decreases with higher inequality in app usage data. This reveals that complex app usage patterns can reflect better differentiable behavior, which can output higher classification accuracy.</p>
        <p>In our extracted features, there were diurnal features presenting the app usage behavior in 6-hour intervals, as well as features based on the whole day. However, compared to the whole day’s app usage, we found a larger number of important features regarding diurnal app usage behavior (n=19, 54.3%, for diurnal usage vs n=16, 45.7%, for 24-hour usage; <xref rid="figure7" ref-type="fig">Figure 7</xref>). In particular, a higher number of features (n=12, 34.3%) regarding the deviation of app usage behavior over the night, morning, afternoon, and evening periods was selected as important. We also found that although only 22.9% (n=8) of the top 35 features were based on overall smartphone usage data (regardless of the app category), 77.1% (n=27) were based on different app categories. We found the Communication, Social, and Tools app category–based features to be especially superior (<xref rid="figure7" ref-type="fig">Figure 7</xref>).</p>
        <p>To explain the features’ impact on the ML models’ output, we used the SHAP approach. To check consistency, we explored the features’ impact on the training as well as the test data for the best individual model (LGBM; <xref rid="figure8" ref-type="fig">Figure 8</xref>a,b) and the best stacking model (<xref rid="figure8" ref-type="fig">Figure 8</xref>c,d). In LOPOCV, (N – 1) participants’ data were used for training and the remaining 1 participant’s data were used for testing purposes. Therefore, a participant appeared (N – 1) times during the training, whereas during the testing, a participant appeared only one time. This scenario is reflected in <xref rid="figure8" ref-type="fig">Figure 8</xref>, where there are more feature values in the summary plot based on training data. Interestingly, we observed consistency in the impact of the features on the model output. In the case of both training and testing data–based summary plots of the LGBM and stacking models, higher entropy in smartphone usage during the weekdays over a 24-hour period showed a negative impact (shifting the prediction toward the nondepressed group), while lower entropy showed a positive impact (moving toward the depressed group; <xref rid="figure8" ref-type="fig">Figure 8</xref>a-d). However, a higher mean entropy based on 4 time periods (ie, night, morning, afternoon, and evening) demonstrated an impact in the reverse direction (<xref rid="figure8" ref-type="fig">Figure 8</xref>a,b).</p>
        <p>We also found in the Communication category that having a higher mean ratio of hamming distances in the 4 time periods during weekdays increased the predicted probability toward the depressed group, showing a positive impact (<xref rid="figure8" ref-type="fig">Figure 8</xref>a,b). Similarly, we found that higher Photo and Video app usage on the weekends moved the predicted probability toward the depressed group (<xref rid="figure8" ref-type="fig">Figure 8</xref>a,b). However, in the Education category, more time spent on weekdays appeared to increase the probability toward the nondepressed group (<xref rid="figure8" ref-type="fig">Figure 8</xref>a,b).</p>
        <p>By local interpretations, we investigated how each participant’s class probability was impacted by different features. As a sample, we presented 2 participants’ group prediction approaches by the LGBM and stacking models, in which cases the prediction was accurate. We found that in the case of the nondepressed participant (ID 77), smartphone entropy based on a 24-hour period during the weekdays was 1.204 (<xref rid="figure9" ref-type="fig">Figure 9</xref>d), whereas in the case of the depressed participant (ID 46), this feature’s value was –0.148 (<xref rid="figure9" ref-type="fig">Figure 9</xref>a), which was much lower. This finding indicates the same relationship as that presented in the summary plot in <xref rid="figure8" ref-type="fig">Figure 8</xref>. Moreover, the higher SD over the day in the number of photo and video apps in the case of depressed participants (<xref rid="figure9" ref-type="fig">Figure 9</xref>a) compared to nondepressed participants (<xref rid="figure9" ref-type="fig">Figure 9</xref>c) reflected the findings demonstrated in <xref rid="figure8" ref-type="fig">Figure 8</xref>, where we found the higher SD classifying the predicted group as depressed. From <xref rid="figure9" ref-type="fig">Figure 9</xref>, it is also apparent that to predict the group of this participant, a relatively smaller number of features were used in the Boruta-selected feature-based stacking model. For example, to predict the group of the depressed participant, the stable feature-based LGBM model used 8 features (<xref rid="figure9" ref-type="fig">Figure 9</xref>a), whereas for the same participant, the Boruta-selected feature-based model used only 5 features (<xref rid="figure9" ref-type="fig">Figure 9</xref>b), although both the models’ predictions were correct.</p>
        <fig id="figure7" position="float">
          <label>Figure 7</label>
          <caption>
            <p>Top 35 features among the features used for the best set of top 5 classifiers based on the filter method IG (n=9 features), wrapper method Boruta (base estimator’s maximum depth=6), embedded method RF (n=12 features), and stable method (threshold=0.77). Here, features are ranked based on the mean appearance in the FS methods. The smartphone denotes data regardless of the app category. The values present the percentage of times (among all iterations of LOPOCV) a feature appeared. FS: feature selection; IG: information gain; LOPOCV: leave-one-participant-out cross-validation; RF: random forest.</p>
          </caption>
          <graphic xlink:href="formative_v7i1e28848_fig7.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <fig id="figure8" position="float">
          <label>Figure 8</label>
          <caption>
            <p>Summary plot showing the impact of features on the output of the LGBM model and the stacking model: (a, c) training data and (b, d) testing data. Features are ranked by importance, which is calculated based on Shapley values. Here, we present the features that appeared in all iterations of LOPOCV. LGBM: light gradient boosting machine; LOPOCV: leave-one-participant-out cross-validation; SHAP: Shapley additive explanations.</p>
          </caption>
          <graphic xlink:href="formative_v7i1e28848_fig8.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <fig id="figure9" position="float">
          <label>Figure 9</label>
          <caption>
            <p>Force plot showing the identification of a participant with depression (participant ID 46) and a participant without depression (participant ID 77) by the LGBM (a, c) and stacking (b, d) models. Text in bold color shows the probability of remaining in the respective class (depressed, nondepressed). (a, b) Text in blue color shows the features moving the predicted class to 1 (depressed), while text in red color shows the features moving the predicted class to 0 (nondepressed). (c, d) The direction is reversed. Numerical values after each feature present the standardized feature value in the case of the participant that was used in model development. LGBM: light gradient boosting machine.</p>
          </caption>
          <graphic xlink:href="formative_v7i1e28848_fig9.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Principal Findings and Comparison With Prior Work</title>
        <p>In this study, we presented Mon Majhi, a pervasive smartphone technology that aims to detect depression following a minimalistic approach in terms of data collection and detection time. It retrieves the past 7 days’ app usage behavioral data within 1 second (mean 307.94, SD 1103.91 ms). Compared to the existing promising systems that leverage various data, including sensed data [<xref ref-type="bibr" rid="ref19">19</xref>,<xref ref-type="bibr" rid="ref20">20</xref>,<xref ref-type="bibr" rid="ref28">28</xref>,<xref ref-type="bibr" rid="ref32">32</xref>,<xref ref-type="bibr" rid="ref36">36</xref>,<xref ref-type="bibr" rid="ref87">87</xref>], phone usage [<xref ref-type="bibr" rid="ref19">19</xref>,<xref ref-type="bibr" rid="ref20">20</xref>,<xref ref-type="bibr" rid="ref27">27</xref>,<xref ref-type="bibr" rid="ref28">28</xref>,<xref ref-type="bibr" rid="ref32">32</xref>,<xref ref-type="bibr" rid="ref35">35</xref>,<xref ref-type="bibr" rid="ref36">36</xref>], and network traffic [<xref ref-type="bibr" rid="ref89">89</xref>], our system is faster and minimalistic, as presented in <xref ref-type="table" rid="table5">Table 5</xref>. For instance, an existing state-of-the-art system [<xref ref-type="bibr" rid="ref20">20</xref>] required 106 days to collect data of an equal number of days, and using those data, the model correctly identified 84.7% of depressed participants. However, using only our system’s instantly (&lt;1 second) accessed 7 days’ data, our LGBM model correctly identified 82.4% of depressed participants. 
In addition, although previous studies have developed promising models to identify depressed participants, the systems in most studies rely on sensors, such as accelerometers [<xref ref-type="bibr" rid="ref28">28</xref>,<xref ref-type="bibr" rid="ref32">32</xref>], audio [<xref ref-type="bibr" rid="ref28">28</xref>,<xref ref-type="bibr" rid="ref32">32</xref>,<xref ref-type="bibr" rid="ref88">88</xref>], Bluetooth [<xref ref-type="bibr" rid="ref19">19</xref>,<xref ref-type="bibr" rid="ref20">20</xref>,<xref ref-type="bibr" rid="ref28">28</xref>], and GPS [<xref ref-type="bibr" rid="ref19">19</xref>-<xref ref-type="bibr" rid="ref21">21</xref>,<xref ref-type="bibr" rid="ref28">28</xref>,<xref ref-type="bibr" rid="ref32">32</xref>,<xref ref-type="bibr" rid="ref36">36</xref>,<xref ref-type="bibr" rid="ref88">88</xref>]. Using such sensors may be energy inefficient due to high power consumption (eg, by GPS [<xref ref-type="bibr" rid="ref41">41</xref>]), which significantly reduces the battery life [<xref ref-type="bibr" rid="ref41">41</xref>]. In addition, the need for current phone data–based systems [<xref ref-type="bibr" rid="ref19">19</xref>-<xref ref-type="bibr" rid="ref21">21</xref>,<xref ref-type="bibr" rid="ref27">27</xref>,<xref ref-type="bibr" rid="ref28">28</xref>,<xref ref-type="bibr" rid="ref32">32</xref>,<xref ref-type="bibr" rid="ref35">35</xref>,<xref ref-type="bibr" rid="ref88">88</xref>,<xref ref-type="bibr" rid="ref89">89</xref>] to run in the background may create reluctance as users want a long battery life [<xref ref-type="bibr" rid="ref90">90</xref>] and running services in the background increases power consumption [<xref ref-type="bibr" rid="ref91">91</xref>]. Moreover, students may not use systems for assessing mental health that negatively impact battery life [<xref ref-type="bibr" rid="ref92">92</xref>]. Our system, on the other hand, does not use any such sensors or run in the background. 
We also do not need to run any resource-intensive systems (eg, a conversation classifier [<xref ref-type="bibr" rid="ref32">32</xref>] or an audio signal processor [<xref ref-type="bibr" rid="ref88">88</xref>]) to extract behavioral data. Instead, we perform simple mathematical calculations for feature extraction, which makes our system cheap, minimalistic, and largely scalable for resource-constrained settings. Our system can also be complementary to existing systems where faster detection can be followed by other systems for long-term evaluation. The minimalistic design opens opportunities for this system to be used in low-resource settings, such as an LMIC like Bangladesh.</p>
        <p>Based on all evaluation metrics, our best stacking model had a performance of over 75%, while the robust models in a study [<xref ref-type="bibr" rid="ref35">35</xref>] based on phone usage and internet connectivity had a performance of over 85% with a maximum accuracy of 98.1%. However, in addition to the general limitations discussed before, their models were limited by several other factors. For example, when classifying responses and considering that approximately 50% of participants had more than one response, it becomes possible for the same participants’ responses to appear in both the training and testing data sets. This introduces the potential for biased models and overestimated performance [<xref ref-type="bibr" rid="ref93">93</xref>]. Similarly, compared to a study by Saeb et al [<xref ref-type="bibr" rid="ref27">27</xref>] where researchers developed ML models solely based on phone usage data, our stacking model demonstrated 18.4% higher sensitivity than their best model. There can be several reasons behind this enhanced performance. For instance, our feature importance analysis showed that a higher number of features pertaining to diurnal usage data are more important than the 24-hour aggregated data, which was unexplored by Saeb et al [<xref ref-type="bibr" rid="ref27">27</xref>]. In the SHAP analysis, we found that a higher entropy based on smartphone usage in 24 hours of weekdays increased the model’s predicted probability toward the nondepressed group, while an increase in average entropy in the 4 time periods of a day increased the predicted probability toward the depressed group. This also indicates that the diurnal usage pattern is different from the whole day’s behavior. Additionally, in our study, features regarding entropy, hamming distance, and session data appeared as important, which also remained unexplored in the previous study [<xref ref-type="bibr" rid="ref27">27</xref>]. 
At a threshold of 0.77 of the stable FS approach, a feature regarding the hamming distance appeared in each iteration of LOPOCV, where we found the best individual model: LGBM (precision=75%, sensitivity=82.4%). In addition, we found that a higher number of features based on app categories was important compared to the aggregated data regardless of app category. Behavioral markers of the particular app categories are associated with depression [<xref ref-type="bibr" rid="ref25">25</xref>,<xref ref-type="bibr" rid="ref26">26</xref>] and also with the rhythmic patterns of our body [<xref ref-type="bibr" rid="ref95">95</xref>], as presented by researchers through conventional statistical methods [<xref ref-type="bibr" rid="ref25">25</xref>,<xref ref-type="bibr" rid="ref26">26</xref>,<xref ref-type="bibr" rid="ref94">94</xref>] and also by a qualitative study [<xref ref-type="bibr" rid="ref94">94</xref>]. Therefore, our findings suggest that while developing ML models, instead of leveraging only the aggregated phone usage data, as in the previous studies [<xref ref-type="bibr" rid="ref19">19</xref>-<xref ref-type="bibr" rid="ref21">21</xref>,<xref ref-type="bibr" rid="ref27">27</xref>,<xref ref-type="bibr" rid="ref28">28</xref>,<xref ref-type="bibr" rid="ref32">32</xref>,<xref ref-type="bibr" rid="ref35">35</xref>], incorporation of the features regarding app categories and extraction of features such as hamming distance may improve the performance of the ML models.</p>
        <table-wrap position="float" id="table5">
          <label>Table 5</label>
          <caption>
            <p>Comparison of our system’s performance with that of previous studies using pervasive devices to identify depressed and nondepressed participants. Researchers used binary classification in the included studies. The time required to collect data in each study based on the description of the data collection tool is reported.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="100"/>
            <col width="110"/>
            <col width="110"/>
            <col width="90"/>
            <col width="70"/>
            <col width="50"/>
            <col width="70"/>
            <col width="70"/>
            <col width="70"/>
            <col width="70"/>
            <col width="90"/>
            <col width="70"/>
            <thead>
              <tr valign="top">
                <td colspan="2">Reference and country (if available)</td>
                <td>Sample size for models, N</td>
                <td>Collected data</td>
                <td>System needs to run in the background</td>
                <td>Duration of explored data</td>
                <td>Time to retrieve data</td>
                <td>Accuracy</td>
                <td>Precision</td>
                <td>Sensitivity</td>
                <td>Specificity</td>
                <td>AUC<sup>a</sup> score</td>
                <td><italic>F</italic><sub>1</sub>-score</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="13">
                  <bold>Xu et al [<xref ref-type="bibr" rid="ref19">19</xref>], United States</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Data set 1</td>
                <td>138</td>
                <td>Fitbit sensed, phone sensed, usage</td>
                <td>Yes</td>
                <td>106 days</td>
                <td>106 days</td>
                <td>0.807 and 0.818</td>
                <td>0.765 and 0.843</td>
                <td>0.886 and 0.843</td>
                <td>—<sup>b</sup></td>
                <td>—</td>
                <td>0.821 and 0.843</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Data set 2</td>
                <td>212</td>
                <td>Fitbit sensed, phone sensed, usage</td>
                <td>Yes</td>
                <td>113 days</td>
                <td>113 days</td>
                <td>0.689-0.840</td>
                <td>0.757-0.877</td>
                <td>0.779-0.907</td>
                <td>—</td>
                <td>—</td>
                <td>0.768-0.881</td>
              </tr>
              <tr valign="top">
                <td colspan="13">
                  <bold>Xu et al [<xref ref-type="bibr" rid="ref20">20</xref>], United States</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Data set 1</td>
                <td>138</td>
                <td>Fitbit sensed, phone sensed, usage</td>
                <td>Yes</td>
                <td>106 days</td>
                <td>106 days</td>
                <td>0.825</td>
                <td>0.862</td>
                <td>0.847</td>
                <td>—</td>
                <td>—</td>
                <td>0.855</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Data set 2</td>
                <td>169</td>
                <td>Fitbit sensed, phone sensed, usage</td>
                <td>Yes</td>
                <td>166 days</td>
                <td>166 days</td>
                <td>0.791</td>
                <td>0.814</td>
                <td>0.854</td>
                <td>—</td>
                <td>—</td>
                <td>0.833</td>
              </tr>
              <tr valign="top">
                <td colspan="2">Wang et al [<xref ref-type="bibr" rid="ref32">32</xref>], United States</td>
                <td>83</td>
                <td>Microsoft Band sensed, phone sensed, usage</td>
                <td>Yes</td>
                <td>63 days (9-week terms)</td>
                <td>63 days</td>
                <td>—</td>
                <td>0.691</td>
                <td>0.815</td>
                <td>—</td>
                <td>0.809</td>
                <td>—</td>
              </tr>
              <tr valign="top">
                <td colspan="2">Saeb et al [<xref ref-type="bibr" rid="ref27">27</xref>], United States</td>
                <td>21 (for phone usage data-based analysis)</td>
                <td>Phone usage</td>
                <td>Yes</td>
                <td>14 days</td>
                <td>14 days</td>
                <td>Mean 0.742 (SD 0.034)</td>
                <td>—</td>
                <td>Mean 0.640</td>
                <td>Mean 0.839</td>
                <td>—</td>
                <td>—</td>
              </tr>
              <tr valign="top">
                <td colspan="2">Nickels et al [<xref ref-type="bibr" rid="ref28">28</xref>], United States</td>
                <td>186 and 197</td>
                <td>Phone sensed, usage</td>
                <td>Yes</td>
                <td>84 days</td>
                <td>84 days</td>
                <td>—</td>
                <td>—</td>
                <td>—</td>
                <td>—</td>
                <td>Mean 0.620 (SD 0.062) and mean 0.656 (SD 0.079)</td>
                <td>—</td>
              </tr>
              <tr valign="top">
                <td colspan="2">Opoku et al [<xref ref-type="bibr" rid="ref35">35</xref>], mostly developed countries</td>
                <td>629</td>
                <td>Phone usage, internet, demography</td>
                <td>Yes</td>
                <td>Mean 22.1 (SD 17.9) days</td>
                <td>Mean 22.1 (SD 17.9) days</td>
                <td>0.964-0.981</td>
                <td>0.856-0.925</td>
                <td>0.922-0.956</td>
                <td>—</td>
                <td>0.947-0.991</td>
                <td>0.887-0.940</td>
              </tr>
              <tr valign="top">
                <td colspan="2">Opoku et al [<xref ref-type="bibr" rid="ref36">36</xref>]</td>
                <td>54</td>
                <td>Demographics, Oura ring sensed, phone sensed, usage</td>
                <td>Yes</td>
                <td>Mean 28.21 days</td>
                <td>Mean 28.21 days</td>
                <td>0.814</td>
                <td>Dep<sup>c</sup>: 0.6997<break/>Nondep<sup>d</sup>: 0.841</td>
                <td>0.505</td>
                <td>0.924</td>
                <td>0.823</td>
                <td>Dep: 0.587<break/>Nondep: 0.880</td>
              </tr>
              <tr valign="top">
                <td colspan="13">
                  <bold>Dogrucu et al [<xref ref-type="bibr" rid="ref88">88</xref>]</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>PHQ-9<sup>e</sup> cutoff score=10 and undersampling</td>
                <td>294</td>
                <td>Contacts, GPS, call log, social media, voice recording</td>
                <td>Yes</td>
                <td>14 days</td>
                <td>—</td>
                <td>0.588</td>
                <td>0.599</td>
                <td>0.554</td>
                <td>0.623</td>
                <td>—</td>
                <td>0.575</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>PHQ-9 cutoff score=20 and undersampling</td>
                <td>96</td>
                <td>Contacts, GPS, call log, social media, voice recording</td>
                <td>Yes</td>
                <td>14 days</td>
                <td>—</td>
                <td>0.771</td>
                <td>0.783</td>
                <td>0.75</td>
                <td>0.792</td>
                <td>—</td>
                <td>0.766</td>
              </tr>
              <tr valign="top">
                <td colspan="13">
                  <bold>Yue et al [<xref ref-type="bibr" rid="ref89">89</xref>], United States</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>iOS users</td>
                <td>40</td>
                <td>Network traffic</td>
                <td>Yes</td>
                <td>Several months</td>
                <td>Several months</td>
                <td>—</td>
                <td>0.71</td>
                <td>0.71</td>
                <td>0.63</td>
                <td>—</td>
                <td>0.71</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Android users</td>
                <td>13</td>
                <td>Network traffic, screen on-off</td>
                <td>Yes</td>
                <td>Several months</td>
                <td>Several months</td>
                <td>—</td>
                <td>0.75</td>
                <td>0.86</td>
                <td>0.77</td>
                <td>—</td>
                <td>0.80</td>
              </tr>
              <tr valign="top">
                <td colspan="13">
                  <bold>This study, Bangladesh</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Performance of our best single classifier–based model: LGBM<sup>f</sup></td>
                <td>100</td>
                <td>Phone usage data</td>
                <td>No</td>
                <td>Past 7 days</td>
                <td>Mean 307.94 (SD 1103.91) ms</td>
                <td>0.770</td>
                <td>0.750</td>
                <td>0.824</td>
                <td>0.714</td>
                <td>0.769</td>
                <td>0.785</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Performance of our best stacking model based on the top 5 classifiers</td>
                <td>100</td>
                <td>Phone usage data</td>
                <td>No</td>
                <td>Past 7 days</td>
                <td>Mean 307.94 (SD 1103.91) ms</td>
                <td>0.780</td>
                <td>0.774</td>
                <td>0.804</td>
                <td>0.755</td>
                <td>0.780</td>
                <td>0.788</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table5fn1">
              <p><sup>a</sup>AUC: area under the curve.</p>
            </fn>
            <fn id="table5fn2">
              <p><sup>b</sup>Not available.</p>
            </fn>
            <fn id="table5fn3">
              <p><sup>c</sup>Dep: depressed.</p>
            </fn>
            <fn id="table5fn4">
              <p><sup>d</sup>Nondep: nondepressed.</p>
            </fn>
            <fn id="table5fn5">
              <p><sup>e</sup>PHQ-9: Patient Health Questionnaire-9.</p>
            </fn>
            <fn id="table5fn6">
              <p><sup>f</sup>LGBM: light gradient boosting machine.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
      <sec>
        <title>Implications of Study Findings</title>
        <p>In the stable FS approach, starting from a threshold of 0.5, we gradually increased the threshold by 0.01 until there remained 0 features and we found the best model in selecting the features that appeared at least 77% of the time among the 1000 bootstrapped subsamples. This finding highlights the need for empirical investigation of the threshold while using the stable FS approach. This finding also extends previous studies that have used random thresholds of 0.25 [<xref ref-type="bibr" rid="ref75">75</xref>] and 0.75 [<xref ref-type="bibr" rid="ref76">76</xref>] to select features for depression identification and also in other contexts (eg, Ing et al [<xref ref-type="bibr" rid="ref95">95</xref>] used a threshold of 0.90 in neurobehavioral symptom identification). While comparing FS approaches, we found that to achieve the same performance (precision=73.1%, sensitivity=74.5%) as an ML model developed using around 5 features selected by Boruta, we need 6, 9, and ~14 features of the filter, wrapper, and stable approaches, respectively. In fact, using those 5 features of Boruta, our stacking model performed the best (precision=77.4%, balanced accuracy=77.95%). Unlike other FS approaches, selecting all-relevant features in Boruta [<xref ref-type="bibr" rid="ref73">73</xref>], instead of selecting minimal-optimal features, can be a plausible reason for having better performance. Higher performance with a relatively lower number of features demonstrates the development of a parsimonious model that can have potential for resource-constrained settings where the usage of a higher number of features can increase the computational models’ complexity and use relatively more resources. Additionally, the parsimonious model, based on all-relevant features in particular, can have potential implications in presenting plausible behavioral markers for intervention.</p>
        <p>After comparing the performance of the ML models, we found the GB-based models GB, XGB, and LGBM to be superior, although we developed models using a baseline dummy classifier and 13 different classification algorithms, including the support vector, KNN, Logit, and neural network (MLP) algorithms, where each model was developed based on features selected by 4 different FS methods. In the GB ML models, the weak learners are converted to strong learners by correcting the predecessors through the gradient descent algorithm [<xref ref-type="bibr" rid="ref82">82</xref>], and GB can effectively handle a complex relationship with nonlinearity [<xref ref-type="bibr" rid="ref96">96</xref>]. This is reflected in the findings of our study, where we found better performance among GB-based models compared to linear models, such as Logit. In particular, we found the LGBM to be one of the top 5 classifiers among models based on features selected by each of the 4 methods. In fact, the best individual ML model was based on the LGBM algorithm, as mentioned before. A plausible reason for having better performance is the leafwise growth of the LGBM, which makes the model complex and also increases the complex relation-learning capability. Although complexity increases the possibility to have an overfitted model, we used the nested CV method, which is used for overfitting prevention and has an unbiased performance [<xref ref-type="bibr" rid="ref83">83</xref>]. Our findings suggest that while using behavioral data for developing ML models to identify depression, GB-based ML algorithms, particularly the LGBM, may be a preferable choice, considering their lower consumption of memory and higher speed in computation [<xref ref-type="bibr" rid="ref80">80</xref>].</p>
        <p>While explaining the LGBM model through the SHAP method [<xref ref-type="bibr" rid="ref87">87</xref>], it appeared that the greater the time spent on apps in the Education category during the weekday, the lower the probability of being depressed. In this study, apps including Zoom, Google Meet, and Google Classroom were in this category, and in Bangladesh, these apps have been used for online learning since the start of the COVID-19 pandemic [<xref ref-type="bibr" rid="ref68">68</xref>]. Using these apps, students can support and communicate with their classmates and teachers. The positive impact of peer support on mental health [<xref ref-type="bibr" rid="ref97">97</xref>] explains the plausible reason for the association with a lower probability of being depressed. A SHAP analysis of the model also showed that the higher number of photo and video apps used and also the higher deviation over the day in terms of the number of apps used in this category on the weekends increase the predictive probability toward the depressed group. The photos of depressed users are different, where their photos appear to be grayer, bluer, and darker [<xref ref-type="bibr" rid="ref98">98</xref>]. In addition, studies have shown that those with mental health problems post photos on social media [<xref ref-type="bibr" rid="ref99">99</xref>] and watch videos on YouTube [<xref ref-type="bibr" rid="ref100">100</xref>] to share thoughts and seek support to overcome their problems. Therefore, as different apps have different features, the usage of a higher number of photo and video apps by depressed individuals can present their support-seeking behavior, which they prefer to do in a particular period of the day as there is a higher deviation over the day. Extending the previous studies [<xref ref-type="bibr" rid="ref99">99</xref>,<xref ref-type="bibr" rid="ref100">100</xref>], these findings show that in addition to visual attributes in social media, the behavioral features regarding the number of photo and video apps can also distinguish people who are or are not depressed. Meanwhile, in the case of the Communication category, we found that a higher ratio of Hamming distances in communication apps is likely to increase the probability of being depressed, which denotes that depressed individuals are more likely to use a higher number of different communication apps. This finding is in line with a previous study [<xref ref-type="bibr" rid="ref26">26</xref>] conducted using the conventional statistical method, which demonstrated the diverse nature of app usage among depressed people presenting their support-seeking behavior. Thus, going beyond depression identification, these explanations through SHAP analysis have the potential to help mental health care professionals better understand depressed individuals and take steps for intervention accordingly.</p>
      </sec>
      <sec>
        <title>Strengths and Limitations</title>
        <p>Through our developed system Mon Majhi, we have contributed to the mobile and ubiquitous health research area in the following ways:</p>
        <list list-type="bullet">
          <list-item>
            <p>Using only data retrieved in 1 second (mean 307.94, SD 1103.91 ms), our ML model correctly identified 82.4% of depressed individuals. To the best of our knowledge, in identifying a psychological problem, our approach is faster and more minimalistic than any other existing smartphone data–based system, which can enable our system to be largely scalable in resource-constrained settings, such as in LMICs.</p>
          </list-item>
          <list-item>
            <p>We presented important behavioral markers and the best ML models after selecting features via 3 main types of FS approaches along with the stable approach and also after developing ML models based on 13 different classification algorithms. Due to the large exploration, our findings can have real-world implications. In addition, after a comprehensive exploration, we presented a parsimonious model based on features selected by the all-relevant FS method Boruta, which showed better predictability with a lower number of features. This can have potential for future studies to develop parsimonious computational models to identify psychological problems in low-resource settings leveraging behavioral data.</p>
          </list-item>
          <list-item>
            <p>Through explainable ML techniques, we interpreted the models where we demonstrated how different behavioral features impact predicting depression and also discussed the implications that can have potential for understanding the smartphone usage behavior of depressed students and in taking steps for intervention.</p>
          </list-item>
        </list>
        <p>Our study was limited by the small sample size (N=100). Although there was diversity among the participants in terms of regions, institutions, and departments, and we used state-of-the-art methods to evaluate ML models, due to having a small sample size comprising mostly male participants, evaluation of a large sample is needed before applying the system in the real world. Additionally, while translating the PHQ-9 [<xref ref-type="bibr" rid="ref53">53</xref>], we removed the word “dead” from the ninth item (eg, considering the students’ concerns about the word “dead” [<xref ref-type="bibr" rid="ref92">92</xref>]) through a process that is described in detail in section B of <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>. It should be noted that even after we removed the ninth item completely and considered the cutoff score of the 8-item Patient Health Questionnaire-8 (score ≥10: depressed) [<xref ref-type="bibr" rid="ref101">101</xref>], all the depressed participants were still categorized as depressed. It is worthwhile to mention that since we constructed the data set of this study amid the COVID-19 pandemic in 2020 when classes were online, it was difficult to reach out to a large number of participants. However, we have been conducting a countrywide study where we have overcome the aforementioned limitations and constructed a large-scale data set. In our future work, we expect to present a more robust system to the research community.</p>
      </sec>
      <sec>
        <title>Conclusion</title>
        <p>The performance of our system Mon Majhi showed that depressed and nondepressed students can be classified accurately, quickly, and unobtrusively with minimal data. Although we developed models using a diverse set of ML algorithms, we found that the LGBM model using only instantly accessed data (&lt;1 second) can correctly identify 82.4% of depressed students, with a precision of 75%. Additionally, we found the stacking model based on the all-relevant FS approach Boruta (sensitivity=80.4%, precision=77.4%) to be a parsimonious model due to higher performance with a lower number of features. Through a SHAP analysis, we also demonstrated how different app usage behavioral markers impact the models. These findings are novel and show the feasibility of our minimal system for faster depression prediction. Hence, we believe that our system can facilitate minimization of depression rates in low-resource settings.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group>
      <supplementary-material id="app1">
        <label>Multimedia Appendix 1</label>
        <p>Description and analyses.</p>
        <media xlink:href="formative_v7i1e28848_app1.docx" xlink:title="DOCX File, 267 KB"/>
      </supplementary-material>
    </app-group>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">API</term>
          <def>
            <p>application programming interface</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">BDT</term>
          <def>
            <p>Bangladeshi Taka</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">CV</term>
          <def>
            <p>cross-validation</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">DT</term>
          <def>
            <p>decision tree</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">FS</term>
          <def>
            <p>feature selection</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb6">GB</term>
          <def>
            <p>gradient boost</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb7">IG</term>
          <def>
            <p>information gain</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb8">KNN</term>
          <def>
            <p>K-nearest neighbor</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb9">LGBM</term>
          <def>
            <p>light gradient boosting machine</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb10">LMIC</term>
          <def>
            <p>low- and middle-income country</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb11">Logit</term>
          <def>
            <p>logistic regression</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb12">LOPOCV</term>
          <def>
            <p>leave-one-participant-out cross-validation</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb13">ML</term>
          <def>
            <p>machine learning</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb14">MLP</term>
          <def>
            <p>multilayer perceptron</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb15">PCP</term>
          <def>
            <p>primary care provider</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb16">PHQ-9</term>
          <def>
            <p>Patient Health Questionnaire-9</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb17">RF</term>
          <def>
            <p>random forest</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb18">SHAP</term>
          <def>
            <p>Shapley additive explanations</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb19">XGB</term>
          <def>
            <p>XGBoost</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>We thank all participants who voluntarily donated data. We are grateful to Tanvir Hasan and the faculties of the various universities that supported us in the data collection phase.</p>
      <p>All authors declared that they had insufficient or no funding to support open access publication of this manuscript, including from affiliated organizations or institutions, funding agencies, or other organizations. JMIR Publications provided article processing fee (APF) support for the publication of this article.</p>
    </ack>
    <sec>
      <title>Data Availability</title>
      <p>The data sets generated during and/or analyzed during this study are not publicly available due to data privacy and safety issues but are available from the corresponding author on reasonable request.</p>
    </sec>
    <fn-group>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="web">
          <article-title>Global health data exchange (GHDx)</article-title>
          <source>Institute for Health Metrics and Evaluation</source>
          <year>2019</year>
          <access-date>2022-04-23</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://ghdx.healthdata.org/gbd-results-tool?params=gbd-api-2019-permalink/d780dffbe8a381b25e1416884959e88b">http://ghdx.healthdata.org/gbd-results-tool?params=gbd-api-2019-permalink/d780dffbe8a381b25e1416884959e88b</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="web">
          <article-title>80% of depression burden is among people living in low- and middle-income countries (LMICs)</article-title>
          <source>European Commission</source>
          <year>2017</year>
          <access-date>2022-05-20</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://cordis.europa.eu/article/id/134176-80-of-depression-burden-is-among-people-living-in-low-and-middleincome-countries-lmics/fr">https://cordis.europa.eu/article/id/134176-80-of-depression-burden-is-among-people-living-in-low-and-middleincome-countries-lmics/fr</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="web">
          <article-title>National Mental Health Survey of Bangladesh 2018-19: provisional fact sheet</article-title>
          <source>World Health Organization</source>
          <access-date>2023-04-29</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.who.int/docs/default-source/searo/bangladesh/pdf-reports/cat-2/nimh-fact-sheet-5-11-19.pdf?sfvrsn=3e62d4b0_2">https://www.who.int/docs/default-source/searo/bangladesh/pdf-reports/cat-2/nimh-fact-sheet-5-11-19.pdf?sfvrsn=3e62d4b0_2</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hosen</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Al-Mamun</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Mamun</surname>
              <given-names>MA</given-names>
            </name>
          </person-group>
          <article-title>Prevalence and risk factors of the symptoms of depression, anxiety, and stress during the COVID-19 pandemic in Bangladesh: a systematic review and meta-analysis</article-title>
          <source>Glob Ment Health (Camb)</source>
          <year>2021</year>
          <volume>8</volume>
          <fpage>e47</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/35145709"/>
          </comment>
          <pub-id pub-id-type="doi">10.1017/gmh.2021.49</pub-id>
          <pub-id pub-id-type="medline">35145709</pub-id>
          <pub-id pub-id-type="pii">S2054425121000492</pub-id>
          <pub-id pub-id-type="pmcid">PMC8794743</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Goodwin</surname>
              <given-names>GM</given-names>
            </name>
          </person-group>
          <article-title>Depression and associated physical diseases and symptoms</article-title>
          <source>Dialogues Clin Neurosci</source>
          <year>2006</year>
          <volume>8</volume>
          <issue>2</issue>
          <fpage>259</fpage>
          <lpage>265</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/16889110"/>
          </comment>
          <pub-id pub-id-type="doi">10.31887/DCNS.2006.8.2/mgoodwin</pub-id>
          <pub-id pub-id-type="medline">16889110</pub-id>
          <pub-id pub-id-type="pmcid">PMC3181771</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Marshall</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>The hidden links between mental disorders</article-title>
          <source>Nature</source>
          <year>2020</year>
          <month>05</month>
          <day>05</day>
          <volume>581</volume>
          <issue>7806</issue>
          <fpage>19</fpage>
          <lpage>21</lpage>
          <pub-id pub-id-type="doi">10.1038/d41586-020-00922-8</pub-id>
          <pub-id pub-id-type="medline">32372044</pub-id>
          <pub-id pub-id-type="pii">10.1038/d41586-020-00922-8</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="web">
          <article-title>Depression</article-title>
          <source>World Health Organization</source>
          <access-date>2022-04-23</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.who.int/news-room/fact-sheets/detail/depression">https://www.who.int/news-room/fact-sheets/detail/depression</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Coyne</surname>
              <given-names>JC</given-names>
            </name>
            <name name-style="western">
              <surname>Schwenk</surname>
              <given-names>TL</given-names>
            </name>
            <name name-style="western">
              <surname>Fechner-Bates</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Nondetection of depression by primary care physicians reconsidered</article-title>
          <source>Gen Hosp Psychiatry</source>
          <year>1995</year>
          <month>01</month>
          <volume>17</volume>
          <issue>1</issue>
          <fpage>3</fpage>
          <lpage>12</lpage>
          <pub-id pub-id-type="doi">10.1016/0163-8343(94)00056-j</pub-id>
          <pub-id pub-id-type="medline">7737492</pub-id>
          <pub-id pub-id-type="pii">016383439400056J</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Cepoiu</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>McCusker</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Cole</surname>
              <given-names>MG</given-names>
            </name>
            <name name-style="western">
              <surname>Sewitch</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Ciampi</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Recognition of depression in older medical inpatients</article-title>
          <source>J Gen Intern Med</source>
          <year>2007</year>
          <month>05</month>
          <volume>22</volume>
          <issue>5</issue>
          <fpage>559</fpage>
          <lpage>564</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/17443361"/>
          </comment>
          <pub-id pub-id-type="doi">10.1007/s11606-006-0085-0</pub-id>
          <pub-id pub-id-type="medline">17443361</pub-id>
          <pub-id pub-id-type="pmcid">PMC1852909</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chesney</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Goodwin</surname>
              <given-names>GM</given-names>
            </name>
            <name name-style="western">
              <surname>Fazel</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Risks of all-cause and suicide mortality in mental disorders: a meta-review</article-title>
          <source>World Psychiatry</source>
          <year>2014</year>
          <month>06</month>
          <day>02</day>
          <volume>13</volume>
          <issue>2</issue>
          <fpage>153</fpage>
          <lpage>160</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/24890068"/>
          </comment>
          <pub-id pub-id-type="doi">10.1002/wps.20128</pub-id>
          <pub-id pub-id-type="medline">24890068</pub-id>
          <pub-id pub-id-type="pmcid">PMC4102288</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ng</surname>
              <given-names>CWM</given-names>
            </name>
            <name name-style="western">
              <surname>How</surname>
              <given-names>CH</given-names>
            </name>
            <name name-style="western">
              <surname>Ng</surname>
              <given-names>YP</given-names>
            </name>
          </person-group>
          <article-title>Depression in primary care: assessing suicide risk</article-title>
          <source>Singapore Med J</source>
          <year>2017</year>
          <month>03</month>
          <volume>58</volume>
          <issue>2</issue>
          <fpage>72</fpage>
          <lpage>77</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/28210741"/>
          </comment>
          <pub-id pub-id-type="doi">10.11622/smedj.2017006</pub-id>
          <pub-id pub-id-type="medline">28210741</pub-id>
          <pub-id pub-id-type="pii">j58/2/72</pub-id>
          <pub-id pub-id-type="pmcid">PMC5311887</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kraus</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Kadriu</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Lanzenberger</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Zarate</surname>
              <given-names>CA</given-names>
            </name>
            <name name-style="western">
              <surname>Kasper</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Prognosis and improved outcomes in major depression: a review</article-title>
          <source>Transl Psychiatry</source>
          <year>2019</year>
          <month>04</month>
          <day>03</day>
          <volume>9</volume>
          <issue>1</issue>
          <fpage>127</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/s41398-019-0460-3"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41398-019-0460-3</pub-id>
          <pub-id pub-id-type="medline">30944309</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41398-019-0460-3</pub-id>
          <pub-id pub-id-type="pmcid">PMC6447556</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zulfiker</surname>
              <given-names>MS</given-names>
            </name>
            <name name-style="western">
              <surname>Kabir</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Biswas</surname>
              <given-names>AA</given-names>
            </name>
            <name name-style="western">
              <surname>Nazneen</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Uddin</surname>
              <given-names>MS</given-names>
            </name>
          </person-group>
          <article-title>An in-depth analysis of machine learning approaches to predict depression</article-title>
          <source>Curr Res Behav Sci</source>
          <year>2021</year>
          <month>11</month>
          <volume>2</volume>
          <fpage>100044</fpage>
          <pub-id pub-id-type="doi">10.1016/j.crbeha.2021.100044</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Munir</surname>
              <given-names>U</given-names>
            </name>
            <name name-style="western">
              <surname>Kaiser</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Islam</surname>
              <given-names>U</given-names>
            </name>
            <name name-style="western">
              <surname>Siddiqui</surname>
              <given-names>F</given-names>
            </name>
          </person-group>
          <person-group person-group-type="editor">
            <name name-style="western">
              <surname>Kaiser</surname>
              <given-names>MS</given-names>
            </name>
            <name name-style="western">
              <surname>Ray</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Bandyopadhyay</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Jacob</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Long</surname>
              <given-names>KS</given-names>
            </name>
          </person-group>
          <article-title>Machine learning classification algorithms for predicting depression among university students in Bangladesh</article-title>
          <source>Proceedings of the Third International Conference on Trends in Computational and Cognitive Engineering. Lecture Notes in Networks and Systems, vol 348</source>
          <year>2022</year>
          <publisher-loc>Singapore</publisher-loc>
          <publisher-name>Springer</publisher-name>
          <fpage>69</fpage>
          <lpage>80</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Xin</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Ren</surname>
              <given-names>X</given-names>
            </name>
          </person-group>
          <article-title>Predicting depression among rural and urban disabled elderly in China using a random forest classifier</article-title>
          <source>BMC Psychiatry</source>
          <year>2022</year>
          <month>03</month>
          <day>15</day>
          <volume>22</volume>
          <issue>1</issue>
          <fpage>118</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcpsychiatry.biomedcentral.com/articles/10.1186/s12888-022-03742-4"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12888-022-03742-4</pub-id>
          <pub-id pub-id-type="medline">35168579</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12888-022-03742-4</pub-id>
          <pub-id pub-id-type="pmcid">PMC8845343</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Voelker</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Joshi</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Daly</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Papademetriou</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Rotter</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Sheehan</surname>
              <given-names>JJ</given-names>
            </name>
            <name name-style="western">
              <surname>Kuvadia</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Dasgupta</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Potluri</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>How well do clinical and demographic characteristics predict Patient Health Questionnaire-9 scores among patients with treatment-resistant major depressive disorder in a real-world setting?</article-title>
          <source>Brain Behav</source>
          <year>2021</year>
          <month>03</month>
          <volume>11</volume>
          <issue>2</issue>
          <fpage>e02000</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/33403828"/>
          </comment>
          <pub-id pub-id-type="doi">10.1002/brb3.2000</pub-id>
          <pub-id pub-id-type="medline">33403828</pub-id>
          <pub-id pub-id-type="pmcid">PMC7882175</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Haque</surname>
              <given-names>UM</given-names>
            </name>
            <name name-style="western">
              <surname>Kabir</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Khanam</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Detection of child depression using machine learning methods</article-title>
          <source>PLoS One</source>
          <year>2021</year>
          <volume>16</volume>
          <issue>12</issue>
          <fpage>e0261131</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dx.plos.org/10.1371/journal.pone.0261131"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pone.0261131</pub-id>
          <pub-id pub-id-type="medline">34914728</pub-id>
          <pub-id pub-id-type="pii">PONE-D-21-30505</pub-id>
          <pub-id pub-id-type="pmcid">PMC8675644</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Doryab</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Villalba</surname>
              <given-names>DK</given-names>
            </name>
            <name name-style="western">
              <surname>Chikersal</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Dutcher</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Tumminia</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Cohen</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Creswell</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Mankoff</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Creswell</surname>
              <given-names>JD</given-names>
            </name>
            <name name-style="western">
              <surname>Dey</surname>
              <given-names>AK</given-names>
            </name>
          </person-group>
          <article-title>Identifying behavioral phenotypes of loneliness and social isolation with passive sensing: statistical analysis, data mining and machine learning of smartphone and Fitbit data</article-title>
          <source>JMIR Mhealth Uhealth</source>
          <year>2019</year>
          <month>07</month>
          <day>24</day>
          <volume>7</volume>
          <issue>7</issue>
          <fpage>e13209</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://mhealth.jmir.org/2019/7/e13209/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/13209</pub-id>
          <pub-id pub-id-type="medline">31342903</pub-id>
          <pub-id pub-id-type="pii">v7i7e13209</pub-id>
          <pub-id pub-id-type="pmcid">PMC6685126</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Chikersal</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Doryab</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Villalba</surname>
              <given-names>DK</given-names>
            </name>
            <name name-style="western">
              <surname>Dutcher</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Tumminia</surname>
              <given-names>MJ</given-names>
            </name>
            <name name-style="western">
              <surname>Althoff</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Cohen</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Creswell</surname>
              <given-names>KG</given-names>
            </name>
            <name name-style="western">
              <surname>Creswell</surname>
              <given-names>JD</given-names>
            </name>
            <name name-style="western">
              <surname>Mankoff</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Dey</surname>
              <given-names>AK</given-names>
            </name>
          </person-group>
          <article-title>Leveraging routine behavior and contextually-filtered features for depression detection among college students</article-title>
          <source>Proc ACM Interact Mob Wearable Ubiquitous Technol</source>
          <year>2019</year>
          <month>09</month>
          <day>09</day>
          <volume>3</volume>
          <issue>3</issue>
          <fpage>1</fpage>
          <lpage>33</lpage>
          <pub-id pub-id-type="doi">10.1145/3351274</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Chikersal</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Dutcher</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Sefidgar</surname>
              <given-names>YS</given-names>
            </name>
            <name name-style="western">
              <surname>Seo</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Tumminia</surname>
              <given-names>MJ</given-names>
            </name>
            <name name-style="western">
              <surname>Villalba</surname>
              <given-names>DK</given-names>
            </name>
            <name name-style="western">
              <surname>Cohen</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Creswell</surname>
              <given-names>KG</given-names>
            </name>
            <name name-style="western">
              <surname>Creswell</surname>
              <given-names>JD</given-names>
            </name>
            <name name-style="western">
              <surname>Doryab</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Nurius</surname>
              <given-names>PS</given-names>
            </name>
            <name name-style="western">
              <surname>Riskin</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Dey</surname>
              <given-names>AK</given-names>
            </name>
            <name name-style="western">
              <surname>Mankoff</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Leveraging collaborative-filtering for personalized behavior modeling</article-title>
          <source>Proc ACM Interact Mob Wearable Ubiquitous Technol</source>
          <year>2021</year>
          <month>03</month>
          <day>19</day>
          <volume>5</volume>
          <issue>1</issue>
          <fpage>1</fpage>
          <lpage>27</lpage>
          <pub-id pub-id-type="doi">10.1145/3448107</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chikersal</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Doryab</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Tumminia</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Villalba</surname>
              <given-names>DK</given-names>
            </name>
            <name name-style="western">
              <surname>Dutcher</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Cohen</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Creswell</surname>
              <given-names>KG</given-names>
            </name>
            <name name-style="western">
              <surname>Mankoff</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Creswell</surname>
              <given-names>JD</given-names>
            </name>
            <name name-style="western">
              <surname>Goel</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Dey</surname>
              <given-names>AK</given-names>
            </name>
          </person-group>
          <article-title>Detecting depression and predicting its onset using longitudinal symptoms captured by passive sensing</article-title>
          <source>ACM Trans Comput-Hum Interact</source>
          <year>2021</year>
          <month>02</month>
          <day>28</day>
          <volume>28</volume>
          <issue>1</issue>
          <fpage>1</fpage>
          <lpage>41</lpage>
          <pub-id pub-id-type="doi">10.1145/3422821</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Elias</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Why wearables are out of reach for people who need them most</article-title>
          <source>Forbes</source>
          <year>2015</year>
          <access-date>2022-04-23</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.forbes.com/sites/jenniferelias/2015/10/27/the-leftovers-part-i-the-cost-of-activity/?sh=a0e5ffc63c9b">https://www.forbes.com/sites/jenniferelias/2015/10/27/the-leftovers-part-i-the-cost-of-activity/?sh=a0e5ffc63c9b</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lohchab</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Affordable smartphone sales shoot up as demand grows due to e-learning needs</article-title>
          <source>Economic Times</source>
          <year>2020</year>
          <access-date>2022-05-26</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://economictimes.indiatimes.com/tech/hardware/affordable-smartphone-sales-shoot-up-as-demand-grows/articleshow/78241563.cms">https://economictimes.indiatimes.com/tech/hardware/affordable-smartphone-sales-shoot-up-as-demand-grows/articleshow/78241563.cms</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Atske</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Use of smartphones and social media is common across most emerging economies</article-title>
          <source>Pew Research Center: Internet, Science &amp; Tech</source>
          <year>2019</year>
          <access-date>2022-04-23</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.pewresearch.org/internet/2019/03/07/use-of-smartphones-and-social-media-is-common-across-most-emerging-economies/">https://www.pewresearch.org/internet/2019/03/07/use-of-smartphones-and-social-media-is-common-across-most-emerging-economies/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ahmed</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Rony</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Hasan</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Ahmed</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>Smartphone usage behavior between depressed and non-depressed students: an exploratory study in the context of Bangladesh</article-title>
          <year>2020</year>
          <conf-name>Adjunct Proceedings of the 2020 ACM International Joint Conference on Pervasive and Ubiquitous Computing and Proceedings of the 2020 ACM International Symposium on Wearable Computers</conf-name>
          <conf-date>Sept 12-17</conf-date>
          <conf-loc>Virtual Event/Mexico</conf-loc>
          <pub-id pub-id-type="doi">10.1145/3410530.3414441</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ahmed</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Ahmed</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>Exploring unique app signature of the depressed and non-depressed through their fingerprints on apps</article-title>
          <source>Lecture Notes of the Institute for Computer Sciences, Social Informatics and Telecommunications Engineering</source>
          <year>2022</year>
          <publisher-loc>Cham</publisher-loc>
          <publisher-name>Springer International</publisher-name>
          <fpage>218</fpage>
          <lpage>239</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Saeb</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Karr</surname>
              <given-names>CJ</given-names>
            </name>
            <name name-style="western">
              <surname>Schueller</surname>
              <given-names>SM</given-names>
            </name>
            <name name-style="western">
              <surname>Corden</surname>
              <given-names>ME</given-names>
            </name>
            <name name-style="western">
              <surname>Kording</surname>
              <given-names>KP</given-names>
            </name>
            <name name-style="western">
              <surname>Mohr</surname>
              <given-names>DC</given-names>
            </name>
          </person-group>
          <article-title>Mobile phone sensor correlates of depressive symptom severity in daily-life behavior: an exploratory study</article-title>
          <source>J Med Internet Res</source>
          <year>2015</year>
          <month>07</month>
          <day>15</day>
          <volume>17</volume>
          <issue>7</issue>
          <fpage>e175</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2015/7/e175/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/jmir.4273</pub-id>
          <pub-id pub-id-type="medline">26180009</pub-id>
          <pub-id pub-id-type="pii">v17i7e175</pub-id>
          <pub-id pub-id-type="pmcid">PMC4526997</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Nickels</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Edwards</surname>
              <given-names>MD</given-names>
            </name>
            <name name-style="western">
              <surname>Poole</surname>
              <given-names>SF</given-names>
            </name>
            <name name-style="western">
              <surname>Winter</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Gronsbell</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Rozenkrants</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Miller</surname>
              <given-names>DP</given-names>
            </name>
            <name name-style="western">
              <surname>Fleck</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>McLean</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Peterson</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Hwang</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Rust-Smith</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Brant</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Campbell</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Walter</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Arean</surname>
              <given-names>PA</given-names>
            </name>
            <name name-style="western">
              <surname>Hsin</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Myers</surname>
              <given-names>LJ</given-names>
            </name>
            <name name-style="western">
              <surname>Marks</surname>
              <given-names>WJ</given-names>
            </name>
            <name name-style="western">
              <surname>Mega</surname>
              <given-names>JL</given-names>
            </name>
            <name name-style="western">
              <surname>Schlosser</surname>
              <given-names>DA</given-names>
            </name>
            <name name-style="western">
              <surname>Conrad</surname>
              <given-names>AJ</given-names>
            </name>
            <name name-style="western">
              <surname>Califf</surname>
              <given-names>RM</given-names>
            </name>
            <name name-style="western">
              <surname>Fromer</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Toward a mobile platform for real-world digital measurement of depression: user-centered design, data quality, and behavioral and clinical modeling</article-title>
          <source>JMIR Ment Health</source>
          <year>2021</year>
          <month>08</month>
          <day>10</day>
          <volume>8</volume>
          <issue>8</issue>
          <fpage>e27589</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://mental.jmir.org/2021/8/e27589/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/27589</pub-id>
          <pub-id pub-id-type="medline">34383685</pub-id>
          <pub-id pub-id-type="pii">v8i8e27589</pub-id>
          <pub-id pub-id-type="pmcid">PMC8386379</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hunt</surname>
              <given-names>MG</given-names>
            </name>
            <name name-style="western">
              <surname>Marx</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Lipson</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Young</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>No more FOMO: limiting social media decreases loneliness and depression</article-title>
          <source>J Soc Clin Psychol</source>
          <year>2018</year>
          <month>12</month>
          <volume>37</volume>
          <issue>10</issue>
          <fpage>751</fpage>
          <lpage>768</lpage>
          <pub-id pub-id-type="doi">10.1521/jscp.2018.37.10.751</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wetzel</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Pryss</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Baumeister</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Edler</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Gonçalves</surname>
              <given-names>ASO</given-names>
            </name>
            <name name-style="western">
              <surname>Cohrdes</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>"How come you don't call me?" Smartphone communication app usage as an indicator of loneliness and social well-being across the adult lifespan during the COVID-19 pandemic</article-title>
          <source>Int J Environ Res Public Health</source>
          <year>2021</year>
          <month>06</month>
          <day>08</day>
          <volume>18</volume>
          <issue>12</issue>
          <fpage>6212</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.mdpi.com/resolver?pii=ijerph18126212"/>
          </comment>
          <pub-id pub-id-type="doi">10.3390/ijerph18126212</pub-id>
          <pub-id pub-id-type="medline">34201322</pub-id>
          <pub-id pub-id-type="pii">ijerph18126212</pub-id>
          <pub-id pub-id-type="pmcid">PMC8227237</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gao</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Zhu</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>X</given-names>
            </name>
          </person-group>
          <article-title>How smartphone usage correlates with social anxiety and loneliness</article-title>
          <source>PeerJ</source>
          <year>2016</year>
          <volume>4</volume>
          <fpage>e2197</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/27478700"/>
          </comment>
          <pub-id pub-id-type="doi">10.7717/peerj.2197</pub-id>
          <pub-id pub-id-type="medline">27478700</pub-id>
          <pub-id pub-id-type="pii">2197</pub-id>
          <pub-id pub-id-type="pmcid">PMC4950540</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>daSilva</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Huckins</surname>
              <given-names>JF</given-names>
            </name>
            <name name-style="western">
              <surname>Kelley</surname>
              <given-names>WM</given-names>
            </name>
            <name name-style="western">
              <surname>Heatherton</surname>
              <given-names>TF</given-names>
            </name>
            <name name-style="western">
              <surname>Campbell</surname>
              <given-names>AT</given-names>
            </name>
          </person-group>
          <article-title>Tracking depression dynamics in college students using mobile phone and wearable sensing</article-title>
          <source>Proc ACM Interact Mob Wearable Ubiquitous Technol</source>
          <year>2018</year>
          <month>03</month>
          <day>26</day>
          <volume>2</volume>
          <issue>1</issue>
          <fpage>1</fpage>
          <lpage>26</lpage>
          <pub-id pub-id-type="doi">10.1145/3191775</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Masud</surname>
              <given-names>MT</given-names>
            </name>
            <name name-style="western">
              <surname>Mamun</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>Thapa</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>DH</given-names>
            </name>
            <name name-style="western">
              <surname>Griffiths</surname>
              <given-names>MD</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Unobtrusive monitoring of behavior and movement patterns to detect clinical depression severity level via smartphone</article-title>
          <source>J Biomed Inform</source>
          <year>2020</year>
          <month>03</month>
          <volume>103</volume>
          <fpage>103371</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1532-0464(19)30291-6"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2019.103371</pub-id>
          <pub-id pub-id-type="medline">31935462</pub-id>
          <pub-id pub-id-type="pii">S1532-0464(19)30291-6</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref34">
        <label>34</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Cao</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Truong</surname>
              <given-names>AL</given-names>
            </name>
            <name name-style="western">
              <surname>Banu</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Shah</surname>
              <given-names>AA</given-names>
            </name>
            <name name-style="western">
              <surname>Sabharwal</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Moukaddam</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>Tracking and predicting depressive symptoms of adolescents using smartphone-based self-reports, parental evaluations, and passive phone sensor data: development and usability study</article-title>
          <source>JMIR Ment Health</source>
          <year>2020</year>
          <month>01</month>
          <day>24</day>
          <volume>7</volume>
          <issue>1</issue>
          <fpage>e14045</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://mental.jmir.org/2020/1/e14045/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/14045</pub-id>
          <pub-id pub-id-type="medline">32012072</pub-id>
          <pub-id pub-id-type="pii">v7i1e14045</pub-id>
          <pub-id pub-id-type="pmcid">PMC7007590</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref35">
        <label>35</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Opoku Asare</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Terhorst</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Vega</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Peltonen</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Lagerspetz</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Ferreira</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Predicting depression from smartphone behavioral markers using machine learning methods, hyperparameter optimization, and feature importance analysis: exploratory study</article-title>
          <source>JMIR Mhealth Uhealth</source>
          <year>2021</year>
          <month>07</month>
          <day>12</day>
          <volume>9</volume>
          <issue>7</issue>
          <fpage>e26540</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://mhealth.jmir.org/2021/7/e26540/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/26540</pub-id>
          <pub-id pub-id-type="medline">34255713</pub-id>
          <pub-id pub-id-type="pii">v9i7e26540</pub-id>
          <pub-id pub-id-type="pmcid">PMC8314163</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref36">
        <label>36</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Opoku Asare</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Moshe</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Terhorst</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Vega</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Hosio</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Baumeister</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Pulkki-Råback</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Ferreira</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Mood ratings and digital biomarkers from smartphone and wearable data differentiates and predicts depression status: a longitudinal data analysis</article-title>
          <source>Pervasive Mob Comput</source>
          <year>2022</year>
          <month>07</month>
          <volume>83</volume>
          <fpage>101621</fpage>
          <pub-id pub-id-type="doi">10.1016/j.pmcj.2022.101621</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref37">
        <label>37</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ware</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Yue</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Morillo</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Lu</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Shang</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Bi</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Kamath</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Russell</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Bamis</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>Predicting depressive symptoms using smartphone data</article-title>
          <source>Smart Health</source>
          <year>2020</year>
          <month>03</month>
          <volume>15</volume>
          <fpage>100093</fpage>
          <pub-id pub-id-type="doi">10.1016/j.smhl.2019.100093</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref38">
        <label>38</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yue</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Ware</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Morillo</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Lu</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Shang</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Bi</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Kamath</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Russell</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Bamis</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>Fusing location data for depression prediction</article-title>
          <source>IEEE Trans Big Data</source>
          <year>2021</year>
          <month>06</month>
          <day>01</day>
          <volume>7</volume>
          <issue>2</issue>
          <fpage>355</fpage>
          <lpage>370</lpage>
          <pub-id pub-id-type="doi">10.1109/tbdata.2018.2872569</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref39">
        <label>39</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Farhan</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Yue</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Morillo</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Ware</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Lu</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Bi</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Kamath</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Russell</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Bamis</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>Behavior vs. introspection: refining prediction of clinical depression via smartphone sensing data</article-title>
          <year>2016</year>
          <conf-name>2016 IEEE Wireless Health (WH)</conf-name>
          <conf-date>Oct 25-27</conf-date>
          <conf-loc>Bethesda, MD</conf-loc>
          <pub-id pub-id-type="doi">10.1109/wh.2016.7764553</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref40">
        <label>40</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Canzian</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Musolesi</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Trajectories of depression: unobtrusive monitoring of depressive states by means of smartphone mobility traces analysis</article-title>
          <year>2015</year>
          <conf-name>2015 ACM International Joint Conference on Pervasive and Ubiquitous Computing - UbiComp '15</conf-name>
          <conf-date>Sept 7-11</conf-date>
          <conf-loc>Osaka, Japan</conf-loc>
          <pub-id pub-id-type="doi">10.1145/2750858.2805845</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref41">
        <label>41</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ben Abdesslem</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Phillips</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Henderson</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>Less is more: energy-efficient mobile sensing with senseless</article-title>
          <year>2009</year>
          <conf-name>1st ACM Workshop on Networking, Systems, and Applications for Mobile Handhelds - MobiHeld '09</conf-name>
          <conf-date>Aug 17</conf-date>
          <conf-loc>Barcelona, Spain</conf-loc>
          <pub-id pub-id-type="doi">10.1145/1592606.1592621</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref42">
        <label>42</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Dougan</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Curran</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Detection of social interaction using mobile phones via device free passive localisation</article-title>
          <source>Int J Handheld Comput Res</source>
          <year>2014</year>
          <volume>5</volume>
          <issue>4</issue>
          <fpage>35</fpage>
          <pub-id pub-id-type="doi">10.4018/ijhcr.2014100102</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref43">
        <label>43</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Boase</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Ling</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Measuring mobile phone use: self-report versus log data</article-title>
          <source>J Comput-Mediat Comm</source>
          <year>2013</year>
          <month>06</month>
          <day>10</day>
          <volume>18</volume>
          <issue>4</issue>
          <fpage>508</fpage>
          <lpage>519</lpage>
          <pub-id pub-id-type="doi">10.1111/jcc4.12021</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref44">
        <label>44</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ernala</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Burke</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Leavitt</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Ellison</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>How well do people report time spent on Facebook?: an evaluation of established survey questions with recommendations</article-title>
          <year>2020</year>
          <conf-name>2020 CHI Conference on Human Factors in Computing Systems</conf-name>
          <conf-date>Apr 25-30</conf-date>
          <conf-loc>Honolulu, HI</conf-loc>
          <pub-id pub-id-type="doi">10.1145/3313831.3376435</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref45">
        <label>45</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ahmed</surname>
              <given-names>MS</given-names>
            </name>
          </person-group>
          <article-title>Mon Majhi</article-title>
          <source>Google Play</source>
          <access-date>2023-04-29</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://play.google.com/store/apps/details?id=net.mn.u">https://play.google.com/store/apps/details?id=net.mn.u</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref46">
        <label>46</label>
        <nlm-citation citation-type="web">
          <article-title>Mobile operating system market share Bangladesh</article-title>
          <source>StatCounter Global Stats</source>
          <year>2022</year>
          <access-date>2022-04-24</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://gs.statcounter.com/os-market-share/mobile/bangladesh">https://gs.statcounter.com/os-market-share/mobile/bangladesh</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref47">
        <label>47</label>
        <nlm-citation citation-type="web">
          <article-title>UsageStatsManager</article-title>
          <source>Android Developers</source>
          <year>2022</year>
          <access-date>2023-04-29</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://developer.android.com/reference/android/app/usage/UsageStatsManager">https://developer.android.com/reference/android/app/usage/UsageStatsManager</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref48">
        <label>48</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lu</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>App usage</article-title>
          <source>Google</source>
          <access-date>2022-04-24</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://play.google.com/store/apps/details?id=com.a0soft.gphone.uninstaller">https://play.google.com/store/apps/details?id=com.a0soft.gphone.uninstaller</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref49">
        <label>49</label>
        <nlm-citation citation-type="web">
          <article-title>YourHour - screentime control</article-title>
          <source>Mindefy Labs</source>
          <access-date>2023-04-29</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://play.google.com/store/apps/details?id=com.mindefy.phoneaddiction.mobilepe">https://play.google.com/store/apps/details?id=com.mindefy.phoneaddiction.mobilepe</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref50">
        <label>50</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Islam</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Akter</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Sikder</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Griffiths</surname>
              <given-names>MD</given-names>
            </name>
          </person-group>
          <article-title>Prevalence and factors associated with depression and anxiety among first-year university students in Bangladesh: a cross-sectional study</article-title>
          <source>Int J Ment Health Addiction</source>
          <year>2020</year>
          <month>03</month>
          <day>02</day>
          <volume>20</volume>
          <issue>3</issue>
          <fpage>1289</fpage>
          <lpage>1302</lpage>
          <pub-id pub-id-type="doi">10.1007/s11469-020-00242-y</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref51">
        <label>51</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ahmed</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>86pc university students own smartphones in Bangladesh: survey</article-title>
          <source>Prothom Alo</source>
          <year>2020</year>
          <month>06</month>
          <day>06</day>
          <access-date>2023-04-29</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://en.prothomalo.com/youth/education/86pc-university-students-own-smartphones-in-bangladesh-survey">https://en.prothomalo.com/youth/education/86pc-university-students-own-smartphones-in-bangladesh-survey</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref52">
        <label>52</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Velloza</surname>
              <given-names>Jennifer</given-names>
            </name>
            <name name-style="western">
              <surname>Njoroge</surname>
              <given-names>John</given-names>
            </name>
            <name name-style="western">
              <surname>Ngure</surname>
              <given-names>Kenneth</given-names>
            </name>
            <name name-style="western">
              <surname>Thuo</surname>
              <given-names>Nicholas</given-names>
            </name>
            <name name-style="western">
              <surname>Kiptinness</surname>
              <given-names>Catherine</given-names>
            </name>
            <name name-style="western">
              <surname>Momanyi</surname>
              <given-names>Richard</given-names>
            </name>
            <name name-style="western">
              <surname>Ayub</surname>
              <given-names>Snaidah</given-names>
            </name>
            <name name-style="western">
              <surname>Gakuo</surname>
              <given-names>Stephen</given-names>
            </name>
            <name name-style="western">
              <surname>Mugo</surname>
              <given-names>Nelly</given-names>
            </name>
            <name name-style="western">
              <surname>Simoni</surname>
              <given-names>Jane</given-names>
            </name>
            <name name-style="western">
              <surname>Heffron</surname>
              <given-names>Renee</given-names>
            </name>
          </person-group>
          <article-title>Cognitive testing of the PHQ-9 for depression screening among pregnant and postpartum women in Kenya</article-title>
          <source>BMC Psychiatry</source>
          <year>2020</year>
          <month>01</month>
          <day>29</day>
          <volume>20</volume>
          <issue>1</issue>
          <fpage>31</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcpsychiatry.biomedcentral.com/articles/10.1186/s12888-020-2435-6"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12888-020-2435-6</pub-id>
          <pub-id pub-id-type="medline">31996166</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12888-020-2435-6</pub-id>
          <pub-id pub-id-type="pmcid">PMC6990517</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref53">
        <label>53</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kroenke</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Spitzer</surname>
              <given-names>RL</given-names>
            </name>
            <name name-style="western">
              <surname>Williams</surname>
              <given-names>JB</given-names>
            </name>
          </person-group>
          <article-title>The PHQ-9: validity of a brief depression severity measure</article-title>
          <source>J Gen Intern Med</source>
          <year>2001</year>
          <month>09</month>
          <volume>16</volume>
          <issue>9</issue>
          <fpage>606</fpage>
          <lpage>613</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/11556941"/>
          </comment>
          <pub-id pub-id-type="doi">10.1046/j.1525-1497.2001.016009606.x</pub-id>
          <pub-id pub-id-type="medline">11556941</pub-id>
          <pub-id pub-id-type="pii">jgi01114</pub-id>
          <pub-id pub-id-type="pmcid">PMC1495268</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref54">
        <label>54</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Jung</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Ko</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>U</given-names>
            </name>
          </person-group>
          <article-title>GoalKeeper: exploring interaction lockout mechanisms for regulating smartphone use</article-title>
          <source>Proc ACM Interact Mob Wearable Ubiquitous Technol</source>
          <year>2019</year>
          <month>03</month>
          <day>29</day>
          <volume>3</volume>
          <issue>1</issue>
          <fpage>1</fpage>
          <lpage>29</lpage>
          <pub-id pub-id-type="doi">10.1145/3314403</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref55">
        <label>55</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Mark</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>The context of college students' Facebook use and academic performance: an empirical study</article-title>
          <year>2018</year>
          <conf-name>2018 CHI Conference on Human Factors in Computing Systems</conf-name>
          <conf-date>Apr 21-26</conf-date>
          <conf-loc>Montreal, QC</conf-loc>
          <pub-id pub-id-type="doi">10.1145/3173574.3173992</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref56">
        <label>56</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lyngs</surname>
              <given-names>U</given-names>
            </name>
            <name name-style="western">
              <surname>Lukoff</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Slovak</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Seymour</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Webb</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Jirotka</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Zhao</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Van Kleek</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Shadbolt</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>'I just want to hack myself to not get distracted': evaluating design interventions for self-control on Facebook</article-title>
          <year>2020</year>
          <conf-name>2020 CHI Conference on Human Factors in Computing Systems</conf-name>
          <conf-date>Apr 25-30</conf-date>
          <conf-loc>Honolulu, HI</conf-loc>
          <pub-id pub-id-type="doi">10.1145/3313831.3376672</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref57">
        <label>57</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Cheng</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Burke</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Davis</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>Understanding perceptions of problematic Facebook use: when people experience negative life impact and a lack of control</article-title>
          <year>2019</year>
          <conf-name>2019 CHI Conference on Human Factors in Computing Systems</conf-name>
          <conf-date>May 4-9</conf-date>
          <conf-loc>Glasgow, Scotland</conf-loc>
          <pub-id pub-id-type="doi">10.1145/3290605.3300429</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref58">
        <label>58</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Böhmer</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Hecht</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Schöning</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Krüger</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Bauer</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Falling asleep with Angry Birds, Facebook and Kindle: a large scale study on mobile application usage</article-title>
          <year>2011</year>
          <conf-name>13th International Conference on Human Computer Interaction with Mobile Devices and Services - MobileHCI '11</conf-name>
          <conf-date>Aug 30 - Sept 2</conf-date>
          <conf-loc>Stockholm, Sweden</conf-loc>
          <pub-id pub-id-type="doi">10.1145/2037373.2037383</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref59">
        <label>59</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Carrascal</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Church</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>An in-situ study of mobile app and mobile search interactions</article-title>
          <year>2015</year>
          <conf-name>33rd Annual ACM Conference on Human Factors in Computing Systems - CHI '15</conf-name>
          <conf-date>Apr 18-23</conf-date>
          <conf-loc>Seoul, Republic of Korea</conf-loc>
          <pub-id pub-id-type="doi">10.1145/2702123.2702486</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref60">
        <label>60</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Soikkeli</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Karikoski</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Hämmäinen</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Diversity and end user context in smartphone usage sessions</article-title>
          <year>2011</year>
          <conf-name>Fifth International Conference on Next Generation Mobile Applications, Services and Technologies (NGMAST 2011)</conf-name>
          <conf-date>Sept 14-16</conf-date>
          <conf-loc>Cardiff, UK</conf-loc>
          <pub-id pub-id-type="doi">10.1109/ngmast.2011.12</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref61">
        <label>61</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>van Berkel</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Luo</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Anagnostopoulos</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Ferreira</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Goncalves</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Hosio</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Kostakos</surname>
              <given-names>V</given-names>
            </name>
          </person-group>
          <article-title>A systematic assessment of smartphone usage gaps</article-title>
          <year>2016</year>
          <conf-name>2016 CHI Conference on Human Factors in Computing Systems</conf-name>
          <conf-date>May 7-12</conf-date>
          <conf-loc>San Jose, CA</conf-loc>
          <pub-id pub-id-type="doi">10.1145/2858036.2858348</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref62">
        <label>62</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Banovic</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Brant</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Mankoff</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Dey</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>ProactiveTasks: the short of mobile device use sessions</article-title>
          <year>2014</year>
          <conf-name>16th International Conference on Human-Computer Interaction with Mobile Devices &amp; Services - MobileHCI '14</conf-name>
          <conf-date>Sept 23-26</conf-date>
          <conf-loc>Toronto, ON</conf-loc>
          <pub-id pub-id-type="doi">10.1145/2628363.2628380</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref63">
        <label>63</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ferreira</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Goncalves</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Kostakos</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Barkhuus</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Dey</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Contextual experience sampling of mobile application micro-usage</article-title>
          <year>2014</year>
          <conf-name>16th International Conference on Human-Computer Interaction with Mobile Devices &amp; Services - MobileHCI '14</conf-name>
          <conf-date>Sept 23-26</conf-date>
          <conf-loc>Toronto, ON</conf-loc>
          <pub-id pub-id-type="doi">10.1145/2628363.2628367</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref64">
        <label>64</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Shannon</surname>
              <given-names>CE</given-names>
            </name>
          </person-group>
          <article-title>A mathematical theory of communication</article-title>
          <source>SIGMOBILE Mob Comput Commun Rev</source>
          <year>2001</year>
          <month>01</month>
          <volume>5</volume>
          <issue>1</issue>
          <fpage>3</fpage>
          <lpage>55</lpage>
          <pub-id pub-id-type="doi">10.1145/584091.584093</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref65">
        <label>65</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tu</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Hui</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Su</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Jin</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Your apps give you away: distinguishing mobile users by their app usage fingerprints</article-title>
          <source>Proc ACM Interact Mob Wearable Ubiquitous Technol</source>
          <year>2018</year>
          <month>09</month>
          <day>18</day>
          <volume>2</volume>
          <issue>3</issue>
          <fpage>1</fpage>
          <lpage>23</lpage>
          <pub-id pub-id-type="doi">10.1145/3264948</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref66">
        <label>66</label>
        <nlm-citation citation-type="book">
          <article-title>Hamming distance</article-title>
          <source>Encyclopedia of Biometrics</source>
          <year>2009</year>
          <publisher-loc>Boston, MA</publisher-loc>
          <publisher-name>Springer</publisher-name>
          <fpage>668</fpage>
        </nlm-citation>
      </ref>
      <ref id="ref67">
        <label>67</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhao</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Ramos</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Tao</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Jiang</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Pan</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Dey</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Discovering different kinds of smartphone users through their application usage behaviors</article-title>
          <year>2016</year>
          <conf-name>2016 ACM International Joint Conference on Pervasive and Ubiquitous Computing</conf-name>
          <conf-date>Sept 12-16</conf-date>
          <conf-loc>Heidelberg, Germany</conf-loc>
          <pub-id pub-id-type="doi">10.1145/2971648.2971696</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref68">
        <label>68</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rahaman</surname>
              <given-names>MS</given-names>
            </name>
            <name name-style="western">
              <surname>Moral</surname>
              <given-names>IH</given-names>
            </name>
            <name name-style="western">
              <surname>Rahman</surname>
              <given-names>MM</given-names>
            </name>
            <name name-style="western">
              <surname>Sahabuddin</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Samuel</surname>
              <given-names>AB</given-names>
            </name>
          </person-group>
          <article-title>Online learning in Bangladesh during COVID-19: perceived effectiveness, challenges, and suggestions</article-title>
          <source>J Educ Manag Dev Stud</source>
          <year>2021</year>
          <month>12</month>
          <day>30</day>
          <volume>1</volume>
          <issue>3</issue>
          <fpage>35</fpage>
          <lpage>47</lpage>
          <pub-id pub-id-type="doi">10.52631/jemds.v1i3.51</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref69">
        <label>69</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="editor">
            <name name-style="western">
              <surname>Guyon</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Nikravesh</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Gunn</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Zadeh</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <source>Feature Extraction: Foundations and Applications</source>
          <year>2006</year>
          <publisher-loc>Berlin, Heidelberg</publisher-loc>
          <publisher-name>Springer</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref70">
        <label>70</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Meinshausen</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Bühlmann</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Stability selection</article-title>
          <source>J R Stat Soc Series B Stat Methodol</source>
          <year>2010</year>
          <volume>72</volume>
          <issue>4</issue>
          <fpage>417</fpage>
          <lpage>473</lpage>
          <pub-id pub-id-type="doi">10.1111/j.1467-9868.2010.00740.x</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref71">
        <label>71</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Géron</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <source>Hands-On Machine Learning with Scikit-Learn and TensorFlow</source>
          <year>2017</year>
          <publisher-loc>Sebastopol, CA</publisher-loc>
          <publisher-name>O'Reilly Media</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref72">
        <label>72</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Peduzzi</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Concato</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Kemper</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Holford</surname>
              <given-names>TR</given-names>
            </name>
            <name name-style="western">
              <surname>Feinstein</surname>
              <given-names>AR</given-names>
            </name>
          </person-group>
          <article-title>A simulation study of the number of events per variable in logistic regression analysis</article-title>
          <source>J Clin Epidemiol</source>
          <year>1996</year>
          <month>12</month>
          <volume>49</volume>
          <issue>12</issue>
          <fpage>1373</fpage>
          <lpage>1379</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S0895-4356(96)00236-3"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/s0895-4356(96)00236-3</pub-id>
          <pub-id pub-id-type="medline">8970487</pub-id>
          <pub-id pub-id-type="pii">S0895-4356(96)00236-3</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref73">
        <label>73</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kursa</surname>
              <given-names>MB</given-names>
            </name>
            <name name-style="western">
              <surname>Rudnicki</surname>
              <given-names>WR</given-names>
            </name>
          </person-group>
          <article-title>Feature selection with the Boruta package</article-title>
          <source>J Stat Softw</source>
          <year>2010</year>
          <volume>36</volume>
          <issue>11</issue>
          <fpage>1</fpage>
          <lpage>13</lpage>
          <pub-id pub-id-type="doi">10.18637/jss.v036.i11</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref74">
        <label>74</label>
        <nlm-citation citation-type="web">
          <article-title>Boruta_py</article-title>
          <source>GitHub</source>
          <year>2019</year>
          <access-date>2022-04-24</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://github.com/scikit-learn-contrib/boruta_py">https://github.com/scikit-learn-contrib/boruta_py</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref75">
        <label>75</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yan</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Dutcher</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Tumminia</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Villalba</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Cohen</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Creswell</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Creswell</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Mankoff</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Dey</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Doryab</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>A computational framework for modeling biobehavioral rhythms from mobile and wearable data streams</article-title>
          <source>ACM Trans Intell Syst Technol</source>
          <year>2022</year>
          <month>06</month>
          <day>30</day>
          <volume>13</volume>
          <issue>3</issue>
          <fpage>1</fpage>
          <lpage>27</lpage>
          <pub-id pub-id-type="doi">10.1145/3510029</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref76">
        <label>76</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Dinga</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Marquand</surname>
              <given-names>AF</given-names>
            </name>
            <name name-style="western">
              <surname>Veltman</surname>
              <given-names>DJ</given-names>
            </name>
            <name name-style="western">
              <surname>Beekman</surname>
              <given-names>ATF</given-names>
            </name>
            <name name-style="western">
              <surname>Schoevers</surname>
              <given-names>RA</given-names>
            </name>
            <name name-style="western">
              <surname>van Hemert</surname>
              <given-names>AM</given-names>
            </name>
            <name name-style="western">
              <surname>Penninx</surname>
              <given-names>BWJH</given-names>
            </name>
            <name name-style="western">
              <surname>Schmaal</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Predicting the naturalistic course of depression from a wide range of clinical, psychological, and biological data: a machine learning approach</article-title>
          <source>Transl Psychiatry</source>
          <year>2018</year>
          <month>11</month>
          <day>05</day>
          <volume>8</volume>
          <issue>1</issue>
          <fpage>241</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/s41398-018-0289-1"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41398-018-0289-1</pub-id>
          <pub-id pub-id-type="medline">30397196</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41398-018-0289-1</pub-id>
          <pub-id pub-id-type="pmcid">PMC6218451</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref77">
        <label>77</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Andaur Navarro</surname>
              <given-names>CL</given-names>
            </name>
            <name name-style="western">
              <surname>Damen</surname>
              <given-names>JAA</given-names>
            </name>
            <name name-style="western">
              <surname>Takada</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Nijman</surname>
              <given-names>SWJ</given-names>
            </name>
            <name name-style="western">
              <surname>Dhiman</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Ma</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Collins</surname>
              <given-names>GS</given-names>
            </name>
            <name name-style="western">
              <surname>Bajpai</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Riley</surname>
              <given-names>RD</given-names>
            </name>
            <name name-style="western">
              <surname>Moons</surname>
              <given-names>KGM</given-names>
            </name>
            <name name-style="western">
              <surname>Hooft</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Risk of bias in studies on prediction models developed using supervised machine learning techniques: systematic review</article-title>
          <source>BMJ</source>
          <year>2021</year>
          <month>10</month>
          <day>20</day>
          <volume>375</volume>
          <fpage>n2281</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://www.bmj.com/lookup/pmidlookup?view=long&amp;pmid=34670780"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/bmj.n2281</pub-id>
          <pub-id pub-id-type="medline">34670780</pub-id>
          <pub-id pub-id-type="pmcid">PMC8527348</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref78">
        <label>78</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Beriwal</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Agrawal</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Techniques for suicidal ideation prediction: a qualitative systematic review</article-title>
          <year>2021</year>
          <conf-name>2021 International Conference on INnovations in Intelligent SysTems and Applications (INISTA)</conf-name>
          <conf-date>Aug 25-27</conf-date>
          <conf-loc>Kocaeli, Turkey</conf-loc>
          <pub-id pub-id-type="doi">10.1109/inista52262.2021.9548444</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref79">
        <label>79</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bernert</surname>
              <given-names>RA</given-names>
            </name>
            <name name-style="western">
              <surname>Hilberg</surname>
              <given-names>AM</given-names>
            </name>
            <name name-style="western">
              <surname>Melia</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>JP</given-names>
            </name>
            <name name-style="western">
              <surname>Shah</surname>
              <given-names>NH</given-names>
            </name>
            <name name-style="western">
              <surname>Abnousi</surname>
              <given-names>F</given-names>
            </name>
          </person-group>
          <article-title>Artificial intelligence and suicide prevention: a systematic review of machine learning investigations</article-title>
          <source>Int J Environ Res Public Health</source>
          <year>2020</year>
          <month>08</month>
          <day>15</day>
          <volume>17</volume>
          <issue>16</issue>
          <fpage>5929</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.mdpi.com/resolver?pii=ijerph17165929"/>
          </comment>
          <pub-id pub-id-type="doi">10.3390/ijerph17165929</pub-id>
          <pub-id pub-id-type="medline">32824149</pub-id>
          <pub-id pub-id-type="pii">ijerph17165929</pub-id>
          <pub-id pub-id-type="pmcid">PMC7460360</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref80">
        <label>80</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ke</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Meng</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Finley</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Ma</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Ye</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>LightGBM: a highly efficient gradient boosting decision tree</article-title>
          <year>2017</year>
          <conf-name>31st International Conference on Neural Information Processing Systems</conf-name>
          <conf-date>Dec 4-9</conf-date>
          <conf-loc>Long Beach, CA</conf-loc>
        </nlm-citation>
      </ref>
      <ref id="ref81">
        <label>81</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Prokhorenkova</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Gusev</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Vorobev</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Dorogush</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Gulin</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>CatBoost: unbiased boosting with categorical features</article-title>
          <source>arXiv csLG</source>
          <year>2017</year>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dl.acm.org/doi/pdf/10.5555/3327757.3327770"/>
          </comment>
          <pub-id pub-id-type="doi">10.5555/3327757.3327770</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref82">
        <label>82</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Friedman</surname>
              <given-names>JH</given-names>
            </name>
          </person-group>
          <article-title>Greedy function approximation: a gradient boosting machine</article-title>
          <source>Ann Stat</source>
          <year>2001</year>
          <month>10</month>
          <volume>29</volume>
          <issue>5</issue>
          <fpage>1189</fpage>
          <lpage>1232</lpage>
          <pub-id pub-id-type="doi">10.1214/aos/1013203451</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref83">
        <label>83</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Vabalas</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Gowen</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Poliakoff</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Casson</surname>
              <given-names>AJ</given-names>
            </name>
          </person-group>
          <article-title>Machine learning algorithm validation with a limited sample size</article-title>
          <source>PLoS One</source>
          <year>2019</year>
          <volume>14</volume>
          <issue>11</issue>
          <fpage>e0224365</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dx.plos.org/10.1371/journal.pone.0224365"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pone.0224365</pub-id>
          <pub-id pub-id-type="medline">31697686</pub-id>
          <pub-id pub-id-type="pii">PONE-D-19-13163</pub-id>
          <pub-id pub-id-type="pmcid">PMC6837442</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref84">
        <label>84</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Cross-validation for selecting a model selection procedure</article-title>
          <source>J Econom</source>
          <year>2015</year>
          <month>07</month>
          <volume>187</volume>
          <issue>1</issue>
          <fpage>95</fpage>
          <lpage>112</lpage>
          <pub-id pub-id-type="doi">10.1016/j.jeconom.2015.02.006</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref85">
        <label>85</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bergstra</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Yamins</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Cox</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Making a science of model search: hyperparameter optimization in hundreds of dimensions for vision architectures</article-title>
          <year>2013</year>
          <conf-name>30th International Conference on Machine Learning</conf-name>
          <conf-date>June 16-21</conf-date>
          <conf-loc>Atlanta, GA</conf-loc>
          <fpage>115</fpage>
          <lpage>123</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref86">
        <label>86</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pedregosa</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Varoquaux</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Gramfort</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Michel</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Thirion</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Grisel</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Blondel</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Müller</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Nothman</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Louppe</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Prettenhofer</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Weiss</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Dubourg</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Vanderplas</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Passos</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Cournapeau</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Brucher</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Perrot</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Duchesnay</surname>
              <given-names>É</given-names>
            </name>
          </person-group>
          <article-title>Scikit-learn: machine learning in Python</article-title>
          <source>arXiv</source>
          <comment>Preprint posted online Jan 2, 2012</comment>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://arxiv.org/abs/1201.0490"/>
          </comment>
          <pub-id pub-id-type="doi">10.48550/arXiv.1201.0490</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref87">
        <label>87</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lundberg</surname>
              <given-names>SM</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>S-I</given-names>
            </name>
          </person-group>
          <article-title>A unified approach to interpreting model predictions</article-title>
          <year>2017</year>
          <conf-name>Advances in Neural Information Processing Systems 30 (NIPS 2017)</conf-name>
          <conf-date>Dec 4-9</conf-date>
          <conf-loc>Long Beach, CA</conf-loc>
        </nlm-citation>
      </ref>
      <ref id="ref88">
        <label>88</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Dogrucu</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Perucic</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Isaro</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Ball</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Toto</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Rundensteiner</surname>
              <given-names>EA</given-names>
            </name>
            <name name-style="western">
              <surname>Agu</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Davis-Martin</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Boudreaux</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>Moodable: on feasibility of instantaneous depression assessment using machine learning on voice samples with retrospectively harvested smartphone and social media data</article-title>
          <source>Smart Health</source>
          <year>2020</year>
          <month>07</month>
          <volume>17</volume>
          <fpage>100118</fpage>
          <pub-id pub-id-type="doi">10.1016/j.smhl.2020.100118</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref89">
        <label>89</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yue</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Ware</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Morillo</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Lu</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Shang</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Bi</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Kamath</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Russell</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Bamis</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>Automatic depression prediction using internet traffic characteristics on smartphones</article-title>
          <source>Smart Health (Amst)</source>
          <year>2020</year>
          <month>11</month>
          <volume>18</volume>
          <fpage>100137</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/33043105"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.smhl.2020.100137</pub-id>
          <pub-id pub-id-type="medline">33043105</pub-id>
          <pub-id pub-id-type="pii">100137</pub-id>
          <pub-id pub-id-type="pmcid">PMC7544007</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref90">
        <label>90</label>
        <nlm-citation citation-type="web">
          <article-title>New research reveals mobile users want phones to be more resilient with longer battery life</article-title>
          <source>PR Newswire</source>
          <year>2013</year>
          <access-date>2022-05-23</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.prnewswire.com/news-releases/new-research-reveals-mobile-users-want-phones-to-be-more-resilient-with-longer-battery-life-233725021.html">https://www.prnewswire.com/news-releases/new-research-reveals-mobile-users-want-phones-to-be-more-resilient-with-longer-battery-life-233725021.html</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref91">
        <label>91</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Guo</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>X</given-names>
            </name>
          </person-group>
          <article-title>Understanding application-battery interactions on smartphones: a large-scale empirical study</article-title>
          <source>IEEE Access</source>
          <year>2017</year>
          <volume>5</volume>
          <fpage>13387</fpage>
          <lpage>13400</lpage>
          <pub-id pub-id-type="doi">10.1109/access.2017.2728620</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref92">
        <label>92</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rooksby</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Morrison</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Murray-Rust</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Student perspectives on digital phenotyping: the acceptability of using smartphone data to assess mental health</article-title>
          <year>2019</year>
          <conf-name>2019 CHI Conference on Human Factors in Computing Systems</conf-name>
          <conf-date>May 4-9</conf-date>
          <conf-loc>Glasgow, Scotland</conf-loc>
          <pub-id pub-id-type="doi">10.1145/3290605.3300655</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref93">
        <label>93</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Saeb</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Lonini</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Jayaraman</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Mohr</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Kording</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>The need to approximate the use-case in clinical machine learning</article-title>
          <source>Gigascience</source>
          <year>2017</year>
          <month>05</month>
          <day>01</day>
          <volume>6</volume>
          <issue>5</issue>
          <fpage>1</fpage>
          <lpage>9</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/28327985"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/gigascience/gix019</pub-id>
          <pub-id pub-id-type="medline">28327985</pub-id>
          <pub-id pub-id-type="pii">3071704</pub-id>
          <pub-id pub-id-type="pmcid">PMC5441397</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref94">
        <label>94</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Murnane</surname>
              <given-names>EL</given-names>
            </name>
            <name name-style="western">
              <surname>Abdullah</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Matthews</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Kay</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Kientz</surname>
              <given-names>JA</given-names>
            </name>
            <name name-style="western">
              <surname>Choudhury</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Gay</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Cosley</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Mobile manifestations of alertness: connecting biological rhythms with patterns of smartphone app use</article-title>
          <source>MobileHCI</source>
          <year>2016</year>
          <month>09</month>
          <volume>2016</volume>
          <fpage>465</fpage>
          <lpage>477</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/30931436"/>
          </comment>
          <pub-id pub-id-type="doi">10.1145/2935334.2935383</pub-id>
          <pub-id pub-id-type="medline">30931436</pub-id>
          <pub-id pub-id-type="pmcid">PMC6436843</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref95">
        <label>95</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ing</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Sämann</surname>
              <given-names>PG</given-names>
            </name>
            <name name-style="western">
              <surname>Chu</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Tay</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Biondo</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Robert</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Jia</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Wolfers</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Desrivières</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Banaschewski</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Bokde</surname>
              <given-names>ALW</given-names>
            </name>
            <name name-style="western">
              <surname>Bromberg</surname>
              <given-names>U</given-names>
            </name>
            <name name-style="western">
              <surname>Büchel</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Conrod</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Fadai</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Flor</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Frouin</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Garavan</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Spechler</surname>
              <given-names>PA</given-names>
            </name>
            <name name-style="western">
              <surname>Gowland</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Grimmer</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Heinz</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Ittermann</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Kappel</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Martinot</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Meyer-Lindenberg</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Millenet</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Nees</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>van Noort</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Orfanos</surname>
              <given-names>DP</given-names>
            </name>
            <name name-style="western">
              <surname>Martinot</surname>
              <given-names>MP</given-names>
            </name>
            <name name-style="western">
              <surname>Penttilä</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Poustka</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Quinlan</surname>
              <given-names>EB</given-names>
            </name>
            <name name-style="western">
              <surname>Smolka</surname>
              <given-names>MN</given-names>
            </name>
            <name name-style="western">
              <surname>Stringaris</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Struve</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Veer</surname>
              <given-names>IM</given-names>
            </name>
            <name name-style="western">
              <surname>Walter</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Whelan</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Andreassen</surname>
              <given-names>OA</given-names>
            </name>
            <name name-style="western">
              <surname>Agartz</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Lemaitre</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Barker</surname>
              <given-names>ED</given-names>
            </name>
            <name name-style="western">
              <surname>Ashburner</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Binder</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Buitelaar</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Marquand</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Robbins</surname>
              <given-names>TW</given-names>
            </name>
            <name name-style="western">
              <surname>Schumann</surname>
              <given-names>G</given-names>
            </name>
            <collab>IMAGEN Consortium</collab>
          </person-group>
          <article-title>Identification of neurobehavioural symptom groups based on shared brain mechanisms</article-title>
          <source>Nat Hum Behav</source>
          <year>2019</year>
          <month>12</month>
          <volume>3</volume>
          <issue>12</issue>
          <fpage>1306</fpage>
          <lpage>1318</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://hal.archives-ouvertes.fr/hal-02443809"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41562-019-0738-8</pub-id>
          <pub-id pub-id-type="medline">31591521</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41562-019-0738-8</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref96">
        <label>96</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Natekin</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Knoll</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Gradient boosting machines, a tutorial</article-title>
          <source>Front Neurorobot</source>
          <year>2013</year>
          <volume>7</volume>
          <fpage>21</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/24409142"/>
          </comment>
          <pub-id pub-id-type="doi">10.3389/fnbot.2013.00021</pub-id>
          <pub-id pub-id-type="medline">24409142</pub-id>
          <pub-id pub-id-type="pmcid">PMC3885826</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref97">
        <label>97</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Suresh</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Alam</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Karkossa</surname>
              <given-names>Z</given-names>
            </name>
          </person-group>
          <article-title>Using peer support to strengthen mental health during the COVID-19 pandemic: a review</article-title>
          <source>Front Psychiatry</source>
          <year>2021</year>
          <volume>12</volume>
          <fpage>714181</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/34322045"/>
          </comment>
          <pub-id pub-id-type="doi">10.3389/fpsyt.2021.714181</pub-id>
          <pub-id pub-id-type="medline">34322045</pub-id>
          <pub-id pub-id-type="pmcid">PMC8310946</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref98">
        <label>98</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Reece</surname>
              <given-names>AG</given-names>
            </name>
            <name name-style="western">
              <surname>Danforth</surname>
              <given-names>CM</given-names>
            </name>
          </person-group>
          <article-title>Instagram photos reveal predictive markers of depression</article-title>
          <source>EPJ Data Sci</source>
          <year>2017</year>
          <month>08</month>
          <day>8</day>
          <volume>6</volume>
          <issue>1</issue>
          <fpage>15</fpage>
          <pub-id pub-id-type="doi">10.1140/epjds/s13688-017-0110-z</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref99">
        <label>99</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Manikonda</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>De Choudhury</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Modeling and understanding visual attributes of mental health disclosures in social media</article-title>
          <year>2017</year>
          <conf-name>2017 CHI Conference on Human Factors in Computing Systems</conf-name>
          <conf-date>May 6-11</conf-date>
          <conf-loc>Denver, CO</conf-loc>
          <pub-id pub-id-type="doi">10.1145/3025453.3025932</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref100">
        <label>100</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gaus</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Jolliff</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Moreno</surname>
              <given-names>MA</given-names>
            </name>
          </person-group>
          <article-title>A content analysis of YouTube depression personal account videos and their comments</article-title>
          <source>Comput Hum Behav Rep</source>
          <year>2021</year>
          <month>01</month>
          <volume>3</volume>
          <fpage>100050</fpage>
          <pub-id pub-id-type="doi">10.1016/j.chbr.2020.100050</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref101">
        <label>101</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kroenke</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Strine</surname>
              <given-names>TW</given-names>
            </name>
            <name name-style="western">
              <surname>Spitzer</surname>
              <given-names>RL</given-names>
            </name>
            <name name-style="western">
              <surname>Williams</surname>
              <given-names>JBW</given-names>
            </name>
            <name name-style="western">
              <surname>Berry</surname>
              <given-names>JT</given-names>
            </name>
            <name name-style="western">
              <surname>Mokdad</surname>
              <given-names>AH</given-names>
            </name>
          </person-group>
          <article-title>The PHQ-8 as a measure of current depression in the general population</article-title>
          <source>J Affect Disord</source>
          <year>2009</year>
          <month>04</month>
          <volume>114</volume>
          <issue>1-3</issue>
          <fpage>163</fpage>
          <lpage>173</lpage>
          <pub-id pub-id-type="doi">10.1016/j.jad.2008.06.026</pub-id>
          <pub-id pub-id-type="medline">18752852</pub-id>
          <pub-id pub-id-type="pii">S0165-0327(08)00282-6</pub-id>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
