<?xml version="1.0" encoding="UTF-8"?><!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "journalpublishing.dtd"><article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" dtd-version="2.0" xml:lang="en" article-type="research-article"><front><journal-meta><journal-id journal-id-type="nlm-ta">JMIR AI</journal-id><journal-id journal-id-type="publisher-id">ai</journal-id><journal-id journal-id-type="index">41</journal-id><journal-title>JMIR AI</journal-title><abbrev-journal-title>JMIR AI</abbrev-journal-title><issn pub-type="epub">2817-1705</issn><publisher><publisher-name>JMIR Publications</publisher-name><publisher-loc>Toronto, Canada</publisher-loc></publisher></journal-meta><article-meta><article-id pub-id-type="publisher-id">v5i1e69494</article-id><article-id pub-id-type="doi">10.2196/69494</article-id><article-categories><subj-group subj-group-type="heading"><subject>Original Paper</subject></subj-group></article-categories><title-group><article-title>Using Digital Phenotyping for Depression Screening in Community-Dwelling Older Adults: Bayesian Multilevel Hurdle Model Machine Learning Approach</article-title></title-group><contrib-group><contrib contrib-type="author" equal-contrib="yes"><name name-style="western"><surname>Chung</surname><given-names>Moo-Kwon</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff1">1</xref><xref ref-type="fn" rid="equal-contrib1">*</xref></contrib><contrib contrib-type="author" equal-contrib="yes"><name name-style="western"><surname>Lim</surname><given-names>Hyo-Sang</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff2">2</xref><xref ref-type="fn" rid="equal-contrib1">*</xref></contrib><contrib contrib-type="author" equal-contrib="yes"><name name-style="western"><surname>Lee</surname><given-names>Sang Yup</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff3">3</xref><xref ref-type="fn" rid="equal-contrib1">*</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Baek</surname><given-names>Hyo Seok</given-names></name><degrees>BSc</degrees><xref ref-type="aff" rid="aff4">4</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Lee</surname><given-names>Jinhee</given-names></name><degrees>MD</degrees><xref ref-type="aff" rid="aff5">5</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Lee</surname><given-names>Kyoung Joung</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff6">6</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Shin</surname><given-names>Taeksoo</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff7">7</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Kim</surname><given-names>Min-Hyuk</given-names></name><degrees>MD</degrees><xref ref-type="aff" rid="aff5">5</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Hwang</surname><given-names>Sangwon</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff8">8</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Urtnasan</surname><given-names>Erdenebayar</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff9">9</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Park</surname><given-names>Ji Young</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff10">10</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Kwon</surname><given-names>Dan Hee</given-names></name><degrees>BSc</degrees><xref ref-type="aff" rid="aff11">11</xref></contrib><contrib contrib-type="author" corresp="yes"><name name-style="western"><surname>Lee</surname><given-names>Jin-kyung</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff12">12</xref></contrib></contrib-group><aff id="aff1"><institution>Department of Global Public Administration, Yonsei University Mirae Campus</institution><addr-line>Wonju</addr-line><country>Republic of Korea</country></aff><aff id="aff2"><institution>Division of Software, Yonsei University Mirae Campus</institution><addr-line>Wonju</addr-line><country>Republic of Korea</country></aff><aff id="aff3"><institution>Department of Communication, Yonsei University Sinchon Campus</institution><addr-line>Seoul</addr-line><country>Republic of Korea</country></aff><aff id="aff4"><institution>Department of Computer Science, Yonsei University Mirae Campus</institution><addr-line>Wonju</addr-line><country>Republic of Korea</country></aff><aff id="aff5"><institution>Department of Psychiatry, Yonsei University Wonju College of Medicine</institution><addr-line>Wonju</addr-line><country>Republic of Korea</country></aff><aff id="aff6"><institution>Office of the President, Songho University</institution><addr-line>Hoengseong</addr-line><addr-line>Gangwon-do</addr-line><country>Republic of Korea</country></aff><aff id="aff7"><institution>Department of Business Administration, Yonsei University Mirae Campus</institution><addr-line>Wonju</addr-line><country>Republic of Korea</country></aff><aff id="aff8"><institution>Department of Precision Medicine, Yonsei University Wonju College of Medicine</institution><addr-line>Wonju</addr-line><country>Republic of Korea</country></aff><aff id="aff9"><institution>Division of AI Semiconductor, Yonsei University Mirae Campus</institution><addr-line>Wonju</addr-line><country>Republic of Korea</country></aff><aff id="aff10"><institution>Department of Social Welfare, Sangji University</institution><addr-line>Wonju</addr-line><country>Republic of Korea</country></aff><aff id="aff11"><institution>Department of Health Administration, Yonsei University Mirae Campus</institution><addr-line>Wonju</addr-line><country>Republic of Korea</country></aff><aff id="aff12"><institution>Health IT Center, Gachon University Gil Hospital</institution><addr-line>773, Namdong-daero, Namdong-gu</addr-line><addr-line>Incheon</addr-line><country>Republic of Korea</country></aff><contrib-group><contrib contrib-type="editor"><name name-style="western"><surname>Coristine</surname><given-names>Andrew</given-names></name></contrib></contrib-group><contrib-group><contrib contrib-type="reviewer"><name name-style="western"><surname>El-Gayar</surname><given-names>Omar</given-names></name></contrib><contrib contrib-type="reviewer"><name name-style="western"><surname>Chen</surname><given-names>Zequn</given-names></name></contrib></contrib-group><author-notes><corresp>Correspondence to Jin-kyung Lee, PhD, Health IT Center, Gachon University Gil Hospital, 773, Namdong-daero, Namdong-gu, Incheon, 21556, Republic of Korea, 82 32 460 8090; <email>2jinkyung.lee@gmail.com</email></corresp><fn fn-type="equal" id="equal-contrib1"><label>*</label><p>these authors contributed equally</p></fn></author-notes><pub-date pub-type="collection"><year>2026</year></pub-date><pub-date pub-type="epub"><day>15</day><month>5</month><year>2026</year></pub-date><volume>5</volume><elocation-id>e69494</elocation-id><history><date date-type="received"><day>01</day><month>12</month><year>2024</year></date><date date-type="rev-recd"><day>07</day><month>03</month><year>2026</year></date><date date-type="accepted"><day>10</day><month>03</month><year>2026</year></date></history><copyright-statement>&#x00A9; Moo-Kwon Chung, Hyo-Sang Lim, Sang Yup Lee, Hyo Seok Baek, Jinhee Lee, Kyoung Joung Lee, Taeksoo Shin, Min-Hyuk Kim, Sangwon Hwang, Erdenebayar Urtnasan, Ji Young Park, Dan Hee Kwon, Jin-kyung Lee. Originally published in JMIR AI (<ext-link ext-link-type="uri" xlink:href="https://ai.jmir.org">https://ai.jmir.org</ext-link>), 15.5.2026. </copyright-statement><copyright-year>2026</copyright-year><license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (<ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">https://creativecommons.org/licenses/by/4.0/</ext-link>), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR AI, is properly cited. The complete bibliographic information, a link to the original publication on <ext-link ext-link-type="uri" xlink:href="https://www.ai.jmir.org/">https://www.ai.jmir.org/</ext-link>, as well as this copyright and license information must be included.</p></license><self-uri xlink:type="simple" xlink:href="https://ai.jmir.org/2026/1/e69494"/><abstract><sec><title>Background</title><p>With the rapidly aging population, mental health among older adults has received growing attention. Although the likelihood of experiencing depressive symptoms is higher in late adulthood, older adults are more reluctant to visit a clinic due to the stigma surrounding mental health issues, and many remain undiagnosed and untreated. Digital phenotyping has emerged as a promising approach to mitigate this problem. Longitudinal monitoring via wearable devices can facilitate the timely identification of depressive symptoms in older adults. However, there has not been sufficient investigation to develop a machine learning approach that accounts for between-person and within-person characteristics.</p></sec><sec><title>Objective</title><p>This study aimed to investigate the utility of active and passive digital phenotyping data collected via wearable devices for monitoring the probability and severity of depressive symptoms. Specifically, we applied multilevel hurdle modeling within a machine learning framework to enable efficient depression screening in the general population, with a focus on community-dwelling older adults.</p></sec><sec sec-type="methods"><title>Methods</title><p>We analyzed 1011 cases reported by 147 older Korean adults for 2 years. Participants were asked to complete the 9-item Patient Health Questionnaire (PHQ-9) items in our mobile app during the last week of each month. In addition to the annual in-person data collection, we also collected active and passive sensing data from participants via smartphones and smartwatches. For dimensionality reduction on 44 features, parallel analysis and principal component analysis were used. With the extracted 6 principal components (PCs), a Bayesian multilevel hurdle model was used.</p></sec><sec sec-type="results"><title>Results</title><p>When constructing PCs, the weekly stress rating from active data and sleep-related features from passive data were the top 5 contributing features. Among the 6 PCs, the PC consisting of low psychological distress and high social support was significantly associated with depressive symptoms in community-dwelling older adults. This Bayesian multilevel hurdle model showed good performance in screening for depressive symptom severity (<italic>R</italic><sup>2</sup>=0.53) and in distinguishing between those with and without symptoms (area under the receiver operating characteristic curve=0.88 and <italic>F</italic><sub>1</sub>-score=0.75) on the test data. The between-person variance was larger than the within-person variance, especially in explaining the probability of depressive symptoms.</p></sec><sec sec-type="conclusions"><title>Conclusions</title><p>In mental health screening, active and passive digital phenotyping data can be used in conjunction with traditional clinical screening tools to monitor depressive symptoms among community-dwelling older adults. Dimensionality reduction via parallel analysis and principal component analysis can help identify latent risk profiles. Given the nested data structure and heterogeneity in depressive symptoms, a Bayesian multilevel hurdle model within a machine learning framework may be helpful for depression screening. Overall, digital phenotyping can be a useful tool for personalized, within-person health tracking, even after accounting for substantial between-person variance. We recommend future work to address data imbalance to further strengthen this approach.</p></sec></abstract><kwd-group><kwd>digital phenotyping</kwd><kwd>depression</kwd><kwd>older adults</kwd><kwd>machine learning</kwd><kwd>Bayesian modeling</kwd><kwd>multilevel modeling</kwd></kwd-group></article-meta></front><body><sec id="s1" sec-type="intro"><title>Introduction</title><p>Depression is a highly prevalent mental health disorder, with approximately 5% of the global population affected by this disease [<xref ref-type="bibr" rid="ref1">1</xref>]. Depression can be considered dangerous because it can lead to suicidal ideation when it is not appropriately treated in a timely manner [<xref ref-type="bibr" rid="ref1">1</xref>]. Despite its high prevalence, many people with depressive symptoms neither recognize their need for medical treatment nor receive appropriate medical care [<xref ref-type="bibr" rid="ref2">2</xref>,<xref ref-type="bibr" rid="ref3">3</xref>]. Within this group, one particularly vulnerable segment of society is older adults. In the developmental stage, late adulthood is the period of a higher likelihood of experiencing depressive symptoms [<xref ref-type="bibr" rid="ref4">4</xref>]. However, this population tends to have a strong taboo against seeing psychiatrists for their mental health [<xref ref-type="bibr" rid="ref5">5</xref>,<xref ref-type="bibr" rid="ref6">6</xref>]. Consequently, many older adults with depressive symptoms are likely to remain undiagnosed and untreated, which can increase their mortality and other health problems [<xref ref-type="bibr" rid="ref7">7</xref>].</p><p>Compared to many other physical health problems that are objectively screened by physical biomarkers, many mental health problems, such as depressive disorder, are diagnosed based exclusively on a client&#x2019;s subjective statements about experiencing symptoms [<xref ref-type="bibr" rid="ref8">8</xref>,<xref ref-type="bibr" rid="ref9">9</xref>]. Unless the patient is open and willing to undergo treatment, it is much harder to detect depressive symptoms and prescribe an appropriate treatment regimen at the onset of illness. The recent innovation of digital phenotyping has been receiving increasing global attention due to its potential to remotely monitor and screen for early signals of depressive symptoms [<xref ref-type="bibr" rid="ref9">9</xref>]. One of the biggest benefits of digital phenotyping is its ability to reduce recall bias, a prevalent issue in traditional screening methods. Traditional depression screening tools are limited by recall bias because they rely solely on retrospective survey measures. By using smart devices, digital phenotyping enables the collection of in situ data on participants&#x2019; mood, activity, sleep, and other behaviors [<xref ref-type="bibr" rid="ref10">10</xref>]. With digital phenotyping, it is possible to monitor real-time data regarding depressive symptoms and to identify individuals experiencing depressive symptoms promptly [<xref ref-type="bibr" rid="ref8">8</xref>]. Since digital phenotyping can enable real-time monitoring in natural settings, advances in smartphone technology have spurred academic interest in this area in psychiatry [<xref ref-type="bibr" rid="ref8">8</xref>]. By applying digital phenotyping to real-time monitoring, it is possible to reach out to those in need for early intervention. It would be helpful to identify individuals with depressive symptoms in the general population who may otherwise remain undetected.</p><p>In terms of the types of data collected in digital phenotyping, there are mainly 2 categories: active data and passive sensing data [<xref ref-type="bibr" rid="ref8">8</xref>]. Active data includes self-report survey responses collected through smartphone apps, and passive sensing data includes moment-by-moment data collected unintentionally by sensors (eg, step counts or sleep log data collected via smart wearable devices) [<xref ref-type="bibr" rid="ref9">9</xref>]. Active data is beneficial for understanding people&#x2019;s subjective perceptions of their moods, stress, and life experiences; however, one drawback of this method is that it requires significant human effort to respond to screening questionnaires. Passive sensing data, on the other hand, enables real-time status monitoring [<xref ref-type="bibr" rid="ref10">10</xref>] with easy access and minimal user input, which has attracted attention in psychiatry, particularly in studies on depression [<xref ref-type="bibr" rid="ref11">11</xref>]. However, collecting passive sensing data often requires additional expensive digital devices (eg, smartwatches). Interestingly, despite the large number of theoretical frameworks, there have been relatively few empirical studies that build machine learning models using both active and passive digital phenotyping features. This might be because collecting digital phenotyping features from a large sample requires abundant funding and resources. Although smartphones are prevalent, the features of digital phenotyping that can be collected only by smartphones are limited, which can result in a modest sample size. The potential cost burdens that may arise when incorporating digital phenotyping into practice settings pose a risk that significantly diminishes its benefits for monitoring individuals experiencing depressive symptoms, especially in socioeconomically disadvantaged communities or those with limited access to medical services. Using a Bayesian machine learning approach, this study aims to explore how digital phenotyping features collected by smartphones and smartwatches can be used to screen for depressive symptoms among community-dwelling older adults. By doing this, we aim to examine how we can leverage active and passive digital phenotyping features despite the challenge of a moderate sample size.</p><p>In this study, one careful methodological consideration is the data structure accumulated in real-time monitoring. Given the nested longitudinal structure of the data, collected features should be treated differently at at least 2 levels: time-varying and time-invariant covariates. Despite the rapid increase in academic interest in machine learning algorithms following the rise of artificial intelligence, many machine learning studies have been based on cross-sectional designs. There has not been sufficient consideration of how to handle longitudinal data collected over different time points. To handle nested data appropriately, this study will combine a machine learning approach with a 2-level Bayesian multilevel model comprising within-person and between-person levels.</p><p>Expanding on the Bayesian multilevel model using digital phenotyping data, this study uses a hurdle model. Digital phenotyping enables easy data collection from the general population to screen for depressive symptoms. When screening a general population for depressive symptoms longitudinally, various depressive symptom trajectories are often reported. Although there is no consensus on how many trajectories exist or how these trajectory patterns appear, it is commonly reported that there is a significant proportion of those who have a stable low probability of depression, and that there are qualitatively heterogeneous groups experiencing different levels of depressive symptoms and varying levels of changes in depressive symptoms [<xref ref-type="bibr" rid="ref12">12</xref>-<xref ref-type="bibr" rid="ref14">14</xref>]. Those who have experienced depressive symptoms in the past are more vulnerable to depressive symptoms in the future [<xref ref-type="bibr" rid="ref15">15</xref>]. Furthermore, those who have subthreshold depressive symptoms tend to experience more fluctuations in depressive symptoms over time [<xref ref-type="bibr" rid="ref16">16</xref>]. It is common to see a large proportion of zeros in depressive symptoms when analyzing depression trajectories with longitudinal data from the general population. Since those without depressive symptoms differ qualitatively from those with depressive symptoms, applying a single regression or classification model to the entire dataset may not yield accurate estimates of feature importance. To address this issue, the zero-inflated model has been widely used for 9-item Patient Health Questionnaire (PHQ-9) data. However, when considering the theoretical assumption of sampling zeros, a hurdle model would be more appropriate to apply than the zero-inflated model [<xref ref-type="bibr" rid="ref17">17</xref>]. In the zero-inflated model, structural zeros are treated differently from sampling zeros. For example, sampling zeros include cases where none are obtained despite trying, while structural zeros are cases of never trying. However, for the PHQ-9, a total score of 0 indicates no depressive symptoms. In other words, sampling zeros exactly reflect structural zeros. In a hurdle model, all sampling zeros are assumed to indicate true structural zeros [<xref ref-type="bibr" rid="ref17">17</xref>,<xref ref-type="bibr" rid="ref18">18</xref>]. Thus, this study will use a Bayesian multilevel hurdle model to examine the presence and severity of depressive symptoms in community-dwelling older adults. To better explain the associations between covariates and the target outcome variable, a hurdle model estimates 2 regression equations [<xref ref-type="bibr" rid="ref17">17</xref>,<xref ref-type="bibr" rid="ref18">18</xref>]. In the binary part, the hurdle model uses logistic regression to estimate the probability of having any depressive symptoms vs none [<xref ref-type="bibr" rid="ref17">17</xref>,<xref ref-type="bibr" rid="ref18">18</xref>]. In the continuous part, the hurdle model estimates linear regression coefficients for the severity of depressive symptoms among those with nonzero depressive symptom scores [<xref ref-type="bibr" rid="ref17">17</xref>,<xref ref-type="bibr" rid="ref18">18</xref>].</p><p>In summary, this study aims to investigate how active and passive digital phenotyping data collected from wearable devices can help monitor depressive symptoms in community-dwelling older adults using a Bayesian hurdle model with 2-level longitudinal data within a machine learning framework.</p></sec><sec id="s2" sec-type="methods"><title>Methods</title><sec id="s2-1"><title>Procedure</title><p>To develop a machine learning algorithm for depressive symptoms in older adults, we recruited 685 Korean adults in their 50s to 80s residing in Wonju, a large city with both urban and rural areas in South Korea. The inclusion criteria were voluntary participation in this study, being 55 years of age or older, having no cognitive impairments, no alcohol or substance use disorders, no physical disabilities, and being able to concentrate throughout the 1.5-hour baseline interview. Data from 2 participants were excluded because they were identified as duplicates. Of 683 older adults who visited our campus and completed a one-on-one interview with our trained researchers, 411 participants agreed to monitor their depressive symptoms longitudinally and to install our smartphone app, developed exclusively for this research. Through in-person baseline data collection, participants reported their demographic characteristics, physical health, and psychological functioning using traditional survey tools. Soon after, we developed a smartphone app to monitor the depressive symptoms of the participants, which invited the participants to report their daily mood, weekly stress exposure, and monthly depressive symptoms. These app-based surveys collected active data over approximately 24 months (from March 2021 to March 2023) through smartphones. In total, 4566 cases reported by 352 respondents were included in the analysis, which included in-person annual screening data and active data (ie, mobile app survey responses), such as monthly PHQ-9 scores. For passive sensing data, however, the sample size became smaller due to the limited number of available smartwatches for the research. Our smartphone app, designed for daily, weekly, and monthly mobile app surveys, was also linked to the Samsung Health app, allowing step counts and sleep log data collected from smartwatches to be sent to our server through collaboration. The study protocol was published in an international, peer-reviewed medical journal [<xref ref-type="bibr" rid="ref19">19</xref>]. In this study, we analyzed 1011 cases collected via smartwatches from 147 participants, including active and passive sensing data alongside traditional in-person survey tools.</p></sec><sec id="s2-2"><title>Measures</title><p>Subjective depressive symptoms were measured by PHQ-9 [<xref ref-type="bibr" rid="ref20">20</xref>] within our smartphone app. In this study, we used 2 types of depressive symptoms as independent outcome variables. To investigate the association between digital phenotyping and depressive symptom severity, we first used the total PHQ-9 score as the outcome for the continuous part. In addition, to explore the potential application of our model for screening individuals with depressive symptoms in the general population, we also classified structural zeros vs nonzeros for the outcome in the binary part of our model.</p><p>Features extracted from active data collection from the participants&#x2019; reports through the smartphone app included the average and SD of the daily mood score, which ranged from very good &#x201C;(1)&#x201D; to very depressed &#x201C;(5)&#x201D; during a month, the average score and its SD of weekly stress exposure during a month, the frequency that a participant was exposed to stress related to their job, the frequency that a participant was exposed to stress related to interpersonal relationships, the frequency that a participant was exposed to stress related to major life events (ie, death, divorce, marriage, or birth), the frequency that a participant was exposed to stress related to health problems, the frequency that a participant was exposed to stress related to financial issues, and the frequency that a participant was exposed to stress related to extraordinary traumatic life events (eg, a crime, a natural disaster, or an accident) during each month.</p><p>Features extracted from passive sensing data collection included the average and SD of daily step counts during a month, the average duration (in minutes) spent in deep sleep, the average duration (in minutes) spent in light sleep, and the average duration (in minutes) spent in rapid eye movement (REM) sleep during daily sleep within a month, the average duration (in minutes) and SD of the first nonawake sleep stage after getting into bed, the average duration (in minutes) and SD of the last nonawake sleep stage before waking up, the efficacy of daily sleep, the frequency of awakening longer than 5 minutes during a night, and the difference between the average sleep duration on a weekday vs the average sleep duration on a weekend. All features were standardized before running the analyses.</p><p>In addition, the month variable and 3 categorical variables for seasons were also time-varying features, but we treated them differently. Given our assumption that depression is not linearly changing over time, we added 3 binary variables to reflect the 4 seasons. Given that summer has the longest period of sunlight, we set summer as the reference season, and other seasons (spring, fall, and winter) were coded as binary variables. After that, we tested the direct associations between the month variable or the 3 categorical variables and depressive symptom outcome variables. We found a significant relationship with the month variable, but we did not detect any significant direct relationships between the 3 seasonal binary variables and any outcome variable. Thus, we included only the month variable as the time variable in the final Bayesian model. For the 3 seasonal binary variables, we included them in the principal component analysis (PCA) with other features, but we did not include them separately from the principal components (PCs) in the final Bayesian model.</p><p>As constant features which were unchanging over time, demographic characteristics included participants&#x2019; sex (1: male; 0: female), age, education, average monthly income, the number of family members in a household, marital status (1: married and living with a spouse; 0: else), and whether a participant worked in agriculture (1: yes; 0: no). The monthly income was log-transformed because it was nonnormal. To screen participants&#x2019; physical and mental health conditions, features were included such as whether a participant regularly exercised (1: yes; 0: no), whether a participant had a history of smoking (1: yes; 0: no), how many alcoholic drinks a participant consumed in a month, how many hours a participant slept in a day, how many chronic diseases a participant had experienced in their lifetime, whether a participant had ever been diagnosed with major depressive disorder at a clinic, how many depressive episodes a participant had ever experienced in their lifetime based on the Mini-International Neuropsychiatric Interview (MINI) [<xref ref-type="bibr" rid="ref21">21</xref>], the degree of generalized anxiety disorder based on the total score of the 7-item Generalized Anxiety Disorder scale (GAD-7) [<xref ref-type="bibr" rid="ref22">22</xref>], the degree of loneliness based on the total score of the 20-item University of California Los Angeles Loneliness Scale (UCLA Loneliness) [<xref ref-type="bibr" rid="ref23">23</xref>], the degree of perceived social support based on the total score of the 12-item Multidimensional Scale of Perceived Social Support (MSPSS) [<xref ref-type="bibr" rid="ref24">24</xref>], and the number of types of early childhood traumas based on the total score of the 27-item Early Trauma Inventory&#x2013;Short Form (ETI-SF) [<xref ref-type="bibr" rid="ref25">25</xref>].</p></sec><sec id="s2-3"><title>Statistical Analysis</title><p>As a machine learning approach, we split the data at the observational level chronologically for each participant into 80% for training and 20% for testing. During data preprocessing, we examined all features from in-person, active, and passive sensing data and used Multiple Imputation by Chained Equations (MICE) to impute missing values separately to avoid data leakage. Of 1011 cases in total, 5 (0.49%) cases were missing from the daily mood surveys, and 22 (2.18%) cases were missing from the weekly stress surveys within the active data. Also, 11 (1.09%) cases did not have an answer about the number of depressive episodes in one&#x2019;s lifetime in the in-person data. On the other hand, passive sensing data were largely complete, except for step counts. Because passive sensing data were collected at the millisecond level while depressive symptoms were assessed monthly, it was hard to observe missing data in passive sensing. In this study, we transformed all active and passive sensing features to the month level. Regarding step counts, 157 (15.53%) cases were treated as missing due to a technical transmission issue. That is, smartwatch-recorded step counts were not consistently transmitted to the server, whereas smartphone-recorded step counts were accurately captured. Upon identifying this issue during participant house visits, the collected step count data during this period were treated as missing to avoid the use of inaccurate values. Accordingly, MICE was applied to address these technically induced missing values, assuming that missingness was unrelated to depressive symptoms or physical activity behaviors. When imputing missing data among 43 features using MICE, we included the ID and time to preserve the longitudinal data structure. After that, to reduce feature dimensionality, PCA was performed. Using the recipes workflow in R, variables were first standardized to a mean of 0 and an SD of 1. The number of PCs to retain was determined using parallel analysis and the Cattell scree test. For PCA, we conducted a parallel analysis to determine the number of PCs for data reduction. In the PCA stage, using the recipe function, we calculated the means and SDs of the parameters from the training data and computed the PCA rotation. We applied these parameters to both the training and test data.</p><p>When we developed the machine learning algorithm, we used Bayesian modeling in R, considering our sample size. Unlike frequentist methods such as traditional linear or logistic regression models, which produce a single value for each estimate, Bayesian models use a posterior distribution by Markov Chain Monte Carlo sampling for each model parameter. By accounting for model uncertainty, a Bayesian model is known to produce more accurate estimates, and its benefits are even more pronounced when the sample size is modest. We used 4 chains, 4000 iterations, 4 cores, and 2000 warmup iterations. To account for the longitudinal data structure, with repeated measurements from participants, we used Bayesian multilevel modeling with the &#x201C;<italic>brms</italic>&#x201D; package and included a random intercept for individual ID. Finally, we used the hurdle model to account for the presence and severity of symptoms. By using 2 separate equations, such as regression in the continuous part and logistic regression in the binary part, the hurdle model aims to explain the probability of having depression and the severity of depressive symptoms effectively. Model coefficients were estimated using the training data, and we evaluated predictive performance and generalizability on independent test data. The model evaluation metrics for the continuous part, when the outcome is the total depressive symptom score, included <italic>R</italic><sup>2</sup>, root-mean-square error (RMSE), and mean absolute error (MAE). Model evaluation metrics for the binary part, when the outcome is the probability of having depression, included the area under the receiver operating characteristic curve (AUC-ROC), precision, sensitivity, specificity, and <italic>F</italic><sub>1</sub>-score. In the Bayesian multilevel hurdle model with 2 types of outcome variables, each parameter was reported with a regression coefficient, 95% credible intervals (CrIs), R-hat, bulk effective sample size (bulk-ESS), and tail-ESS. For the model diagnostics of the Bayesian multilevel hurdle model, we assessed model adequacy using posterior predictive checks, comparing observed data with replicated datasets drawn from the posterior predictive distribution. We also conducted Pareto smoothed importance sampling leave-one-out (PSIS-LOO) cross-validation. The reliability of the PSIS-LOO approximation was assessed using Pareto k diagnostic values.</p></sec><sec id="s2-4"><title>Ethical Considerations</title><p>Before collecting the data, the Institutional Review Board of the Yonsei University Mirae Campus (IRB no 1041849&#x2010;202401-SB-020-11) reviewed and approved all the procedures and measures involving human participants in this research. All participants provided written informed consent to participate in this study. All obtained data were deidentified. Participants received 30,000 won (approximately US $21.29) after completing the baseline in-person survey and received 10,000 Won (approximately US $7) every 3 months based on their completion rates in mobile app surveys. In this paper, no identification of individual participants is included in any text, images, or tables.</p></sec></sec><sec id="s3" sec-type="results"><title>Results</title><sec id="s3-1"><title>Attrition Analysis Results</title><p>Among 411 participants who installed our smartphone app for data collection exclusively for research purposes, depressive symptoms (PHQ-9) and active data (eg, daily mood and weekly stress) were collected through the app from 352 participants. Passive sensing data (eg, daily step counts and sleep logs in milliseconds) were collected from 147 participants using a Samsung Galaxy smartwatch in addition to our mobile app. The sample characteristics of the participants in our datasets are presented in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>. As shown in <xref ref-type="supplementary-material" rid="app2">Multimedia Appendix 2</xref>, logistic regression was conducted to assess whether attrition bias was associated with demographic characteristics and health-related information. Regarding attrition for passive sensing data, there was no noticeable difference in all characteristics between 147 participants with smartwatches and 205 participants without smartwatches. Further, we tested for attrition bias in the outcome variables; however, no group difference was found due to attrition in the active and passive digital phenotyping data (<italic>t</italic><sub>350</sub>=0.94; <italic>P</italic>=.35 for the severity of depressive symptoms and <italic>t</italic><sub>350</sub>=&#x2212;0.13; <italic>P</italic>=.89 for the probability of experiencing depressive symptoms).</p></sec><sec id="s3-2"><title>Parallel Analysis and PCA Results for Dimensional Reduction</title><p>To reduce the feature dimensionality, we first conducted parallel analysis and PCA. <xref ref-type="fig" rid="figure1">Figure 1</xref> shows the scree plot from the parallel analysis, and <xref ref-type="table" rid="table1">Table 1</xref> shows the PCA results with eigenvalues greater than 1.0 retained. While the Kaiser criterion (eigenvalues &#x003E;1) suggested 16 components, the parallel analysis results indicated that 12 components significantly exceeded the eigenvalues of a random dataset. However, we needed to reduce the number of PCs given the total sample size, and the scree plot showed that the slope flattened after the sixth component (<xref ref-type="fig" rid="figure1">Figure 1</xref>). We ultimately retained 6 components for interpretability, accounting for 36.53% of the total variance (<xref ref-type="table" rid="table1">Table 1</xref>).</p><fig position="float" id="figure1"><label>Figure 1.</label><caption><p>Parallel analysis scree plot for determining the number of principal components (PCs). Blue X marks on the line indicate eigenvalues of PCs produced from the observed dataset. A red dotted line indicates the average eigenvalues from randomly generated datasets. A red long-dashed line indicates eigenvalues from bootstrapped samples. In this plot, the red dotted line and the red long-dashed line overlap.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="ai_v5i1e69494_fig01.png"/></fig><table-wrap id="t1" position="float"><label>Table 1.</label><caption><p>Principal component analysis results.</p></caption><table id="table1" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Principal components (n)</td><td align="left" valign="bottom">Eigenvalue</td><td align="left" valign="bottom">Percent of total variance explained</td><td align="left" valign="bottom">Cumulative percent of total variance explained</td></tr></thead><tbody><tr><td align="left" valign="top">1</td><td align="left" valign="top">4.14</td><td align="left" valign="top">9.62</td><td align="left" valign="top">9.62</td></tr><tr><td align="left" valign="top">2</td><td align="left" valign="top">2.83</td><td align="left" valign="top">6.59</td><td align="left" valign="top">16.22</td></tr><tr><td align="left" valign="top">3</td><td align="left" valign="top">2.44</td><td align="left" valign="top">5.67</td><td align="left" valign="top">21.88</td></tr><tr><td align="left" valign="top">4</td><td align="left" valign="top">2.32</td><td align="left" valign="top">5.39</td><td align="left" valign="top">27.27</td></tr><tr><td align="left" valign="top">5</td><td align="left" valign="top">2.17</td><td align="left" valign="top">5.05</td><td align="left" valign="top">32.32</td></tr><tr><td align="left" valign="top">6</td><td align="left" valign="top">1.81</td><td align="left" valign="top">4.22</td><td align="left" valign="top">36.53</td></tr><tr><td align="left" valign="top">7</td><td align="left" valign="top">1.64</td><td align="left" valign="top">3.82</td><td align="left" valign="top">40.35</td></tr><tr><td align="left" valign="top">8</td><td align="left" valign="top">1.53</td><td align="left" valign="top">3.56</td><td align="left" valign="top">43.91</td></tr><tr><td align="left" valign="top">9</td><td align="left" valign="top">1.49</td><td align="left" valign="top">3.48</td><td align="left" valign="top">47.38</td></tr><tr><td align="left" valign="top">10</td><td align="left" valign="top">1.39</td><td align="left" valign="top">3.24</td><td align="left" valign="top">50.62</td></tr><tr><td align="left" valign="top">11</td><td align="left" valign="top">1.32</td><td align="left" valign="top">3.07</td><td align="left" valign="top">53.69</td></tr><tr><td align="left" valign="top">12</td><td align="left" valign="top">1.22</td><td align="left" valign="top">2.84</td><td align="left" valign="top">56.53</td></tr><tr><td align="left" valign="top">13</td><td align="left" valign="top">1.16</td><td align="left" valign="top">2.69</td><td align="left" valign="top">59.22</td></tr><tr><td align="left" valign="top">14</td><td align="left" valign="top">1.14</td><td align="left" valign="top">2.66</td><td align="left" valign="top">61.88</td></tr><tr><td align="left" valign="top">15</td><td align="left" valign="top">1.11</td><td align="left" valign="top">2.58</td><td align="left" valign="top">64.45</td></tr><tr><td align="left" valign="top">16</td><td align="left" valign="top">1.08</td><td align="left" valign="top">2.52</td><td align="left" valign="top">66.97</td></tr></tbody></table></table-wrap><p><xref ref-type="table" rid="table2">Table 2</xref> shows the factor loadings of the top 5 contributing features for 6 PCs. For PC1, anxiety (&#x03BB;=0.32), social support (&#x03BB;=&#x2212;0.32), loneliness (&#x03BB;=0.29), the average of daily negative mood (&#x03BB;=0.27), and the average weekly stress (&#x03BB;=0.27) had higher factor loadings. This PC represented a dimension of psychological stress and low social support. The eigenvalue of PC1 was 4.14, which explained 9.62% of the total variance. For PC2, the top 5 contributing features were participants&#x2019; gender (&#x03BB;=0.40 for males), smoking (&#x03BB;=0.40), sleep time in the light sleep stage (&#x03BB;=0.27), sleep time in the deep sleep stage (&#x03BB;=0.24), and education level (&#x03BB;=0.23). This PC reflected a high-sleep, educated, male smoker profile. It had an eigenvalue of 2.83 and explained 6.59% of the total variance. Combining participants&#x2019; demographic and psychological characteristics, PC3 reflected another profile. To be specific, income (&#x03BB;=0.36), the average weekly stress (&#x03BB;=0.28), SD of weekly stress (&#x03BB;=0.26), and education level (&#x03BB;=0.24) had positive factor loadings, while loneliness (&#x03BB;=&#x2212;0.26) had negative factor loadings for this PC. This PC reflected a high socioeconomic status, high-stress, and low-loneliness profile. It had an eigenvalue of 2.44 and explained 5.67% of the total variance. For PC4, light sleep minutes (&#x03BB;=&#x2212;0.33), REM sleep minutes (&#x03BB;=&#x2212;0.33), and deep sleep minutes (&#x03BB;=&#x2212;0.31) had higher factor loadings in a negative direction, whereas smoking (&#x03BB;=0.25) and male (&#x03BB;=0.25) had positive factor loadings. PC4 reflected a profile of a male smoker with low sleep duration. This PC had an eigenvalue of 2.32 and explained 5.39% of the total variance. For PC5, SD of sleep onset time (&#x03BB;=0.29), working in agriculture (&#x03BB;=0.28), and married status (&#x03BB;=0.27) had positive factor loadings, while drinking (&#x03BB;=&#x2212;0.33) and total sleep hours (&#x03BB;=-0.21) had negative factor loadings. This PC reflected a farmer&#x2019;s profile with irregular sleep. It had an eigenvalue of 2.17 and explained 5.05% of the total variance. For PC6, higher factor loadings were found when participants had a higher education level (&#x03BB;=0.39), walked less (&#x03BB;=&#x2212;0.34), had a higher income (&#x03BB;=0.30), had more family members (&#x03BB;=0.30), and had greater loneliness (&#x03BB;=0.26). This PC reflected a high socioeconomic status, low-activity, and high-loneliness profile. It had an eigenvalue of 1.81 and explained 4.22% of the total variance.</p><table-wrap id="t2" position="float"><label>Table 2.</label><caption><p>Top 5 contributing features for the 6 principal components.</p></caption><table id="table2" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Component and top 5 features</td><td align="left" valign="bottom">Loading</td></tr></thead><tbody><tr><td align="left" valign="top" colspan="2">Principal component 1</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Anxiety</td><td align="left" valign="top">0.32</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Social support</td><td align="left" valign="top">&#x2212;0.32</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Loneliness</td><td align="left" valign="top">0.29</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Mean of daily negative mood</td><td align="left" valign="top">0.27</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Mean of weekly stress</td><td align="left" valign="top">0.27</td></tr><tr><td align="left" valign="top" colspan="2">Principal component 2</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Male</td><td align="left" valign="top">0.40</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Smoking</td><td align="left" valign="top">0.40</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Light sleep minutes</td><td align="left" valign="top">0.27</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Deep sleep minutes</td><td align="left" valign="top">0.24</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Education</td><td align="left" valign="top">0.23</td></tr><tr><td align="left" valign="top" colspan="2">Principal component 3</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Income</td><td align="left" valign="top">0.36</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Mean of weekly stress</td><td align="left" valign="top">0.28</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>SD of weekly stress</td><td align="char" char="." valign="top">0.26</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Loneliness</td><td align="left" valign="top">&#x2212;0.26</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Education</td><td align="left" valign="top">0.24</td></tr><tr><td align="left" valign="top" colspan="2">Principal component 4</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Light sleep minutes</td><td align="left" valign="top">&#x2212;0.33</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>REM<sup><xref ref-type="table-fn" rid="table2fn1">a</xref></sup> sleep minutes</td><td align="left" valign="top">&#x2212;0.33</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Deep sleep minutes</td><td align="left" valign="top">&#x2212;0.31</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Smoking</td><td align="left" valign="top">0.25</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Male</td><td align="left" valign="top">0.25</td></tr><tr><td align="left" valign="top" colspan="2">Principal component 5</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Drinking</td><td align="left" valign="top">&#x2212;0.33</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>SD of sleep onset time</td><td align="left" valign="top">0.29</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Employed in agriculture</td><td align="left" valign="top">0.28</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Married status</td><td align="left" valign="top">0.27</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Total sleep hours</td><td align="left" valign="top">&#x2212;0.21</td></tr><tr><td align="left" valign="top" colspan="2">Principal component 6</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Education</td><td align="left" valign="top">0.39</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Mean of daily step counts</td><td align="left" valign="top">&#x2212;0.34</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Income</td><td align="left" valign="top">0.30</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Family size</td><td align="left" valign="top">0.30</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Loneliness</td><td align="left" valign="top">0.26</td></tr></tbody></table><table-wrap-foot><fn id="table2fn1"><p><sup>a</sup>REM: rapid eye movement.</p></fn></table-wrap-foot></table-wrap></sec><sec id="s3-3"><title>Bayesian Multilevel Hurdle Model for the Continuous Part: Total Score of Depressive Symptoms in Older Adults</title><p>In this continuous part, the outcome variable was the severity of depressive symptoms measured by the original PHQ-9 total score, ranging from 0 to 27. <xref ref-type="table" rid="table3">Table 3</xref> shows the model results, including a regression coefficient for each PC. Among the 6 PCs, the first (<italic>&#x03B3;</italic>=0.15, 95% CrI 0.08&#x2010;0.23) and the fourth (<italic>&#x03B3;</italic>=0.09, 95% CrI 0.01&#x2010;0.18) were significantly associated with depressive symptom severity among community-dwelling older adults. That is, the severity of depressive symptoms was likely to be higher when a community-dwelling older adult experienced greater psychological distress and lower social support (PC1). Also, the severity of depressive symptoms was likely to be higher when an older adult had shorter REM, light, and deep sleep and was male with greater smoking. A significant variance in the intercepts (variance 0.435, 95% CrI 0.24&#x2010;0.76) indicates differences in depressive symptom severity across individuals. However, no significant trend over time was found (<italic>&#x03B3;</italic>=&#x2212;0.02, 95% CrI &#x2013;0.03 to 0.00). R-hat measures whether the Markov Chain Monte Carlo chains have converged to the same posterior distribution. All R-hat values for the parameters were 1.00, indicating excellent convergence. Bulk-ESS shows whether the posterior mean is reliable, and tail-ESS shows whether CrIs are reliable. Bulk-ESS greater than 1000 and tail-ESS greater than 1000 are regarded as excellent. Bulk-ESS and tail-ESS were large enough, ranging from 3162 to 6267.</p><table-wrap id="t3" position="float"><label>Table 3.</label><caption><p>Bayesian multilevel hurdle model estimates for the depressive symptoms.</p></caption><table id="table3" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Depressive symptom</td><td align="left" valign="bottom">Estimate (95% CrI<sup><xref ref-type="table-fn" rid="table3fn1">a</xref></sup>)</td><td align="left" valign="bottom">Estimate error</td><td align="left" valign="bottom">R-hat</td><td align="left" valign="bottom">Bulk-ESS<sup><xref ref-type="table-fn" rid="table3fn2">b</xref></sup></td><td align="left" valign="bottom">Tail-ESS<sup><xref ref-type="table-fn" rid="table3fn3">c</xref></sup></td></tr></thead><tbody><tr><td align="left" valign="top" colspan="6">Fixed effects</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Continuous part</td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Intercept</td><td align="char" char="." valign="top">0.78 (0.51 to 1.04)</td><td align="char" char="." valign="top">0.14</td><td align="char" char="." valign="top">1.00</td><td align="char" char="." valign="top">5544</td><td align="char" char="." valign="top">5945</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>PC1<sup><xref ref-type="table-fn" rid="table3fn4">d</xref></sup></td><td align="char" char="." valign="top">0.15 (0.08 to 0.23)</td><td align="char" char="." valign="top">0.04</td><td align="char" char="." valign="top">1.00</td><td align="char" char="." valign="top">3327</td><td align="char" char="." valign="top">4148</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>PC2</td><td align="char" char="." valign="top">0.01 (&#x2013;0.08 to 0.10)</td><td align="char" char="." valign="top">0.05</td><td align="char" char="." valign="top">1.00</td><td align="char" char="." valign="top">3162</td><td align="char" char="." valign="top">4615</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>PC3</td><td align="char" char="." valign="top">&#x2013;0.09 (&#x2013;0.18 to 0.00)</td><td align="char" char="." valign="top">0.05</td><td align="char" char="." valign="top">1.00</td><td align="char" char="." valign="top">3378</td><td align="char" char="." valign="top">4694</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>PC4</td><td align="char" char="." valign="top">0.09 (0.01 to 0.18)</td><td align="char" char="." valign="top">0.04</td><td align="char" char="." valign="top">1.00</td><td align="char" char="." valign="top">3647</td><td align="char" char="." valign="top">5729</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>PC5</td><td align="char" char="." valign="top">0.03 (&#x2013;0.07 to 0.14)</td><td align="char" char="." valign="top">0.05</td><td align="char" char="." valign="top">1.00</td><td align="char" char="." valign="top">4391</td><td align="char" char="." valign="top">5859</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>PC6</td><td align="char" char="." valign="top">0.05 (&#x2013;0.05 to 0.15)</td><td align="char" char="." valign="top">0.05</td><td align="char" char="." valign="top">1.00</td><td align="char" char="." valign="top">4286</td><td align="char" char="." valign="top">5348</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Month</td><td align="char" char="." valign="top">&#x2013;0.02 (&#x2013;0.03 to 0.00)</td><td align="char" char="." valign="top">0.01</td><td align="char" char="." valign="top">1.00</td><td align="char" char="." valign="top">8307</td><td align="char" char="." valign="top">6267</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Binary part</td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Intercept</td><td align="char" char="." valign="top">&#x2013;1.36 (&#x2013;2.29 to &#x2013;0.47)</td><td align="char" char="." valign="top">0.46</td><td align="char" char="." valign="top">1.00</td><td align="char" char="." valign="top">2817</td><td align="char" char="." valign="top">4779</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>PC1</td><td align="char" char="." valign="top">&#x2013;0.79 (&#x2013;1.12 to &#x2013;0.49)</td><td align="char" char="." valign="top">0.16</td><td align="char" char="." valign="top">1.00</td><td align="char" char="." valign="top">2792</td><td align="char" char="." valign="top">4282</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>PC2</td><td align="char" char="." valign="top">0.07 (&#x2013;0.29 to 0.43)</td><td align="char" char="." valign="top">0.18</td><td align="char" char="." valign="top">1.00</td><td align="char" char="." valign="top">2336</td><td align="char" char="." valign="top">3958</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>PC3</td><td align="char" char="." valign="top">&#x2013;0.18 (&#x2013;0.51 to 0.15)</td><td align="char" char="." valign="top">0.17</td><td align="char" char="." valign="top">1.00</td><td align="char" char="." valign="top">2851</td><td align="char" char="." valign="top">4578</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>PC4</td><td align="char" char="." valign="top">&#x2013;0.22 (&#x2013;0.52 to 0.08)</td><td align="char" char="." valign="top">0.15</td><td align="char" char="." valign="top">1.00</td><td align="char" char="." valign="top">3379</td><td align="char" char="." valign="top">4768</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>PC5</td><td align="char" char="." valign="top">&#x2013;0.09 (&#x2013;0.43 to 0.24)</td><td align="char" char="." valign="top">0.17</td><td align="char" char="." valign="top">1.00</td><td align="char" char="." valign="top">3359</td><td align="char" char="." valign="top">5312</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>PC6</td><td align="char" char="." valign="top">0.05 (&#x2013;0.31 to 0.41)</td><td align="char" char="." valign="top">0.18</td><td align="char" char="." valign="top">1.00</td><td align="char" char="." valign="top">3850</td><td align="char" char="." valign="top">5927</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Month</td><td align="char" char="." valign="top">0.11 (0.06 to 0.17)</td><td align="char" char="." valign="top">0.03</td><td align="char" char="." valign="top">1.00</td><td align="char" char="." valign="top">6808</td><td align="char" char="." valign="top">5793</td></tr><tr><td align="left" valign="top" colspan="6">Random effects</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>SD (intercept: continuous part)</td><td align="char" char="." valign="top">0.66 (0.49 to 0.87)</td><td align="char" char="." valign="top">0.1</td><td align="char" char="." valign="top">1.00</td><td align="char" char="." valign="top">2821</td><td align="char" char="." valign="top">4134</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>SD (intercept: binary part)</td><td align="char" char="." valign="top">3.07 (2.31 to 4.06)</td><td align="char" char="." valign="top">0.44</td><td align="char" char="." valign="top">1.00</td><td align="char" char="." valign="top">2803</td><td align="char" char="." valign="top">4710</td></tr></tbody></table><table-wrap-foot><fn id="table3fn1"><p><sup>a</sup>CrI: credible interval.  </p></fn><fn id="table3fn2"><p><sup>b</sup>Bulk-ESS: bulk effective sample size.</p></fn><fn id="table3fn3"><p><sup>c</sup>Tail-ESS: tail effective sample size.</p></fn><fn id="table3fn4"><p><sup>d</sup>PC: principal component.</p></fn></table-wrap-foot></table-wrap></sec><sec id="s3-4"><title>Bayesian Multilevel Hurdle Model for the Binary Part: Identification of the Presence of Depressive Symptoms in Older Adults</title><p>In the Bayesian multilevel hurdle model for the probability of depression, the binary part modeled the probability that an observation belonged to the structural-zero group, while the continuous part modeled the outcome magnitude among observations capable of generating nonzero values. For the binary part, we used the same 6 PCs as in the continuous part, based on the rule of 10 and the scree plot pattern. The Bayesian multilevel hurdle model results for the binary part are presented in <xref ref-type="table" rid="table3">Table 3</xref>. Regarding the logistic regression coefficients for each parameter, the first PC (<italic>&#x03B3;</italic>=&#x2212;0.79, 95% CrI &#x2013;1.12 to &#x2013;0.49) was negatively associated with the outcome. In this binary part, there was a trend of increasing zeros over time (<italic>&#x03B3;</italic>=0.11, 95% CrI 0.06&#x2010;0.17). All R-hat values for the parameters were 1.00, and bulk-ESS and tail-ESS were large enough, ranging from 2336 to 5927. The SD of the random intercepts for the binary outcome was 3.07 (95% CrI 2.31&#x2010;4.06).</p></sec><sec id="s3-5"><title>Model Diagnostics of the Bayesian Multilevel Hurdle Model</title><p>In the continuous part, although model performance decreased in the test set, the overall predictive accuracy remained acceptable, indicating reasonable generalizability. As shown in <xref ref-type="table" rid="table4">Table 4</xref>, the <italic>R</italic><sup>2</sup> was 0.650, the RMSE was 1.60, and the MAE was 0.95 for the training data. Compared to these, in the test data, the <italic>R</italic><sup>2</sup> was 0.53, the RMSE was 2.25, and the MAE was 1.22. Although the model evaluation metrics on the test data tended to be lower than those on the training data, it is promising to see that the Bayesian multilevel hurdle model explained 53% of the total variance when applied to new, unseen data from the participants. Of course, there was a 12% performance gap between the training and test data, indicating unexplained &#x201C;noise&#x201D; or secondary factors not yet captured by the current PC set, while the core drivers are identified.</p><p>As performance metrics in the binary part (<xref ref-type="table" rid="table4">Table 4</xref>), the AUC-ROC was 0.95, the accuracy was 0.87, the precision was 0.86, the recall was 0.88, the specificity was 0.87, and the <italic>F</italic><sub>1</sub>-score was 0.87 on the training data. For the test data, the AUC-ROC was 0.88, the accuracy was 0.79, the precision was 0.76, the recall was 0.75, the specificity was 0.82, and the <italic>F</italic><sub>1</sub>-score was 0.75. <xref ref-type="fig" rid="figure2">Figure 2</xref> shows the ROC curve and area under the curve for screening for susceptibility to experiencing depressive symptoms in the test dataset. The actual zeros were 534 (52.82%) of 1011 data in total. In the 8:2 split data, the actual zeros were 159 (59.11%) cases out of 269 data in the test dataset. Predicted zeros were also 161 (59.85%) out of 269 cases. Out of 161 (59.85%) cases, 30 (11.15%) cases of predicted zeros were incorrect, whereas 131 (48.70%) cases were correct. The model demonstrated strong discrimination on the training data and maintained good predictive performance on the independent test data, suggesting no evidence of severe overfitting.</p><p>As shown in <xref ref-type="fig" rid="figure3">Figure 3</xref>, the posterior predictive checks indicated that the Bayesian multilevel hurdle model adequately reproduced the observed distribution, including the mass at zero and the variability among nonzero values. <xref ref-type="fig" rid="figure4">Figure 4</xref> demonstrates the Pareto smoothed importance sampling diagnostic test results of the model. When we examined the Pareto smoothed importance sampling diagnostic test results, most observations (97.8%) showed Pareto k values below 0.7, indicating a reliable leave-one-out cross-validation estimate (expected log predictive density calculated via leave-one-out cross-validation=&#x2212;946.0; SE 35.5).</p><table-wrap id="t4" position="float"><label>Table 4.</label><caption><p>Performance metrics of the Bayesian multilevel hurdle model.</p></caption><table id="table4" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Performance metrics</td><td align="left" valign="bottom">Training set</td><td align="left" valign="bottom">Test set</td></tr></thead><tbody><tr><td align="left" valign="top" colspan="3">Continuous part</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>RMSE<sup><xref ref-type="table-fn" rid="table4fn1">a</xref></sup></td><td align="left" valign="top">1.60</td><td align="left" valign="top">2.25</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>MAE<sup><xref ref-type="table-fn" rid="table4fn2">b</xref></sup></td><td align="left" valign="top">0.95</td><td align="left" valign="top">1.22</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><italic>R</italic><sup>2<xref ref-type="table-fn" rid="table4fn3">c</xref></sup></td><td align="left" valign="top">0.65</td><td align="left" valign="top">0.53</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Calibration slope (95% CrI<sup><xref ref-type="table-fn" rid="table4fn4">d</xref></sup>)</td><td align="left" valign="top">&#x2014;<sup><xref ref-type="table-fn" rid="table4fn5">e</xref></sup></td><td align="left" valign="top">1.35 (1.06 to 1.64)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Calibration intercept (95% CrI)</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">0.32 (&#x2013;0.13 to 0.77)</td></tr><tr><td align="left" valign="top" colspan="3">Binary part</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>AUC-ROC<sup><xref ref-type="table-fn" rid="table4fn6">f</xref></sup></td><td align="left" valign="top">0.95</td><td align="left" valign="top">0.88</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Accuracy</td><td align="left" valign="top">0.87</td><td align="left" valign="top">0.79</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Sensitivity (recall)</td><td align="left" valign="top">0.88</td><td align="left" valign="top">0.75</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Specificity</td><td align="left" valign="top">0.87</td><td align="left" valign="top">0.82</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Precision (PPV<sup><xref ref-type="table-fn" rid="table4fn7">g</xref></sup>)</td><td align="left" valign="top">0.86</td><td align="left" valign="top">0.76</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><italic>F</italic><sub>1</sub>-score</td><td align="left" valign="top">0.87</td><td align="left" valign="top">0.75</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Brier score</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">0.14</td></tr></tbody></table><table-wrap-foot><fn id="table4fn1"><p><sup>a</sup>RMSE: root-mean-square error.</p></fn><fn id="table4fn2"><p><sup>b</sup>MAE: mean absolute error.</p></fn><fn id="table4fn3"><p><sup>c</sup><italic>R</italic><sup>2</sup>: coefficient of determination.</p></fn><fn id="table4fn4"><p><sup>d</sup>CrI: credible interval.</p></fn><fn id="table4fn5"><p><sup>e</sup>Not applicable.</p></fn><fn id="table4fn6"><p><sup>f</sup>AUC-ROC: area under the receiver operating characteristic curve.</p></fn><fn id="table4fn7"><p><sup>g</sup>PPV: positive predictive value.</p></fn></table-wrap-foot></table-wrap><fig position="float" id="figure2"><label>Figure 2.</label><caption><p>Receiver operating characteristic (ROC) curve for the probability of experiencing depressive symptoms in the test dataset using the Bayesian multilevel hurdle model (area under the curve [AUC]=0.88).</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="ai_v5i1e69494_fig02.png"/></fig><fig position="float" id="figure3"><label>Figure 3.</label><caption><p>Posterior predictive checks of the Bayesian multilevel hurdle model. This plot indicates how well the fitted model can reproduce the observed data. A black, thick, solid line indicates the outcome distribution from the observed data. Solid grey lines indicate simulated outcome distributions generated from replicated data based on the fitted model. Y: outcomes from the observed data; Yrep: outcomes from the replicated data.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="ai_v5i1e69494_fig03.png"/></fig><fig position="float" id="figure4"><label>Figure 4.</label><caption><p>Pareto smoothed importance sampling (PSIS) diagnostic plot. This plot shows the reliability of evaluating a Bayesian model using leave-one-out cross-validation. Light blue cross marks indicate Pareto k values for each observation. Pareto k values under 0.5 are interpreted as very reliable importance sampling, and Pareto k values under 0.7 are regarded as acceptable.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="ai_v5i1e69494_fig04.png"/></fig></sec></sec><sec id="s4" sec-type="discussion"><title>Discussion</title><sec id="s4-1"><title>Principal Findings</title><p>This study has investigated how digital phenotyping data collected from wearable devices, including smartphones and smartwatches, can help monitor depressive symptoms in older adults. The major findings of this study provide empirical evidence about the use of digital phenotyping data for older adults&#x2019; mental health, as previous conceptual framework studies have suggested [<xref ref-type="bibr" rid="ref26">26</xref>,<xref ref-type="bibr" rid="ref27">27</xref>]. This study supports promising clinical implications for reducing the proportion of undiagnosed and untreated depressive symptoms.</p><p>Specifically, our results may expand the age range for which digital phenotyping can be used to monitor depressive symptoms. Our results demonstrate that including active and passive sensing digital phenotyping data alongside traditional in-person screening tools can enhance model performance, particularly in screening for total depressive symptom scores in older adults. In this study, the Bayesian multilevel hurdle model explains approximately 53% of the variance in depressive symptom severity (<italic>R</italic><sup>2</sup>=0.53) and performs well (AUC-ROC=0.88; <italic>F</italic><sub>1</sub>-score=0.75) in screening for the probability of experiencing any depressive symptoms among community-dwelling older adults. Machine learning is expected to be a valuable tool to screen for depression using a smartphone [<xref ref-type="bibr" rid="ref28">28</xref>]. As the young generation rapidly acquires cutting-edge technology, previous research on digital phenotyping has primarily focused on college students [<xref ref-type="bibr" rid="ref29">29</xref>]. However, given that help-seeking is unlikely to happen when taboos exist related to mental health problems [<xref ref-type="bibr" rid="ref30">30</xref>] and smart devices are designed to be used intuitively, it can be helpful for older adults. Older adults are less likely to approach professional mental health services since they have spent most of their lifetime with strong taboos and stigmas about mental health than younger generations. Our findings from the Bayesian multilevel machine learning approach support the applicability of active and passive sensing digital phenotyping data to make professional mental health surveillance efforts more accessible to older adults.</p><p>This study also suggests considering the multilevel structure of the data. Recently, there has been an increase in academic attention to developing machine learning algorithms; many attempts treat multimodal data as a single dimension, focusing on the roles of passive sensing data [<xref ref-type="bibr" rid="ref31">31</xref>,<xref ref-type="bibr" rid="ref32">32</xref>]. Also, previous research reporting empirical evidence has tended to collect data over a short period [<xref ref-type="bibr" rid="ref29">29</xref>]. However, when applying digital phenotyping to monitor depressive symptoms, it would be more beneficial to use longitudinal monitoring within the target population [<xref ref-type="bibr" rid="ref33">33</xref>]. From a statistical perspective, data collected through longitudinal monitoring are nested data, with repeatedly collected data from the same individuals sharing characteristics at the person level. Thus, it violates the assumption of independence in simple linear or logistic regression. In this case, using a multilevel approach is necessary. So far, there has been little effort to apply a multilevel approach to machine learning models for continuous screening for depressive symptoms. The findings of this study show the potential applicability of multilevel modeling in developing machine learning models to screen for depressive symptoms. Interestingly, when we tested and compared the simple regression model vs the multilevel regression model results by using the same 6 PCs to explain the total score of depressive symptoms to handle our nested data, we saw that the Bayesian multilevel regression model results have a significantly higher <italic>R</italic><sup>2</sup> than the Bayesian regression model (<italic>R</italic><sup>2</sup> for test data: 0.32 in Bayesian regression &#x2192; 0.52 in Bayesian multilevel regression). It implies that thoughtful consideration of multilevel data structures would enhance model performance.</p><p>When screening for depressive symptoms in the general population, there is heterogeneity between those who have a consistently low susceptibility to depression and those who are vulnerable to depression [<xref ref-type="bibr" rid="ref12">12</xref>-<xref ref-type="bibr" rid="ref14">14</xref>]. In this study, we also observed excessive zeros in our data. We used a Bayesian multilevel hurdle model to handle this. The results of this study demonstrate that using a Bayesian multilevel hurdle model can achieve good performance. As shown in <xref ref-type="fig" rid="figure2">Figure 2</xref>, posterior predictive checks indicated good agreement between the observed and simulated data generated from the posterior predictive distribution. This shows that the model adequately captured the key distributional features of the outcomes. Also, as shown in <xref ref-type="fig" rid="figure3">Figure 3</xref>, PSIS-LOO diagnostics demonstrated that most Pareto shape parameters (k) were below 0.7 (97.8%), with only a few values exceeding 0.7. This suggests stable importance weights and reliable estimation of out-of-sample predictive accuracy. These results support the adequacy and robustness of our proposed model.</p><p>When applying digital phenotyping to real-time monitoring to screen for depressive symptoms, a large number of features will be collected via multimodal approaches. To reduce dimensionality, researchers may use feature extraction or feature selection to handle the large number of features, unless they obtain funding and resources to collect large-scale data from a huge number of people. To screen for depressive symptoms, we used PCA-based feature extraction over feature selection. Given that the primary goal of screening for depressive symptoms using digital phenotyping is to promptly identify individuals who may be experiencing depressive symptoms and to approach them for early intervention, we think PCA-based feature extraction has the advantage of flexibly identifying specific profiles within those experiencing depressive symptoms residing in that community at that moment of monitoring. The mechanisms underlying depressive symptoms are not a single one [<xref ref-type="bibr" rid="ref34">34</xref>], and thus using feature selection can introduce additional bias in explaining the targeted outcome, especially when the sample is modest in size or its representativeness is uncertain. Thus, we preferred feature extraction over feature selection, assuming it would lose less information. This study demonstrates interesting results from PCA and Bayesian modeling. For example, in the PCA results, the top 5 features for PC2 and those for PC4 appeared similar, but the rank of features and the directions of their factor loadings were shown differently in each latent PC. In other words, either in PC2 or in PC4, male and smoking had positive factor loadings. However, sleep-related features (light sleep and deep sleep) had positive factor loadings in PC2, whereas sleep-related features (light sleep, REM sleep, and deep sleep) had all negative factor loadings in PC4. In the Bayesian modeling, PC4 was significantly associated with the severity of depressive symptoms, while PC2 was not. We do not insist that the same PCA results would appear in other data. Rather, this result suggests that feature extraction using PCA may enhance more flexible and scalable community-based screening for depressive symptoms in older adults by uncovering high-risk profiles.</p><p>When extracting 6 PCs, we included all the features rather than separating time-varying features and time-invariant features. This is mainly because latent profiles for those experiencing depressive symptoms may emerge from combinations of personal characteristics and time-varying features, as we discussed in the Results section. If we separate time-varying features from time-invariant features at the PCA stage, PCs extracted from fragmented data will have less power to explain the target outcomes. In the PCA results of this study (<xref ref-type="table" rid="table2">Table 2</xref>), each PC shows a mixture of traditional survey tools and at least one active or passive digital phenotyping feature among the top 5 features for that PC. When extracting the PCs from the large number of parameters, our results showed that not only well-known in-person survey items such as social support (MSPSS), loneliness (UCLA Loneliness), and anxiety (GAD-7), but also active digital phenotyping parameters such as weekly stress, and passive sensing digital phenotyping parameters such as sleep-related features mainly contributed. By pooling time-varying states and time-invariant personal characteristics, we hope the PCA captures the overall covariance structure of features that co-occur in real-world digital phenotyping contexts. Consequently, the extracted components should be interpreted as composite trait-state dimensions reflecting joint patterns, rather than as pure latent traits or pure dynamic factors.</p><p>In this study, the Bayesian multilevel hurdle model results align with previous research findings. In either the continuous or the binary part, PC1 was significantly associated with the outcome. In extracting PC1, anxiety, loneliness, daily negative mood, and weekly stress had positive factor loadings, while social support had a negative factor loading. In the Bayesian modeling, PC1 was positively associated with the severity of depressive symptoms in the continuous part. This PC1 was negatively associated with structural zeros in the binary part. These findings align with previous research demonstrating that older adults with low psychosocial well-being are more likely to experience the occurrence of depressive symptoms and greater severity [<xref ref-type="bibr" rid="ref35">35</xref>-<xref ref-type="bibr" rid="ref37">37</xref>]. In addition, PC4 was not statistically significant for structural zeros, but it was positively associated with the severity of depressive symptoms. This means that male older adults who smoke heavily and have shorter REM, light, and deep sleep are likely to experience higher levels of depressive symptoms. It reveals a latent profile with the risk of greater depression severity in this community. This finding aligns with previous research addressing a positive association between smoking and depression, especially in older adults [<xref ref-type="bibr" rid="ref38">38</xref>]. This finding is also consistent with other research showing that greater wakefulness and reduced sleep efficiency (total time in bed minus awakened time) are associated with an increased risk of depression in male older adults [<xref ref-type="bibr" rid="ref39">39</xref>].</p><p>In the binary part, the hurdle model results show a trend of increasing zeros over time. We were concerned that participants might experience fatigue when responding to the monthly PHQ-9 survey. When we tested whether the variance of responses to each PHQ-9 item decreased, no such trend was observed. When we examined average step counts and sleep efficiency between cases in which participants reported zero and those in which they reported nonzero, the average step counts (8512 in nonzeros and 9724 in zeros) and sleep efficiency (85.9% in nonzeros and 86.1% in zeros) were higher in the zero cases. These results suggest that the increase in zeros over the month in the binary part can be interpreted as a signal of symptom improvement. This aligns with previous research on the subjective experience of long-term remote monitoring of depressive symptoms using technology [<xref ref-type="bibr" rid="ref40">40</xref>]. Through multisite, longitudinal qualitative interviews, participants reported participating in the study with an altruistic intention to help others by sharing their experiences, but they also experienced benefits, such as increased self-awareness. In our research, we also heard reports from some participants that their study engagement made them aware of their mood and more attentive to their health conditions. This implies that longitudinal monitoring using digital phenotyping itself can have clinical implications for enhancing older adults&#x2019; self-awareness and self-care in the community.</p><p>One thing to consider is that our results showed a random-intercept SD of 3.07 in the binary part, suggesting that baseline symptom propensity can inform a strong personal trait. By splitting the chronological data into 8:2 at the observational level for each participant, we allow our model to use known random intercepts for participants seen in the training data. As formalized in the multilevel logistic regression model equation [<xref ref-type="bibr" rid="ref41">41</xref>], our result indicates that approximately 74% of the variance is found at the between-person level, while there remains substantial within-person variance (approximately 26%) available for modeling. In fact, this degree of heterogeneity is common in longitudinal psychiatric research, where individuals with few symptoms contribute to wide separation in intercepts [<xref ref-type="bibr" rid="ref12">12</xref>-<xref ref-type="bibr" rid="ref16">16</xref>]. On the logit scale, this variance reflects the high degree of person-level stability in behavioral health, yet it leaves sufficient within-person variance to be modeled by using digital phenotyping features. In a recent study [<xref ref-type="bibr" rid="ref42">42</xref>], reanalyzing intraindividual consistency in secondary data by profiles of daily smartphone usage showed that within-person variance is better explained in personality research when accounting for between-person variance with longitudinal data collected from the same participants. Another previous research [<xref ref-type="bibr" rid="ref43">43</xref>] underscores the benefits of digital phenotyping for capturing unique data streams for each individual. Although it is challenging to establish population-level patterns given the heterogeneity of symptoms across the total population, digital phenotyping is a valuable tool for within-person health tracking, helping capture individual malfunctions effectively and develop tailored intervention plans [<xref ref-type="bibr" rid="ref43">43</xref>]. Taken together, digital phenotyping can be a useful tool for personalized, within-person health tracking, even after accounting for substantial between-person variance.</p><p>Additionally, this study&#x2019;s findings suggest that handling data imbalance will be a critical challenge when screening for depressive symptoms in the general population, even after accounting for active and passive digital phenotyping and a multilevel data structure. Although major depressive disorder is prevalent, the absolute number of individuals experiencing depressive symptoms would be much smaller than that of nonsymptom individuals. According to the National Center for Mental Health in South Korea [<xref ref-type="bibr" rid="ref44">44</xref>], for example, the annual prevalence of depressive disorder is 1.7%. In fact, regardless of the disease type, data imbalance has been observed and discussed in other medical studies. For example, a recent study [<xref ref-type="bibr" rid="ref45">45</xref>] developing a predictive model for a physical disease found that a massive dataset helps address data scarcity, but it still faces the challenge of data imbalance. Despite the enormous volume of data, a severely skewed distribution persists, and the minority class remains underrepresented. As recent studies have been exploring [<xref ref-type="bibr" rid="ref46">46</xref>-<xref ref-type="bibr" rid="ref48">48</xref>], future research needs to consider not only the increase in data size but also resampling and synthetic data generation.</p></sec><sec id="s4-2"><title>Limitations</title><p>This study has several limitations, which require readers to exercise caution. First, due to the high cost of smartwatches, this study targeting older Korean adults analyzed data from a modest sample. Also, we were unable to install our smartphone app on an iOS device (Apple Inc) because of technical issues. Thankfully, more than 85% of older Korean adults aged 50 to 80 use Android (Google LLC) smartphones [<xref ref-type="bibr" rid="ref49">49</xref>], so we proceeded with our research. However, future research would be better served by collecting data from mobile devices and smartwatches running both Android and iOS. In addition, given that the primary purpose of this research project was to reduce the risk of unrecognized depressive symptoms among older Korean adults, we targeted the general population. However, this led to a small proportion of clinical depression in our data. Although more research is needed to delve into interpersonal and intrapersonal differences in longitudinal patterns of depressive symptoms when applying digital phenotyping in practical settings [<xref ref-type="bibr" rid="ref50">50</xref>], this limitation hinders testing more complex dynamics between digital phenotyping data and different types of depressive disorders. Collecting more clinical cases would enable comparison of the relationship with digital phenotyping across mood disorder types. This approach could help develop more personalized mental health surveillance in digital phenotyping research. Finally, in this study, the calibration slope for the continuous part in the Bayesian multilevel hurdle model was 1.35, suggesting that it tends to underestimate severity at lower predicted values, although the model effectively captures relative differences in symptom severity. In the context of digital phenotyping applications, such miscalibration may lead to inflated risk stratification and premature escalation of clinical interventions if raw predicted scores are used directly. While the model appears suitable for ranking individuals by relative symptom burden and supporting population-level screening, additional screening is necessary before applying predicted PHQ-9 scores to guide individualized clinical decisions. These results underscore the importance of explicitly evaluating and correcting calibration when deploying machine learning&#x2013;based severity prediction models in real-world monitoring settings.</p></sec><sec id="s4-3"><title>Recommendations</title><p>Despite the limitations of this study, these findings can contribute to future research on mental health and digital phenotyping in related academic fields by providing empirical evidence from Bayesian multilevel machine learning models applied to older adults. Recently, there has been a rapid increase in protocol studies and review studies in digital phenotyping. It is recommended to gather additional empirical evidence to address challenges, replicate the findings, and explore more effective strategies to enhance the implementation of digital phenotyping for better screening of geriatric depression. Digital phenotyping, including active and passive data alongside traditional in-person screening tools, can help monitor depressive symptoms in older adults. Further investigation into the development and validation of effective digital biomarkers is also recommended to detect depression signals early in the general population.</p></sec><sec id="s4-4"><title>Conclusion</title><p>In this study, we investigated how digital phenotyping, including active and passive sensing data in addition to traditional in-person surveys, can help monitor depressive symptoms among older adults. To account for time-varying and time-invariant features, we analyzed the data using Bayesian multilevel modeling. Specifically, we used a Bayesian multilevel hurdle model to account for the data distribution reflecting heterogeneity in older adults&#x2019; experiences of depressive symptoms. Dimensional reduction using parallel analysis and PCA, covering all parameters collected from in-person, active, and passive data, can be helpful to reveal latent profiles with a high risk of depressive symptoms. A Bayesian multilevel hurdle model yields acceptable performance for depressive symptom severity and depressive symptom susceptibility for new data from participants. At least one active and one passive digital phenotyping feature were among the top 5 features for the major PCs. These results support the idea that digital phenotyping data help enable real-time monitoring to screen for depressive symptoms in the general population. Future research on effectively handling data imbalance would be beneficial for advancing academic research on digital phenotyping, particularly for monitoring depressive symptoms in community-dwelling older adults.</p></sec></sec></body><back><ack><p>We appreciate all the participants of this research for their precious time and the open hearts they willingly shared with us. We are also thankful to have many research assistants who diligently served throughout the data collection using multimodal methods for a long time, without any intention to draw attention to themselves. Administrative help from the Institute for Poverty Alleviation and International Development at Yonsei University and the Industry-Academic Cooperation Foundation at Yonsei University Mirae Campus is greatly appreciated as well.</p><p>In terms of generative artificial intelligence (GAI) use, no research output was produced by GAI tools. In this research, the use of GAI tools was limited to tasks such as troubleshooting R code and proofreading. Even when using GAIs for these purposes, authors used multiple tools, such as ChatGPT, Gemini, and Claude, to compare their responses, and the authors chose the best one after human review of possible solutions.</p></ack><notes><sec><title>Funding</title><p>This work was supported by the Ministry of Education of the Republic of Korea and the National Research Foundation of Korea (grant NRF-2020S1A5A2A03045088).</p></sec><sec><title>Data Availability</title><p>The datasets analyzed during this study are not publicly available due to the sensitive nature of mental health data and the need to protect participant anonymity but are available from the corresponding author on reasonable request.</p></sec></notes><fn-group><fn fn-type="con"><p>Conceptualization was performed by MKC, HSL, SYL, JL, KJL, TS, MHK, SH, EU, JYP, and JKL. Data curation was conducted by HSB and JKL. Formal analysis was performed by JKL. Funding acquisition was secured by MKC. An investigation was carried out by HSB, DHK, and JKL. Methodology was developed by JKL, HSL, and SYL. Project administration was managed by MKC and JKL. Supervision was provided by HSL and SYL. The original draft was written by JKL. Review and editing of the manuscript were performed by JKL.</p></fn><fn fn-type="conflict"><p>None declared.</p></fn></fn-group><glossary><title>Abbreviations</title><def-list><def-item><term id="abb1">AUC-ROC</term><def><p>area under the receiver operating characteristic curve</p></def></def-item><def-item><term id="abb2">CrI</term><def><p>credible interval</p></def></def-item><def-item><term id="abb3">ESS</term><def><p>effective sample size</p></def></def-item><def-item><term id="abb4">ETI-SF</term><def><p>27-item Early Trauma Inventory&#x2013;Short Form</p></def></def-item><def-item><term id="abb5">GAD-7</term><def><p>7-item Generalized Anxiety Disorder</p></def></def-item><def-item><term id="abb6">MAE</term><def><p>mean absolute error</p></def></def-item><def-item><term id="abb7">MICE</term><def><p>Multiple Imputation by Chained Equations</p></def></def-item><def-item><term id="abb8">MINI</term><def><p>Mini-International Neuropsychiatric Interview</p></def></def-item><def-item><term id="abb9">MSPSS</term><def><p>Multidimensional Scale of Perceived Social Support</p></def></def-item><def-item><term id="abb10">PC</term><def><p>principal component</p></def></def-item><def-item><term id="abb11">PCA</term><def><p>principal component analysis</p></def></def-item><def-item><term id="abb12">PHQ-9</term><def><p>9-item Patient Health Questionnaire</p></def></def-item><def-item><term id="abb13">PSIS-LOO</term><def><p>Pareto smoothed importance sampling leave-one-out</p></def></def-item><def-item><term id="abb14">REM</term><def><p>rapid eye movement</p></def></def-item><def-item><term id="abb15">RMSE</term><def><p>root-mean-square error</p></def></def-item><def-item><term id="abb16">UCLA Loneliness</term><def><p>University of California, Los Angeles Loneliness Scale</p></def></def-item></def-list></glossary><ref-list><title>References</title><ref id="ref1"><label>1</label><nlm-citation citation-type="web"><article-title>Depressive disorder (depression)</article-title><source>World Health Organization</source><access-date>2026-03-07</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.who.int/news-room/fact-sheets/detail/depression">https://www.who.int/news-room/fact-sheets/detail/depression</ext-link></comment></nlm-citation></ref><ref id="ref2"><label>2</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Williams</surname><given-names>SZ</given-names> </name><name name-style="western"><surname>Chung</surname><given-names>GS</given-names> </name><name name-style="western"><surname>Muennig</surname><given-names>PA</given-names> </name></person-group><article-title>Undiagnosed depression: a community diagnosis</article-title><source>SSM Popul Health</source><year>2017</year><month>12</month><volume>3</volume><fpage>633</fpage><lpage>638</lpage><pub-id pub-id-type="doi">10.1016/j.ssmph.2017.07.012</pub-id><pub-id pub-id-type="medline">29349251</pub-id></nlm-citation></ref><ref id="ref3"><label>3</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Faisal-Cury</surname><given-names>A</given-names> </name><name name-style="western"><surname>Ziebold</surname><given-names>C</given-names> </name><name name-style="western"><surname>Rodrigues</surname><given-names>DMDO</given-names> </name><name name-style="western"><surname>Matijasevich</surname><given-names>A</given-names> </name></person-group><article-title>Depression underdiagnosis: prevalence and associated factors. A population-based study</article-title><source>J Psychiatr Res</source><year>2022</year><month>07</month><volume>151</volume><fpage>157</fpage><lpage>165</lpage><pub-id pub-id-type="doi">10.1016/j.jpsychires.2022.04.025</pub-id><pub-id pub-id-type="medline">35486997</pub-id></nlm-citation></ref><ref id="ref4"><label>4</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Tampubolon</surname><given-names>G</given-names> </name><name name-style="western"><surname>Maharani</surname><given-names>A</given-names> </name></person-group><article-title>When did old age stop being depressing? Depression trajectories of older Americans and Britons 2002-2012</article-title><source>Am J Geriatr Psychiatry</source><year>2017</year><month>11</month><volume>25</volume><issue>11</issue><fpage>1187</fpage><lpage>1195</lpage><pub-id pub-id-type="doi">10.1016/j.jagp.2017.06.006</pub-id><pub-id pub-id-type="medline">28734770</pub-id></nlm-citation></ref><ref id="ref5"><label>5</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lavingia</surname><given-names>R</given-names> </name><name name-style="western"><surname>Jones</surname><given-names>K</given-names> </name><name name-style="western"><surname>Asghar-Ali</surname><given-names>AA</given-names> </name></person-group><article-title>A systematic review of barriers faced by older adults in seeking and accessing mental health care</article-title><source>J Psychiatr Pract</source><year>2020</year><month>09</month><volume>26</volume><issue>5</issue><fpage>367</fpage><lpage>382</lpage><pub-id pub-id-type="doi">10.1097/PRA.0000000000000491</pub-id><pub-id pub-id-type="medline">32936584</pub-id></nlm-citation></ref><ref id="ref6"><label>6</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Park</surname><given-names>JE</given-names> </name><name name-style="western"><surname>Cho</surname><given-names>SJ</given-names> </name><name name-style="western"><surname>Lee</surname><given-names>JY</given-names> </name><etal/></person-group><article-title>Impact of stigma on use of mental health services by elderly Koreans</article-title><source>Soc Psychiatry Psychiatr Epidemiol</source><year>2015</year><month>05</month><volume>50</volume><issue>5</issue><fpage>757</fpage><lpage>766</lpage><pub-id pub-id-type="doi">10.1007/s00127-014-0991-0</pub-id><pub-id pub-id-type="medline">25491446</pub-id></nlm-citation></ref><ref id="ref7"><label>7</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Devita</surname><given-names>M</given-names> </name><name name-style="western"><surname>De Salvo</surname><given-names>R</given-names> </name><name name-style="western"><surname>Ravelli</surname><given-names>A</given-names> </name><etal/></person-group><article-title>Recognizing depression in the elderly: practical guidance and challenges for clinical management</article-title><source>Neuropsychiatr Dis Treat</source><year>2022</year><volume>18</volume><fpage>2867</fpage><lpage>2880</lpage><pub-id pub-id-type="doi">10.2147/NDT.S347356</pub-id><pub-id pub-id-type="medline">36514493</pub-id></nlm-citation></ref><ref id="ref8"><label>8</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Torous</surname><given-names>J</given-names> </name><name name-style="western"><surname>Kiang</surname><given-names>MV</given-names> </name><name name-style="western"><surname>Lorme</surname><given-names>J</given-names> </name><name name-style="western"><surname>Onnela</surname><given-names>JP</given-names> </name></person-group><article-title>New tools for new research in psychiatry: a scalable and customizable platform to empower data driven smartphone research</article-title><source>JMIR Ment Health</source><year>2016</year><month>05</month><day>5</day><volume>3</volume><issue>2</issue><fpage>e16</fpage><pub-id pub-id-type="doi">10.2196/mental.5165</pub-id><pub-id pub-id-type="medline">27150677</pub-id></nlm-citation></ref><ref id="ref9"><label>9</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Maatoug</surname><given-names>R</given-names> </name><name name-style="western"><surname>Oudin</surname><given-names>A</given-names> </name><name name-style="western"><surname>Adrien</surname><given-names>V</given-names> </name><etal/></person-group><article-title>Digital phenotype of mood disorders: a conceptual and critical review</article-title><source>Front Psychiatry</source><year>2022</year><volume>13</volume><fpage>895860</fpage><pub-id pub-id-type="doi">10.3389/fpsyt.2022.895860</pub-id><pub-id pub-id-type="medline">35958638</pub-id></nlm-citation></ref><ref id="ref10"><label>10</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Cormack</surname><given-names>F</given-names> </name><name name-style="western"><surname>McCue</surname><given-names>M</given-names> </name><name name-style="western"><surname>Skirrow</surname><given-names>C</given-names> </name><etal/></person-group><article-title>Characterizing longitudinal patterns in cognition, mood, and activity in depression with 6-week high-frequency wearable assessment: observational study</article-title><source>JMIR Ment Health</source><year>2024</year><month>05</month><day>31</day><volume>11</volume><fpage>e46895</fpage><pub-id pub-id-type="doi">10.2196/46895</pub-id><pub-id pub-id-type="medline">38819909</pub-id></nlm-citation></ref><ref id="ref11"><label>11</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Moura</surname><given-names>I</given-names> </name><name name-style="western"><surname>Teles</surname><given-names>A</given-names> </name><name name-style="western"><surname>Viana</surname><given-names>D</given-names> </name><name name-style="western"><surname>Marques</surname><given-names>J</given-names> </name><name name-style="western"><surname>Coutinho</surname><given-names>L</given-names> </name><name name-style="western"><surname>Silva</surname><given-names>F</given-names> </name></person-group><article-title>Digital phenotyping of mental health using multimodal sensing of multiple situations of interest: a systematic literature review</article-title><source>J Biomed Inform</source><year>2023</year><month>02</month><volume>138</volume><fpage>104278</fpage><pub-id pub-id-type="doi">10.1016/j.jbi.2022.104278</pub-id><pub-id pub-id-type="medline">36586498</pub-id></nlm-citation></ref><ref id="ref12"><label>12</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lim</surname><given-names>HJ</given-names> </name><name name-style="western"><surname>Cheng</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Kabir</surname><given-names>R</given-names> </name><name name-style="western"><surname>Thorpe</surname><given-names>L</given-names> </name></person-group><article-title>Trajectories of depression and their predictors in a population-based study of Korean older adults</article-title><source>Int J Aging Hum Dev</source><year>2021</year><month>10</month><volume>93</volume><issue>3</issue><fpage>834</fpage><lpage>853</lpage><pub-id pub-id-type="doi">10.1177/0091415020944405</pub-id><pub-id pub-id-type="medline">32830531</pub-id></nlm-citation></ref><ref id="ref13"><label>13</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Agustini</surname><given-names>B</given-names> </name><name name-style="western"><surname>Lotfaliany</surname><given-names>M</given-names> </name><name name-style="western"><surname>Mohebbi</surname><given-names>M</given-names> </name><etal/></person-group><article-title>Trajectories of depressive symptoms in older adults and associated health outcomes</article-title><source>Nat Aging</source><year>2022</year><month>04</month><volume>2</volume><issue>4</issue><fpage>295</fpage><lpage>302</lpage><pub-id pub-id-type="doi">10.1038/s43587-022-00203-1</pub-id><pub-id pub-id-type="medline">37117752</pub-id></nlm-citation></ref><ref id="ref14"><label>14</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kerpershoek</surname><given-names>ML</given-names> </name><name name-style="western"><surname>Giltay</surname><given-names>EJ</given-names> </name><name name-style="western"><surname>Kok</surname><given-names>AAL</given-names> </name><etal/></person-group><article-title>Six-year trajectories of core depressive symptoms and insomnia symptoms in depressed older adults: a NESDO study</article-title><source>Aging Ment Health</source><year>2025</year><month>08</month><volume>29</volume><issue>8</issue><fpage>1468</fpage><lpage>1476</lpage><pub-id pub-id-type="doi">10.1080/13607863.2025.2496730</pub-id><pub-id pub-id-type="medline">40319495</pub-id></nlm-citation></ref><ref id="ref15"><label>15</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Burcusa</surname><given-names>SL</given-names> </name><name name-style="western"><surname>Iacono</surname><given-names>WG</given-names> </name></person-group><article-title>Risk for recurrence in depression</article-title><source>Clin Psychol Rev</source><year>2007</year><month>12</month><volume>27</volume><issue>8</issue><fpage>959</fpage><lpage>985</lpage><pub-id pub-id-type="doi">10.1016/j.cpr.2007.02.005</pub-id><pub-id pub-id-type="medline">17448579</pub-id></nlm-citation></ref><ref id="ref16"><label>16</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lee</surname><given-names>YY</given-names> </name><name name-style="western"><surname>Stockings</surname><given-names>EA</given-names> </name><name name-style="western"><surname>Harris</surname><given-names>MG</given-names> </name><etal/></person-group><article-title>The risk of developing major depression among individuals with subthreshold depression: a systematic review and meta-analysis of longitudinal cohort studies</article-title><source>Psychol Med</source><year>2019</year><month>01</month><volume>49</volume><issue>1</issue><fpage>92</fpage><lpage>102</lpage><pub-id pub-id-type="doi">10.1017/S0033291718000557</pub-id><pub-id pub-id-type="medline">29530112</pub-id></nlm-citation></ref><ref id="ref17"><label>17</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Molas</surname><given-names>M</given-names> </name><name name-style="western"><surname>Lesaffre</surname><given-names>E</given-names> </name></person-group><article-title>Hurdle models for multilevel zero-inflated data via h-likelihood</article-title><source>Stat Med</source><year>2010</year><month>12</month><day>30</day><volume>29</volume><issue>30</issue><fpage>3294</fpage><lpage>3310</lpage><pub-id pub-id-type="doi">10.1002/sim.3852</pub-id><pub-id pub-id-type="medline">21170922</pub-id></nlm-citation></ref><ref id="ref18"><label>18</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Ganjali</surname><given-names>M</given-names> </name><name name-style="western"><surname>Baghfalaki</surname><given-names>T</given-names> </name><name name-style="western"><surname>Balakrishnan</surname><given-names>N</given-names> </name></person-group><article-title>Joint modeling of zero-inflated longitudinal measurements and time-to-event outcomes with applications to dynamic prediction</article-title><source>Stat Methods Med Res</source><year>2024</year><month>10</month><volume>33</volume><issue>10</issue><fpage>1731</fpage><lpage>1767</lpage><pub-id pub-id-type="doi">10.1177/09622802241268466</pub-id><pub-id pub-id-type="medline">39373068</pub-id></nlm-citation></ref><ref id="ref19"><label>19</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lee</surname><given-names>JK</given-names> </name><name name-style="western"><surname>Kim</surname><given-names>MH</given-names> </name><name name-style="western"><surname>Hwang</surname><given-names>S</given-names> </name><etal/></person-group><article-title>Developing prediction algorithms for late-life depression using wearable devices: a cohort study protocol</article-title><source>BMJ Open</source><year>2024</year><month>06</month><day>13</day><volume>14</volume><issue>6</issue><fpage>e073290</fpage><pub-id pub-id-type="doi">10.1136/bmjopen-2023-073290</pub-id><pub-id pub-id-type="medline">38871664</pub-id></nlm-citation></ref><ref id="ref20"><label>20</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>L&#x00F6;we</surname><given-names>B</given-names> </name><name name-style="western"><surname>Kroenke</surname><given-names>K</given-names> </name><name name-style="western"><surname>Herzog</surname><given-names>W</given-names> </name><name name-style="western"><surname>Gr&#x00E4;fe</surname><given-names>K</given-names> </name></person-group><article-title>Measuring depression outcome with a brief self-report instrument: sensitivity to change of the Patient Health Questionnaire (PHQ-9)</article-title><source>J Affect Disord</source><year>2004</year><month>07</month><volume>81</volume><issue>1</issue><fpage>61</fpage><lpage>66</lpage><pub-id pub-id-type="doi">10.1016/S0165-0327(03)00198-8</pub-id></nlm-citation></ref><ref id="ref21"><label>21</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Sheehan</surname><given-names>DV</given-names> </name><name name-style="western"><surname>Lecrubier</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Sheehan</surname><given-names>KH</given-names> </name><etal/></person-group><article-title>The MINI-International Neuropsychiatric Interview (M.I.N.I.): the development and validation of a structured diagnostic psychiatric interview for DSM-IV and ICD-10</article-title><source>J Clin Psychiatry</source><year>1998</year><volume>59 Suppl 20</volume><issue>S20</issue><fpage>22</fpage><lpage>33</lpage><pub-id pub-id-type="medline">9881538</pub-id></nlm-citation></ref><ref id="ref22"><label>22</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Spitzer</surname><given-names>RL</given-names> </name><name name-style="western"><surname>Kroenke</surname><given-names>K</given-names> </name><name name-style="western"><surname>Williams</surname><given-names>JBW</given-names> </name><name name-style="western"><surname>L&#x00F6;we</surname><given-names>B</given-names> </name></person-group><article-title>A brief measure for assessing generalized anxiety disorder: the GAD-7</article-title><source>Arch Intern Med</source><year>2006</year><month>05</month><day>22</day><volume>166</volume><issue>10</issue><fpage>1092</fpage><lpage>1097</lpage><pub-id pub-id-type="doi">10.1001/archinte.166.10.1092</pub-id><pub-id pub-id-type="medline">16717171</pub-id></nlm-citation></ref><ref id="ref23"><label>23</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Russell</surname><given-names>D</given-names> </name><name name-style="western"><surname>Peplau</surname><given-names>LA</given-names> </name><name name-style="western"><surname>Ferguson</surname><given-names>ML</given-names> </name></person-group><article-title>Developing a measure of loneliness</article-title><source>J Pers Assess</source><year>1978</year><month>06</month><volume>42</volume><issue>3</issue><fpage>290</fpage><lpage>294</lpage><pub-id pub-id-type="doi">10.1207/s15327752jpa4203_11</pub-id><pub-id pub-id-type="medline">660402</pub-id></nlm-citation></ref><ref id="ref24"><label>24</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Wilcox</surname><given-names>S</given-names> </name></person-group><article-title>Multidimensional scale of perceived social support</article-title><source>Psychol Trauma</source><year>2010</year><volume>2</volume><issue>3</issue><fpage>175</fpage><lpage>182</lpage></nlm-citation></ref><ref id="ref25"><label>25</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Bremner</surname><given-names>JD</given-names> </name><name name-style="western"><surname>Bolus</surname><given-names>R</given-names> </name><name name-style="western"><surname>Mayer</surname><given-names>EA</given-names> </name></person-group><article-title>Psychometric properties of the Early Trauma Inventory-Self Report</article-title><source>J Nerv Ment Dis</source><year>2007</year><month>03</month><volume>195</volume><issue>3</issue><fpage>211</fpage><lpage>218</lpage><pub-id pub-id-type="doi">10.1097/01.nmd.0000243824.84651.6c</pub-id><pub-id pub-id-type="medline">17468680</pub-id></nlm-citation></ref><ref id="ref26"><label>26</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Insel</surname><given-names>TR</given-names> </name></person-group><article-title>Digital phenotyping: a global tool for psychiatry</article-title><source>World Psychiatry</source><year>2018</year><month>10</month><volume>17</volume><issue>3</issue><fpage>276</fpage><lpage>277</lpage><pub-id pub-id-type="doi">10.1002/wps.20550</pub-id><pub-id pub-id-type="medline">30192103</pub-id></nlm-citation></ref><ref id="ref27"><label>27</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Williamson</surname><given-names>S</given-names> </name></person-group><article-title>Digital phenotyping in psychiatry</article-title><source>BJPsych advances</source><year>2023</year><month>11</month><volume>29</volume><issue>6</issue><fpage>428</fpage><lpage>429</lpage><pub-id pub-id-type="doi">10.1192/bja.2023.26</pub-id></nlm-citation></ref><ref id="ref28"><label>28</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Hong</surname><given-names>J</given-names> </name><name name-style="western"><surname>Kim</surname><given-names>J</given-names> </name><name name-style="western"><surname>Kim</surname><given-names>S</given-names> </name><etal/></person-group><person-group person-group-type="editor"><name name-style="western"><surname>Kim</surname><given-names>S</given-names> </name><name name-style="western"><surname>Kim</surname><given-names>J</given-names> </name><name name-style="western"><surname>Kim</surname><given-names>S</given-names> </name></person-group><article-title>Depressive symptoms feature-based machine learning approach to predicting depression using smartphone</article-title><source>Healthcare (Basel)</source><year>2022</year><month>06</month><day>24</day><volume>10</volume><issue>7</issue><fpage>1189</fpage><pub-id pub-id-type="doi">10.3390/healthcare10071189</pub-id><pub-id pub-id-type="medline">35885716</pub-id></nlm-citation></ref><ref id="ref29"><label>29</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>De Angel</surname><given-names>V</given-names> </name><name name-style="western"><surname>Lewis</surname><given-names>S</given-names> </name><name name-style="western"><surname>White</surname><given-names>K</given-names> </name><etal/></person-group><article-title>Digital health tools for the passive monitoring of depression: a systematic review of methods</article-title><source>NPJ Digit Med</source><year>2022</year><volume>5</volume><issue>1</issue><fpage>3</fpage><pub-id pub-id-type="doi">10.1038/s41746-021-00548-8</pub-id></nlm-citation></ref><ref id="ref30"><label>30</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Clement</surname><given-names>S</given-names> </name><name name-style="western"><surname>Schauman</surname><given-names>O</given-names> </name><name name-style="western"><surname>Graham</surname><given-names>T</given-names> </name><etal/></person-group><article-title>What is the impact of mental health-related stigma on help-seeking? A systematic review of quantitative and qualitative studies</article-title><source>Psychol Med</source><year>2015</year><month>01</month><volume>45</volume><issue>1</issue><fpage>11</fpage><lpage>27</lpage><pub-id pub-id-type="doi">10.1017/S0033291714000129</pub-id></nlm-citation></ref><ref id="ref31"><label>31</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Rahman</surname><given-names>RA</given-names> </name><name name-style="western"><surname>Omar</surname><given-names>K</given-names> </name><name name-style="western"><surname>Danuri</surname><given-names>MSNM</given-names> </name><name name-style="western"><surname>Al-Garadi</surname><given-names>MA</given-names> </name><name name-style="western"><surname>Noah</surname><given-names>SAM</given-names> </name></person-group><article-title>Application of machine learning methods in mental health detection: a systematic review</article-title><source>IEEE Access</source><year>2020</year><volume>8</volume><fpage>183952</fpage><lpage>183964</lpage><pub-id pub-id-type="doi">10.1109/ACCESS.2020.3029154</pub-id></nlm-citation></ref><ref id="ref32"><label>32</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Sameh</surname><given-names>A</given-names> </name><name name-style="western"><surname>Rostami</surname><given-names>M</given-names> </name><name name-style="western"><surname>Oussalah</surname><given-names>M</given-names> </name><name name-style="western"><surname>Korpelainen</surname><given-names>R</given-names> </name><name name-style="western"><surname>Farrahi</surname><given-names>V</given-names> </name></person-group><article-title>Digital phenotypes and digital biomarkers for health and diseases: a systematic review of machine learning approaches utilizing passive non-invasive signals collected via wearable devices and smartphones</article-title><source>Artif Intell Rev</source><year>2025</year><volume>58</volume><issue>2</issue><fpage>66</fpage><pub-id pub-id-type="doi">10.1007/s10462-024-11009-5</pub-id></nlm-citation></ref><ref id="ref33"><label>33</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Cail</surname><given-names>V</given-names> </name><name name-style="western"><surname>Beenackers</surname><given-names>MA</given-names> </name><name name-style="western"><surname>Van Lenthe</surname><given-names>FJ</given-names> </name><etal/></person-group><article-title>Social network characteristics and levels of fluctuations in momentary depressive symptomatology among older adults</article-title><source>J Epidemiol Community Health</source><year>2025</year><month>10</month><day>9</day><volume>79</volume><issue>11</issue><fpage>828</fpage><lpage>834</lpage><pub-id pub-id-type="doi">10.1136/jech-2024-222959</pub-id><pub-id pub-id-type="medline">40813055</pub-id></nlm-citation></ref><ref id="ref34"><label>34</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Musliner</surname><given-names>KL</given-names> </name><name name-style="western"><surname>Munk-Olsen</surname><given-names>T</given-names> </name><name name-style="western"><surname>Eaton</surname><given-names>WW</given-names> </name><name name-style="western"><surname>Zandi</surname><given-names>PP</given-names> </name></person-group><article-title>Heterogeneity in long-term trajectories of depressive symptoms: patterns, predictors and outcomes</article-title><source>J Affect Disord</source><year>2016</year><month>03</month><day>1</day><volume>192</volume><fpage>199</fpage><lpage>211</lpage><pub-id pub-id-type="doi">10.1016/j.jad.2015.12.030</pub-id><pub-id pub-id-type="medline">26745437</pub-id></nlm-citation></ref><ref id="ref35"><label>35</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Crist&#x00F3;bal-Narv&#x00E1;ez</surname><given-names>P</given-names> </name><name name-style="western"><surname>Haro</surname><given-names>JM</given-names> </name><name name-style="western"><surname>Koyanagi</surname><given-names>A</given-names> </name></person-group><article-title>Longitudinal association between perceived stress and depression among community-dwelling older adults: findings from the Irish Longitudinal Study on Ageing</article-title><source>J Affect Disord</source><year>2022</year><month>02</month><day>15</day><volume>299</volume><fpage>457</fpage><lpage>462</lpage><pub-id pub-id-type="doi">10.1016/j.jad.2021.12.041</pub-id><pub-id pub-id-type="medline">34942218</pub-id></nlm-citation></ref><ref id="ref36"><label>36</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lee</surname><given-names>JK</given-names> </name><name name-style="western"><surname>Lee</surname><given-names>J</given-names> </name><name name-style="western"><surname>Hwang</surname><given-names>S</given-names> </name><etal/></person-group><article-title>Longitudinal examination of stress and depression in older adults over a 2&#x2010;year period: moderation effect of varied social support measures</article-title><source>Depress Anxiety</source><year>2024</year><volume>2024</volume><issue>1</issue><fpage>6462853</fpage><pub-id pub-id-type="doi">10.1155/2024/6462853</pub-id><pub-id pub-id-type="medline">40226743</pub-id></nlm-citation></ref><ref id="ref37"><label>37</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Olaya</surname><given-names>B</given-names> </name><name name-style="western"><surname>de Miquel</surname><given-names>C</given-names> </name><name name-style="western"><surname>Francia</surname><given-names>L</given-names> </name><etal/></person-group><article-title>Understanding the incidence and recurrence of depression and associated risk factors in 9 years of follow-up: results from a population-based sample</article-title><source>Psychiatry Res</source><year>2025</year><month>03</month><volume>345</volume><fpage>116375</fpage><pub-id pub-id-type="doi">10.1016/j.psychres.2025.116375</pub-id><pub-id pub-id-type="medline">39893856</pub-id></nlm-citation></ref><ref id="ref38"><label>38</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kim</surname><given-names>GE</given-names> </name><name name-style="western"><surname>Kim</surname><given-names>MH</given-names> </name><name name-style="western"><surname>Lim</surname><given-names>WJ</given-names> </name><name name-style="western"><surname>Kim</surname><given-names>SI</given-names> </name></person-group><article-title>The effects of smoking habit change on the risk of depression-analysis of data from the Korean National Health Insurance Service</article-title><source>J Affect Disord</source><year>2022</year><month>04</month><day>1</day><volume>302</volume><fpage>293</fpage><lpage>301</lpage><pub-id pub-id-type="doi">10.1016/j.jad.2022.01.095</pub-id><pub-id pub-id-type="medline">35085672</pub-id></nlm-citation></ref><ref id="ref39"><label>39</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Paudel</surname><given-names>M</given-names> </name><name name-style="western"><surname>Taylor</surname><given-names>BC</given-names> </name><name name-style="western"><surname>Ancoli-Israel</surname><given-names>S</given-names> </name><etal/></person-group><article-title>Sleep disturbances and risk of depression in older men</article-title><source>Sleep</source><year>2013</year><month>07</month><day>1</day><volume>36</volume><issue>7</issue><fpage>1033</fpage><lpage>1040</lpage><pub-id pub-id-type="doi">10.5665/sleep.2804</pub-id><pub-id pub-id-type="medline">23814340</pub-id></nlm-citation></ref><ref id="ref40"><label>40</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>White</surname><given-names>KM</given-names> </name><name name-style="western"><surname>Dawe-Lane</surname><given-names>E</given-names> </name><name name-style="western"><surname>Siddi</surname><given-names>S</given-names> </name><etal/></person-group><article-title>Understanding the subjective experience of long-term remote measurement technology use for symptom tracking in people with depression: multisite longitudinal qualitative analysis</article-title><source>JMIR Hum Factors</source><year>2023</year><month>01</month><day>26</day><volume>10</volume><fpage>e39479</fpage><pub-id pub-id-type="doi">10.2196/39479</pub-id><pub-id pub-id-type="medline">36701179</pub-id></nlm-citation></ref><ref id="ref41"><label>41</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Austin</surname><given-names>PC</given-names> </name><name name-style="western"><surname>Merlo</surname><given-names>J</given-names> </name></person-group><article-title>Intermediate and advanced topics in multilevel logistic regression analysis</article-title><source>Stat Med</source><year>2017</year><month>09</month><day>10</day><volume>36</volume><issue>20</issue><fpage>3257</fpage><lpage>3277</lpage><pub-id pub-id-type="doi">10.1002/sim.7336</pub-id><pub-id pub-id-type="medline">28543517</pub-id></nlm-citation></ref><ref id="ref42"><label>42</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Shaw</surname><given-names>H</given-names> </name><name name-style="western"><surname>Taylor</surname><given-names>PJ</given-names> </name><name name-style="western"><surname>Ellis</surname><given-names>DA</given-names> </name><name name-style="western"><surname>Conchie</surname><given-names>SM</given-names> </name></person-group><article-title>Behavioral consistency in the digital age</article-title><source>Psychol Sci</source><year>2022</year><month>03</month><volume>33</volume><issue>3</issue><fpage>364</fpage><lpage>370</lpage><pub-id pub-id-type="doi">10.1177/09567976211040491</pub-id><pub-id pub-id-type="medline">35174745</pub-id></nlm-citation></ref><ref id="ref43"><label>43</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Wisniewski</surname><given-names>H</given-names> </name><name name-style="western"><surname>Henson</surname><given-names>P</given-names> </name><name name-style="western"><surname>Torous</surname><given-names>J</given-names> </name></person-group><article-title>Using a smartphone app to identify clinically relevant behavior trends via symptom report, cognition scores, and exercise levels: a case series</article-title><source>Front Psychiatry</source><year>2019</year><volume>10</volume><fpage>652</fpage><pub-id pub-id-type="doi">10.3389/fpsyt.2019.00652</pub-id><pub-id pub-id-type="medline">31607960</pub-id></nlm-citation></ref><ref id="ref44"><label>44</label><nlm-citation citation-type="report"><article-title>National Mental Health Survey 2021</article-title><year>2022</year><access-date>2026-04-29</access-date><publisher-name>National Center for Mental Health</publisher-name><comment><ext-link ext-link-type="uri" xlink:href="https://mhs.ncmh.go.kr/board.es?mid=a10301000000&#x0026;amp;bid=0005&#x0026;amp;nPage=1&#x0026;amp;b_list_cnt=9&#x0026;amp;ord=&#x0026;amp;dept_cd=&#x0026;amp;tag=&#x0026;amp;list_no=16&#x0026;amp;listNo=&#x0026;amp;act=view&#x0026;amp;view_sdate_param=&#x0026;amp;keyField=&#x0026;amp;keyWord=">https://mhs.ncmh.go.kr/board.es?mid=a10301000000&#x0026;amp;bid=0005&#x0026;amp;nPage=1&#x0026;amp;b_list_cnt=9&#x0026;amp;ord=&#x0026;amp;dept_cd=&#x0026;amp;tag=&#x0026;amp;list_no=16&#x0026;amp;listNo=&#x0026;amp;act=view&#x0026;amp;view_sdate_param=&#x0026;amp;keyField=&#x0026;amp;keyWord=</ext-link></comment></nlm-citation></ref><ref id="ref45"><label>45</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Abousaber</surname><given-names>I</given-names> </name><name name-style="western"><surname>Abdallah</surname><given-names>HF</given-names> </name><name name-style="western"><surname>El-Ghaish</surname><given-names>H</given-names> </name></person-group><article-title>Robust predictive framework for diabetes classification using optimized machine learning on imbalanced datasets</article-title><source>Front Artif Intell</source><year>2024</year><volume>7</volume><fpage>1499530</fpage><pub-id pub-id-type="doi">10.3389/frai.2024.1499530</pub-id><pub-id pub-id-type="medline">39839971</pub-id></nlm-citation></ref><ref id="ref46"><label>46</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Abdelhay</surname><given-names>O</given-names> </name><name name-style="western"><surname>Shatnawi</surname><given-names>A</given-names> </name><name name-style="western"><surname>Najadat</surname><given-names>H</given-names> </name><name name-style="western"><surname>Altamimi</surname><given-names>T</given-names> </name></person-group><article-title>Resampling methods for class imbalance in clinical prediction models: a scoping review protocol</article-title><source>PLoS ONE</source><year>2025</year><volume>20</volume><issue>11</issue><fpage>e0330050</fpage><pub-id pub-id-type="doi">10.1371/journal.pone.0330050</pub-id><pub-id pub-id-type="medline">41183062</pub-id></nlm-citation></ref><ref id="ref47"><label>47</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Gurcan</surname><given-names>F</given-names> </name><name name-style="western"><surname>Soylu</surname><given-names>A</given-names> </name></person-group><article-title>Learning from imbalanced data: integration of advanced resampling techniques and machine learning models for enhanced cancer diagnosis and prognosis</article-title><source>Cancers (Basel)</source><year>2024</year><month>10</month><day>8</day><volume>16</volume><issue>19</issue><fpage>3417</fpage><pub-id pub-id-type="doi">10.3390/cancers16193417</pub-id><pub-id pub-id-type="medline">39410036</pub-id></nlm-citation></ref><ref id="ref48"><label>48</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Mendes</surname><given-names>JM</given-names> </name><name name-style="western"><surname>Barbar</surname><given-names>A</given-names> </name><name name-style="western"><surname>Refaie</surname><given-names>M</given-names> </name></person-group><article-title>Synthetic data generation: a privacy-preserving approach to accelerate rare disease research</article-title><source>Front Digit Health</source><year>2025</year><volume>7</volume><fpage>1563991</fpage><pub-id pub-id-type="doi">10.3389/fdgth.2025.1563991</pub-id><pub-id pub-id-type="medline">40171526</pub-id></nlm-citation></ref><ref id="ref49"><label>49</label><nlm-citation citation-type="report"><article-title>Survey on smartphone usage rates &#x0026; brands, smartwatches, and wireless earphones 2012-2023</article-title><year>2023</year><access-date>2026-03-07</access-date><publisher-name>Gallup</publisher-name><comment><ext-link ext-link-type="uri" xlink:href="https://www.gallup.co.kr/gallupdb/reportContent.asp?seqNo=1405">https://www.gallup.co.kr/gallupdb/reportContent.asp?seqNo=1405</ext-link></comment></nlm-citation></ref><ref id="ref50"><label>50</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Brietzke</surname><given-names>E</given-names> </name><name name-style="western"><surname>Hawken</surname><given-names>ER</given-names> </name><name name-style="western"><surname>Idzikowski</surname><given-names>M</given-names> </name><name name-style="western"><surname>Pong</surname><given-names>J</given-names> </name><name name-style="western"><surname>Kennedy</surname><given-names>SH</given-names> </name><name name-style="western"><surname>Soares</surname><given-names>CN</given-names> </name></person-group><article-title>Integrating digital phenotyping in clinical characterization of individuals with mood disorders</article-title><source>Neurosci Biobehav Rev</source><year>2019</year><month>09</month><volume>104</volume><fpage>223</fpage><lpage>230</lpage><pub-id pub-id-type="doi">10.1016/j.neubiorev.2019.07.009</pub-id><pub-id pub-id-type="medline">31330197</pub-id></nlm-citation></ref></ref-list><app-group><supplementary-material id="app1"><label>Multimedia Appendix 1</label><p>Descriptive statistics of the participants.</p><media xlink:href="ai_v5i1e69494_app1.docx" xlink:title="DOCX File, 19 KB"/></supplementary-material><supplementary-material id="app2"><label>Multimedia Appendix 2</label><p>Logistic regression results for attrition bias.</p><media xlink:href="ai_v5i1e69494_app2.docx" xlink:title="DOCX File, 17 KB"/></supplementary-material></app-group></back></article>