<?xml version="1.0" encoding="UTF-8"?><!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "journalpublishing.dtd"><article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" dtd-version="2.0" xml:lang="en" article-type="review-article"><front><journal-meta><journal-id journal-id-type="nlm-ta">JMIR Hum Factors</journal-id><journal-id journal-id-type="publisher-id">humanfactors</journal-id><journal-id journal-id-type="index">6</journal-id><journal-title>JMIR Human Factors</journal-title><abbrev-journal-title>JMIR Hum Factors</abbrev-journal-title><issn pub-type="epub">2292-9495</issn><publisher><publisher-name>JMIR Publications</publisher-name><publisher-loc>Toronto, Canada</publisher-loc></publisher></journal-meta><article-meta><article-id pub-id-type="publisher-id">v13i1e78648</article-id><article-id pub-id-type="doi">10.2196/78648</article-id><article-categories><subj-group subj-group-type="heading"><subject>Review</subject></subj-group></article-categories><title-group><article-title>Machine Learning for the Analysis of Healthy Lifestyle Data: Scoping Review and Guidelines</article-title></title-group><contrib-group><contrib contrib-type="author" corresp="yes"><name name-style="western"><surname>Estrella</surname><given-names>Tony</given-names></name><degrees>MSc</degrees><xref ref-type="aff" rid="aff1">1</xref><xref ref-type="aff" rid="aff2">2</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Capdevila</surname><given-names>Lluis</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff1">1</xref><xref ref-type="aff" rid="aff2">2</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Alfonso</surname><given-names>Carla</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff1">1</xref><xref ref-type="aff" rid="aff2">2</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Losilla</surname><given-names>Josep-Maria</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff1">1</xref><xref ref-type="aff" rid="aff3">3</xref></contrib></contrib-group><aff id="aff1"><institution>Sport Research Institute, Universitat Aut&#x00F2;noma de Barcelona</institution><addr-line>Bellaterra</addr-line><country>Spain</country></aff><aff id="aff2"><institution>Department of Basic Psychology, Universitat Aut&#x00F2;noma de Barcelona</institution><addr-line>Edifici N, Planta 1</addr-line><addr-line>Cerdanyola del Vall&#x00E8;s</addr-line><addr-line>Barcelona</addr-line><country>Spain</country></aff><aff id="aff3"><institution>Department of Psychobiology and Methodology of Health Science, Universitat Aut&#x00F2;noma de Barcelona</institution><addr-line>Cerdanyola del Vall&#x00E8;s</addr-line><addr-line>Barcelona</addr-line><country>Spain</country></aff><contrib-group><contrib contrib-type="editor"><name name-style="western"><surname>Kushniruk</surname><given-names>Andre</given-names></name></contrib></contrib-group><contrib-group><contrib contrib-type="reviewer"><name name-style="western"><surname>Adepoju</surname><given-names>Adewumi</given-names></name></contrib><contrib contrib-type="reviewer"><name name-style="western"><surname>Yogeshappa</surname><given-names>Vedamurthy Gejjegondanahalli</given-names></name></contrib></contrib-group><author-notes><corresp>Correspondence to Tony Estrella, MSc, Department of Basic Psychology, Universitat Aut&#x00F2;noma de Barcelona, Edifici N, Planta 1, Cerdanyola del Vall&#x00E8;s, Barcelona, 08193, Spain, 34 93 581 2758; <email>antonio.estrella@uab.cat</email></corresp></author-notes><pub-date pub-type="collection"><year>2026</year></pub-date><pub-date pub-type="epub"><day>27</day><month>2</month><year>2026</year></pub-date><volume>13</volume><elocation-id>e78648</elocation-id><history><date date-type="received"><day>06</day><month>06</month><year>2025</year></date><date date-type="rev-recd"><day>06</day><month>12</month><year>2025</year></date><date date-type="accepted"><day>14</day><month>12</month><year>2025</year></date></history><copyright-statement>&#x00A9; Tony Estrella, Lluis Capdevila, Carla Alfonso, Josep-Maria Losilla. Originally published in JMIR Human Factors (<ext-link ext-link-type="uri" xlink:href="https://humanfactors.jmir.org">https://humanfactors.jmir.org</ext-link>), 27.2.2026. </copyright-statement><copyright-year>2026</copyright-year><license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (<ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">https://creativecommons.org/licenses/by/4.0/</ext-link>), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Human Factors, is properly cited. The complete bibliographic information, a link to the original publication on <ext-link ext-link-type="uri" xlink:href="https://humanfactors.jmir.org">https://humanfactors.jmir.org</ext-link>, as well as this copyright and license information must be included.</p></license><self-uri xlink:type="simple" xlink:href="https://humanfactors.jmir.org/2026/1/e78648"/><abstract><sec><title>Background</title><p>Advances in data science and technology have transformed lifestyle research by enabling the integration of multimodal information and the generation of large-scale datasets. Despite the growing interest in machine learning (ML) within health behavior research, significant methodological gaps remain.</p></sec><sec><title>Objective</title><p>The study aims to systematically review the applications of supervised ML algorithms in the analysis of healthy lifestyle data, with a particular focus on the methodological approaches used. The specific objectives are to explore the types and sources of data used for health outcomes, examine the ML processes used, including explainable artificial intelligence (XAI) methods, and review the software tools used. Additionally, this review aims to provide practical guidelines to enhance the quality and transparency of future ML research in health.</p></sec><sec sec-type="methods"><title>Methods</title><p>Following the PRISMA-ScR (Preferred Reporting Items for Systematic Reviews and Meta-Analyses extension for Scoping Reviews) recommendations, the search was conducted across PubMed, PsycINFO, and Web of Science, yielding 65 studies that met the inclusion criteria.</p></sec><sec sec-type="results"><title>Results</title><p>Most studies (48/65, 74%) integrated multidomain data from physical activity, diet, sleep, and stress. Data sources were split between self-acquired data (33/65, 51%) and health repositories (32/65, 49%). Single-item measurements were common, particularly for physical activity, diet, and sleep. Although 40 of 65 studies used a multimodel approach, random forest was the most frequently applied algorithm. To improve explainability, 22 of 65 (33.84%) studies incorporated specific XAI methods, with 21 using Shapley Additive Explanation values and 1 using local interpretable model-agnostic explanations. R (R Core Team) and Python (Python Software Foundation) were the most widely used software tools, with variation in the libraries used.</p></sec><sec sec-type="conclusions"><title>Conclusions</title><p>This review highlights methodological gaps in the application of supervised ML to healthy lifestyle data. The ML workflow should span from data acquisition to explainability, using iterative steps to improve methodological rigor. Although multidomain data collection enhances the understanding of health issues related to lifestyle, representativeness remains limited due to methodological shortcomings in data acquisition. While random forest was the most commonly used algorithm, a multimodel approach is recommended for a comprehensive comparison. Lifestyle components consistently ranked among the top features in studies integrating XAI. Incorporating XAI methods into the ML pipeline can support personalized interventions, provided data collection is accurate. The R metapackage (tidymodels; Max Kuhn and Hadley Wickham) facilitates process evaluation through unified syntax, improving replicability. Methodological and reporting guidelines and a checklist are provided to enhance transparency and replicability in multidisciplinary ML research.</p></sec><sec sec-type="registered-report"><title>International Registered Report Identifier (IRRID)</title><p>RR2-10.37766/inplasy2023.3.0065</p></sec></abstract><kwd-group><kwd>machine learning</kwd><kwd>artificial intelligence</kwd><kwd>healthy lifestyle</kwd><kwd>physical activity</kwd><kwd>diet</kwd><kwd>sleep</kwd><kwd>stress</kwd><kwd>review</kwd><kwd>data analysis</kwd><kwd>XAI</kwd><kwd>explainable artificial intelligence</kwd></kwd-group></article-meta></front><body><sec id="s1" sec-type="intro"><title>Introduction</title><p>There is a growing interest in understanding the effects of synergistic relationships among lifestyle behaviors and their effect on health outcomes [<xref ref-type="bibr" rid="ref1">1</xref>,<xref ref-type="bibr" rid="ref2">2</xref>]. Traditionally, healthy lifestyle (HL) research has primarily focused on physical activity and diet. However, recent studies increasingly include sleep and stress management as critical components of lifestyle [<xref ref-type="bibr" rid="ref3">3</xref>,<xref ref-type="bibr" rid="ref4">4</xref>]. For instance, stress has been shown to negatively influence physical activity, sleep, and dietary habits [<xref ref-type="bibr" rid="ref5">5</xref>], which in turn have an overall impact on health and well-being. This multidimensional perspective has gained attention in public health under the concept of lifestyle medicine, which incorporates physical activity, diet, sleep, and stress management as cost-effective interventions to prevent noncommunicable diseases, such as cardiovascular and metabolic diseases [<xref ref-type="bibr" rid="ref6">6</xref>-<xref ref-type="bibr" rid="ref8">8</xref>].</p><p>Technological advances, including wearable devices and lifelogging processes, have significantly enhanced the capability to collect multimodal, high-frequency, and ecological lifestyle data [<xref ref-type="bibr" rid="ref9">9</xref>,<xref ref-type="bibr" rid="ref10">10</xref>]. This wealth of data provides valuable contextual information and insights for researchers and users [<xref ref-type="bibr" rid="ref11">11</xref>]. However, the vast amount and complexity of behavioral and physiological data expose significant analytical challenges. Traditional statistical models often struggle with the high dimensionality, heterogeneity, and nonlinearity typical of lifestyle studies. Recent progress in computational power and artificial intelligence (AI), particularly machine learning (ML), has contributed to addressing these limitations [<xref ref-type="bibr" rid="ref12">12</xref>].</p><p>ML models are capable of analyzing complex data types and generating insights and knowledge to improve decision-making [<xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref14">14</xref>]. Furthermore, ML algorithms can flexibly handle nonlinear relationships among features and outcomes. While the boundary between classical statistics and ML is not clear, ML algorithms are recognized for their flexible data-driven approach, avoiding the imposition of a predetermined relational structure between variables [<xref ref-type="bibr" rid="ref15">15</xref>-<xref ref-type="bibr" rid="ref17">17</xref>]. Additionally, prioritizing algorithms that maximize generalizability to new data, often referred to as scalability in the big data context, is crucial to face new health challenges [<xref ref-type="bibr" rid="ref18">18</xref>,<xref ref-type="bibr" rid="ref19">19</xref>]. These characteristics make ML analysis a suitable methodology for predictive modeling and feature extraction in health-related lifestyle research.</p><p>ML models are broadly classified into supervised learning (SL) and unsupervised learning (UL). In SL, the model is trained with labeled data, where each observation has an associated response measurement, to predict known outcomes such as disease risk or behavioral adherence [<xref ref-type="bibr" rid="ref19">19</xref>]. The goal of SL is to fit a model that can predict the response when applied to new data. When the response value is continuous, this is known as a &#x201C;regression problem&#x201D;; when the response is categorical, it is known as a &#x201C;classification problem.&#x201D; In contrast, in UL models, the goal is to discover patterns rather than predict outcomes, since there is no associated response to the input, and the model seeks relationships and similarities between observations. In the health domain, where diagnosis and detection are key focuses, SL, and particularly classification tasks, are more prevalent due to their ability to evaluate these predictions [<xref ref-type="bibr" rid="ref20">20</xref>,<xref ref-type="bibr" rid="ref21">21</xref>]. Clinical applications of SL include triage systems, prognosis prediction, and disease classification using rapid testing [<xref ref-type="bibr" rid="ref22">22</xref>]. Consequently, SL methods are standard in epidemiology to enhance clinical decisions based on input-output relationships [<xref ref-type="bibr" rid="ref23">23</xref>]. Since prediction and explainability are central concerns in health research, this scoping review focuses specifically on SL methods.</p><p>Despite the growing attention to ML in health behavior research, there remain significant methodological gaps. Prior reviews have focused primarily on outcome effectiveness or AI chatbot interventions, often providing limited detail about the ML process involved [<xref ref-type="bibr" rid="ref24">24</xref>]. A recent scoping review on ML methods used in health promotion and behavioral change found that the main interventions studied are those related to physical activity, while other crucial aspects of HL were overlooked, revealing an imbalance in this literature [<xref ref-type="bibr" rid="ref25">25</xref>]. Similarly, Lai et al [<xref ref-type="bibr" rid="ref26">26</xref>] reviewed the applications of large language models in exercise recommendations and physical activity, highlighting methodological limitations associated with these AI models. In sum, these studies underscore the need for a more comprehensive review to include a holistic concept of HL. Furthermore, methodological details such as data preprocessing, model evaluation, and explainability are often underreported, hindering transparency, reproducibility, and interdisciplinary collaboration.</p><p>To address the lack of explainability, explainable artificial intelligence (XAI) has emerged, which focuses on understanding AI algorithms and making them more transparent. XAI aims to provide human-understandable explanations for the decisions made by ML models [<xref ref-type="bibr" rid="ref27">27</xref>]. In HL research, XAI can be directed to identify the set of behaviors that significantly influence health, thereby enhancing transparency and trust in AI. It is important to distinguish between interpretability and explainability in the AI context. While interpretability refers to understanding the influence of each feature in the original model, explainability involves deriving actionable human insights from the model&#x2019;s predictions [<xref ref-type="bibr" rid="ref28">28</xref>]. Interpretability enables AI developers to delve into the model&#x2019;s decision-making to comprehend how algorithms reach their decisions. Conversely, explainability refers to the process for creating common meaning from model decisions and therefore provides human-readable explanations [<xref ref-type="bibr" rid="ref28">28</xref>]. Therefore, reporting the explainability method used in ML projects is crucial not only to enhance the decision-making process of the end user but also to understand how lifestyle factors interact with health outcomes.</p><p>Therefore, this study aims to systematically review the applications of supervised ML algorithms in analyzing HL data, with a specific focus on the methodological aspects used in these studies, rather than their results. The specific objectives are to explore (1) the specific lifestyle data used in health outcome studies; (2) the sources and types of data subjected to analysis; (3) the characteristics of the ML models, including XAI methods; and (4) the programs and libraries used for ML implementation. Additionally, based on the findings of this scoping review, we aim to provide practical guidelines to enhance the quality and transparency of future ML research in lifestyle science. A scoping review is the type of systematized review (ie, systematic, transparent, and replicable) most appropriate for addressing these objectives [<xref ref-type="bibr" rid="ref29">29</xref>].</p></sec><sec id="s2" sec-type="methods"><title>Method</title><sec id="s2-1"><title>Overview</title><p>To maximize the reporting quality of this scoping review, we followed the PRISMA-ScR (Preferred Reporting Items for Systematic Reviews and Meta-Analyses extension for Scoping Reviews) recommendations [<xref ref-type="bibr" rid="ref30">30</xref>] (checklist provided in <xref ref-type="supplementary-material" rid="app2">Checklist 1</xref>). The protocol for this scoping review was registered with the International Platform of Registered Systematic Review and Meta-Analysis Protocols (INPLASY) [<xref ref-type="bibr" rid="ref31">31</xref>]. All data generated in this review are provided in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref> and are accessible in the institutional repository [<xref ref-type="bibr" rid="ref32">32</xref>].</p></sec><sec id="s2-2"><title>Search Strategy</title><p>In this scoping review, we searched for primary studies in the 3 principal health databases: PubMed (National Center for Biotechnology Information), PsycINFO (ProQuest), and Web of Science (Clarivate). The search was restricted to medical and psychological databases to capture studies directly relevant to health outcomes. Consequently, studies primarily published in engineering or computer science, which may focus on algorithm development or sensor-based data processing, were not included. The search strategy followed the PRESS (Peer Review of Electronic Search Strategies) [<xref ref-type="bibr" rid="ref33">33</xref>] and PRISMA-S (Preferred Reporting Items for Systematic Reviews and Meta-Analyses&#x2013;Search extension) guidelines [<xref ref-type="bibr" rid="ref34">34</xref>] and consisted of 2 groups of search terms referring to (1) HL and (2) ML. We also added a third group of terms preceded by the Boolean operator &#x201C;NOT&#x201D; to improve the specificity of the search strategy.</p><p>This scoping review adopts a health-focused perspective, in which HL is treated as a multidimensional construct rather than the sum of isolated behaviors [<xref ref-type="bibr" rid="ref6">6</xref>,<xref ref-type="bibr" rid="ref35">35</xref>,<xref ref-type="bibr" rid="ref36">36</xref>]. Therefore, the umbrella term HL was combined using the operator &#x201C;OR&#x201D; with an interaction block including (1) physical activity, (2) diet, (3) sleep, and (4) stress. This block is aligned with the multiple health behavior change and lifestyle medicine frameworks, in which the interaction between behaviors is a central construct [<xref ref-type="bibr" rid="ref37">37</xref>,<xref ref-type="bibr" rid="ref38">38</xref>].</p><p>The search strategy was adapted to the specific syntax of each database (Table S1 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). The search was conducted on October 10, 2025, with language restrictions (English and Spanish) but without limitations on publication years.</p></sec><sec id="s2-3"><title>Study Selection</title><sec id="s2-3-1"><title>Inclusion and Exclusion Criteria</title><p>Studies were included in or excluded from the review according to the following criteria provided in <xref ref-type="other" rid="box1">Textbox 1</xref>.</p><boxed-text id="box1"><title> Inclusion and exclusion criteria.</title><p><bold>Inclusion criteria:</bold></p><list list-type="bullet"><list-item><p>Used supervised machine learning (ML) models for analyzing lifestyle data.</p></list-item><list-item><p>Analyzed lifestyle behaviors as either inputs or outputs of the ML models.</p></list-item><list-item><p>Used data from real individuals (not simulations).</p></list-item><list-item><p>Published in English or Spanish.</p></list-item></list><p><bold>Exclusion criteria:</bold></p><list list-type="bullet"><list-item><p>Focused on unsupervised learning (UL) without connection to supervised learning (SL) modeling.</p></list-item><list-item><p>Focused on mathematical formulation or guidelines for implementing ML models in health.</p></list-item><list-item><p>Used simulated data or aimed to develop a chatbot or app based on ML.</p></list-item><list-item><p>Primarily addressed substance abuse, such as alcohol intake or smoking cessation.</p></list-item><list-item><p>Focused exclusively on classical statistical regression algorithms, such as linear or logistic regression, which were not considered ML on their own in this review.</p></list-item></list></boxed-text></sec><sec id="s2-3-2"><title>Justification of Exclusions</title><p>UL algorithms were excluded because they do not have an associated response to inputs, thereby lacking performance evaluation. Classical statistical regression algorithms, such as linear or logistic regression, were not considered in this review. While the boundary between classical statistics and ML is not clear, ML algorithms are recognized for their flexible data-driven approach, avoiding the imposition of a predetermined relational structure between variables [<xref ref-type="bibr" rid="ref15">15</xref>-<xref ref-type="bibr" rid="ref17">17</xref>]. Additionally, prioritizing algorithms that maximize generalizability to new data, often referred to as scalability in the big data context, is crucial to address new health challenges [<xref ref-type="bibr" rid="ref18">18</xref>,<xref ref-type="bibr" rid="ref19">19</xref>]. Consequently, studies focusing exclusively on this type of statistical algorithm were excluded. However, we acknowledge that the use of a model ensemble approach allows for the inclusion of these statistical algorithms to assess the performance of different algorithms during the evaluation step. Studies on substance abuse disorders were excluded as they involve distinct behavioral and neurobiological mechanisms that differ substantially from the domains of physical activity, diet, sleep, and stress, which are the core components of HL behaviors as defined in this review. In addition, substance abuse is categorized within the risk avoidance cluster, which is conceptually distinct from the other 4 behaviors examined in this review [<xref ref-type="bibr" rid="ref3">3</xref>]. This distinction is well established in multiple health behavior theories, which differentiate behaviors that enhance health from those that reduce risk through avoidance. Therefore, its exclusion preserves the applicability of results to a multiple health behavior framework, as the selected behaviors are interrelated through shared psychological resources [<xref ref-type="bibr" rid="ref2">2</xref>,<xref ref-type="bibr" rid="ref39">39</xref>].</p><p>Two reviewers (TE and CA) independently screened titles and abstracts in the first phase and full texts in the second phase. Discrepancies were resolved by consensus, with the participation of a third reviewer (JML) when necessary. Agreement between reviewers during the selection process was analyzed by calculating Cohen &#x03BA;.</p></sec></sec><sec id="s2-4"><title>Data Management</title><p>Mendeley was used as reference management software; the results of the search strategy were entered, and duplicates were merged or removed. An ad hoc checklist was used to extract information from the included papers. The checklist was divided into 5 sections:</p><list list-type="bullet"><list-item><p>General information: authors, title, year, and country of affiliation.</p></list-item><list-item><p>Methodological data: type of study, aim, year of data collection, form of data acquisition, sample, and countries represented in the data.</p></list-item><list-item><p>Study variables: health issues, lifestyle features, and the model&#x2019;s input and output variables.</p></list-item><list-item><p>Software: statistical programming language, libraries, and packages.</p></list-item><list-item><p>Model aspects: type of problem, stages of ML analysis, ML methods, model evaluation, evaluation metrics, and XAI methods.</p></list-item></list></sec><sec id="s2-5"><title>Strategy of Data Synthesis</title><p>The review was presented as a narrative synthesis, and the information was summarized in tables and figures. The information extracted from the studies was divided into 3 blocks: type of data, ML process, and software. For data extraction, we focused on lifestyle components, health outcomes, data sources, acquisition methods, and data typology. Regarding the ML process, we focused on the whole process, consisting of preprocessing, modeling, validation, evaluation, and XAI methods. For model evaluation, only the procedures used for final performance assessment were extracted. When studies reported cross-validation, we classified it as the final performance estimation method unless authors explicitly stated its use for hyperparameter optimization. To identify the top-ranked lifestyle components in the XAI analysis, we systematically examined the figures and tables reported in each study. In this review, the term ranked refers to features that were highlighted by the XAI algorithm. In contrast, unranked indicates that appeared in the model but were not reported in the XAI visualization, while not available denotes features that were not included in the ML model. Software used in each study was also recorded.</p></sec></sec><sec id="s3" sec-type="results"><title>Results</title><sec id="s3-1"><title>Overview</title><p>A total of 2249 papers were retrieved from the databases, and 65 studies met the eligibility criteria and were included in this scoping review (refer to <xref ref-type="fig" rid="figure1">Figure 1</xref>). There was very good agreement between reviewers during the selection process: 96% (n=52; &#x03BA;=0.84, 95% CI 0.61-1.0) in the title and abstract screening and 94% (n=35; &#x03BA;=0.88, 95% CI 0.71-1.0) in the full-text screening.</p><fig position="float" id="figure1"><label>Figure 1.</label><caption><p>PRISMA (Preferred Reporting Items for Systematic Reviews and Meta-Analyses) flow diagram of the scientific literature search and selection. ML: machine learning.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="humanfactors_v13i1e78648_fig01.png"/></fig><p>From this point forward, the &#x201C;Results&#x201D; section is structured following the ML workflow depicted in <xref ref-type="fig" rid="figure2">Figure 2</xref>, which illustrates the 5 key steps in the ML pipeline. The process begins with data acquisition, followed by preprocessing to prepare the data. Then, SL algorithms are applied and evaluated to determine their effectiveness. Finally, explainability techniques are used to understand the models. The dashed lines indicate that modeling, evaluation, and explainability can improve earlier stages, making the process iterative. Each stage of the process corresponds to a subsection. Finally, we examined the software used throughout the entire process in the included studies.</p><fig position="float" id="figure2"><label>Figure 2.</label><caption><p>Overview of the machine learning workflow, spanning from data acquisition to explainability. The dashed lines represent iterative feedback loops within the process. LIME: local interpretable model-agnostic explanations; SHAP: Shapley Additive Explanation.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="humanfactors_v13i1e78648_fig02.png"/></fig></sec><sec id="s3-2"><title>Data Acquisition: Collection Modes, Data Typology, Lifestyle Variables, and Health Outcomes</title><p>The 65 papers included in this review were published between 2004 and 2025, with 57 (87.7%) published since 2019. <xref ref-type="fig" rid="figure3">Figure 3</xref> shows the annual productivity output stratified by lifestyle components. The studies were carried out in several geographical regions across 4 continents (Table S2 and Figure S1 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). The mean sample size was 29,905.14 participants, with the smallest study including 8 participants and the largest including 470,778 participants.</p><fig position="float" id="figure3"><label>Figure 3.</label><caption><p>Bar graph showing productivity by publication year, with each line and dot representing a lifestyle component.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="humanfactors_v13i1e78648_fig03.png"/></fig><p>Four lifestyle domains were identified in the review: physical activity, diet, sleep, and stress. Most studies (48/65, 74%) integrated data from more than 1 lifestyle domain (refer to <xref ref-type="table" rid="table1">Table 1</xref>). The most studied component was physical activity, featured in 61 of 65 studies. Diet and sleep appeared in 33 of 65 (51%) and 34 of 65 (52%) studies, respectively, while stress appeared in 15 of 65 (23%) studies (refer to <xref ref-type="fig" rid="figure3">Figure 3</xref>). Only 17 of 65 (26%) studies focused exclusively on a single domain (15 on physical activity [<xref ref-type="bibr" rid="ref40">40</xref>-<xref ref-type="bibr" rid="ref54">54</xref>] and 2 on sleep [<xref ref-type="bibr" rid="ref55">55</xref>,<xref ref-type="bibr" rid="ref56">56</xref>]).</p><p>Regarding data sources, 33 of 65 (51%) studies relied on self-acquired data, while 32 of 65 (49%) studies used either private or public health datasets, such as UK Biobank [<xref ref-type="bibr" rid="ref57">57</xref>]. Among the studies using self-acquired data, the mean sample size was 10,503.41 participants. Six studies focused exclusively on females [<xref ref-type="bibr" rid="ref46">46</xref>,<xref ref-type="bibr" rid="ref47">47</xref>,<xref ref-type="bibr" rid="ref58">58</xref>-<xref ref-type="bibr" rid="ref61">61</xref>], and 27 studies reported a female proportion ranging from 41% to 89.4%. Studies using health repositories exhibited a greater mean sample size of 80,406.38 participants. Nineteen studies reported a female proportion ranging from 41.33% to 70%, 12 did not report sex distribution, and 1 study focused exclusively on females.</p><p><xref ref-type="fig" rid="figure4">Figure 4</xref> summarizes the different data collection modes used for each of the 4 lifestyle domains identified (Table S3 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref> provides a detailed description of each measure). Single-item measures were used in 40 of 65 (61.5%) studies assessing physical activity, 18 of 65 (27.7%) studies assessing diet, and 22 of 65 (33.8%) studies assessing sleep. Despite the heterogeneity of these items, distinct categories emerged within each lifestyle domain.</p><p>For physical activity, the emerging categories included engagement in physical activities [<xref ref-type="bibr" rid="ref47">47</xref>,<xref ref-type="bibr" rid="ref50">50</xref>-<xref ref-type="bibr" rid="ref52">52</xref>,<xref ref-type="bibr" rid="ref54">54</xref>,<xref ref-type="bibr" rid="ref58">58</xref>,<xref ref-type="bibr" rid="ref62">62</xref>-<xref ref-type="bibr" rid="ref66">66</xref>], intensity [<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref42">42</xref>,<xref ref-type="bibr" rid="ref49">49</xref>,<xref ref-type="bibr" rid="ref57">57</xref>,<xref ref-type="bibr" rid="ref67">67</xref>-<xref ref-type="bibr" rid="ref71">71</xref>], frequency [<xref ref-type="bibr" rid="ref43">43</xref>,<xref ref-type="bibr" rid="ref44">44</xref>,<xref ref-type="bibr" rid="ref60">60</xref>,<xref ref-type="bibr" rid="ref72">72</xref>-<xref ref-type="bibr" rid="ref86">86</xref>], and environmental factors [<xref ref-type="bibr" rid="ref87">87</xref>,<xref ref-type="bibr" rid="ref88">88</xref>]. Within the diet domain, categories included frequency of consumption [<xref ref-type="bibr" rid="ref58">58</xref>,<xref ref-type="bibr" rid="ref60">60</xref>,<xref ref-type="bibr" rid="ref66">66</xref>,<xref ref-type="bibr" rid="ref72">72</xref>,<xref ref-type="bibr" rid="ref84">84</xref>], types of products [<xref ref-type="bibr" rid="ref75">75</xref>,<xref ref-type="bibr" rid="ref76">76</xref>,<xref ref-type="bibr" rid="ref80">80</xref>,<xref ref-type="bibr" rid="ref82">82</xref>], environmental factors [<xref ref-type="bibr" rid="ref87">87</xref>], and consumption habits [<xref ref-type="bibr" rid="ref59">59</xref>,<xref ref-type="bibr" rid="ref62">62</xref>,<xref ref-type="bibr" rid="ref65">65</xref>,<xref ref-type="bibr" rid="ref68">68</xref>,<xref ref-type="bibr" rid="ref70">70</xref>,<xref ref-type="bibr" rid="ref71">71</xref>,<xref ref-type="bibr" rid="ref86">86</xref>,<xref ref-type="bibr" rid="ref89">89</xref>]. Regarding sleep, categories included sleep duration [<xref ref-type="bibr" rid="ref57">57</xref>,<xref ref-type="bibr" rid="ref60">60</xref>,<xref ref-type="bibr" rid="ref62">62</xref>,<xref ref-type="bibr" rid="ref66">66</xref>-<xref ref-type="bibr" rid="ref68">68</xref>,<xref ref-type="bibr" rid="ref70">70</xref>,<xref ref-type="bibr" rid="ref72">72</xref>,<xref ref-type="bibr" rid="ref77">77</xref>-<xref ref-type="bibr" rid="ref79">79</xref>,<xref ref-type="bibr" rid="ref81">81</xref>,<xref ref-type="bibr" rid="ref82">82</xref>,<xref ref-type="bibr" rid="ref84">84</xref>,<xref ref-type="bibr" rid="ref85">85</xref>,<xref ref-type="bibr" rid="ref87">87</xref>], perceived sleep quality [<xref ref-type="bibr" rid="ref63">63</xref>,<xref ref-type="bibr" rid="ref89">89</xref>], and sleep-related problems [<xref ref-type="bibr" rid="ref69">69</xref>,<xref ref-type="bibr" rid="ref80">80</xref>]. Finally, within the stress domain, the emerging category focused primarily on stress level [<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref57">57</xref>,<xref ref-type="bibr" rid="ref79">79</xref>,<xref ref-type="bibr" rid="ref82">82</xref>,<xref ref-type="bibr" rid="ref86">86</xref>,<xref ref-type="bibr" rid="ref89">89</xref>,<xref ref-type="bibr" rid="ref90">90</xref>].</p><p>Questionnaires were used to collect physical activity data in 13 studies. The standardized questionnaires included the Global Physical Activity Questionnaire (GPAQ) [<xref ref-type="bibr" rid="ref53">53</xref>,<xref ref-type="bibr" rid="ref72">72</xref>,<xref ref-type="bibr" rid="ref91">91</xref>], the International Physical Activity Questionnaire (IPAQ) [<xref ref-type="bibr" rid="ref92">92</xref>], the Lifetime Total Physical Activity Questionnaire (exercise and sport subscale) [<xref ref-type="bibr" rid="ref93">93</xref>], the Nutritional and Social Healthy Habits (NutSo-HH) scale [<xref ref-type="bibr" rid="ref94">94</xref>], the Indian Migration Study Physical Activity Questionnaire (IMS-PAQ) [<xref ref-type="bibr" rid="ref95">95</xref>], physical fitness test [<xref ref-type="bibr" rid="ref41">41</xref>], the Short Questionnaire to Assess Health-Enhancing Physical Activity (SQUASH) [<xref ref-type="bibr" rid="ref73">73</xref>,<xref ref-type="bibr" rid="ref74">74</xref>], the physical activity scale from the Active Living Index [<xref ref-type="bibr" rid="ref88">88</xref>], the Pregnancy Physical Activity Questionnaire [<xref ref-type="bibr" rid="ref61">61</xref>], and the Physical Activity Scale for the Elderly [<xref ref-type="bibr" rid="ref96">96</xref>]. For diet assessment, 12 studies used the Food Frequency Questionnaire (FFQ) [<xref ref-type="bibr" rid="ref57">57</xref>,<xref ref-type="bibr" rid="ref73">73</xref>,<xref ref-type="bibr" rid="ref74">74</xref>,<xref ref-type="bibr" rid="ref83">83</xref>,<xref ref-type="bibr" rid="ref88">88</xref>,<xref ref-type="bibr" rid="ref91">91</xref>,<xref ref-type="bibr" rid="ref92">92</xref>,<xref ref-type="bibr" rid="ref95">95</xref>], the PrimeScreen questionnaire [<xref ref-type="bibr" rid="ref61">61</xref>], the Mini Nutritional Assessment [<xref ref-type="bibr" rid="ref97">97</xref>], the NutSo-HH scale [<xref ref-type="bibr" rid="ref94">94</xref>], and a nonstandardized questionnaire consisting of items from different questionnaires [<xref ref-type="bibr" rid="ref93">93</xref>]. The standardized questionnaires used to measure sleep were the Pittsburgh Sleep Quality Index [<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref56">56</xref>,<xref ref-type="bibr" rid="ref61">61</xref>,<xref ref-type="bibr" rid="ref86">86</xref>,<xref ref-type="bibr" rid="ref91">91</xref>,<xref ref-type="bibr" rid="ref92">92</xref>,<xref ref-type="bibr" rid="ref96">96</xref>,<xref ref-type="bibr" rid="ref97">97</xref>], the NutSo-HH scale [<xref ref-type="bibr" rid="ref94">94</xref>], the Munich Chronotype questionnaire and Sleep Disturbance Scale for Children [<xref ref-type="bibr" rid="ref64">64</xref>], and the Epworth Sleepiness Scale [<xref ref-type="bibr" rid="ref96">96</xref>]. To measure stress, the stress subscale of the Depression Anxiety Stress Scale (DASS) [<xref ref-type="bibr" rid="ref92">92</xref>,<xref ref-type="bibr" rid="ref93">93</xref>], the INTERHEART stress questionnaire [<xref ref-type="bibr" rid="ref59">59</xref>], the Psychosocial Well-being Index-Short Form [<xref ref-type="bibr" rid="ref91">91</xref>], the Perceived Stress Scale [<xref ref-type="bibr" rid="ref61">61</xref>,<xref ref-type="bibr" rid="ref64">64</xref>,<xref ref-type="bibr" rid="ref88">88</xref>], and the Profile of Mood States [<xref ref-type="bibr" rid="ref81">81</xref>] were used. Regarding data collection through sensors, most studies used wearable devices. One study used a smartphone to obtain points of interest related to physical activity and diet [<xref ref-type="bibr" rid="ref98">98</xref>], and 1 sleep study used polysomnography [<xref ref-type="bibr" rid="ref55">55</xref>]. Finally, 2 studies used words related to physical activity and diet, 1 derived from Google Trends [<xref ref-type="bibr" rid="ref99">99</xref>] and the other from Twitter (Twitter, Inc) [<xref ref-type="bibr" rid="ref100">100</xref>]<italic>.</italic></p><p>Concerning the modeled inputs, 56 of 65 (86.1%) studies used multimodal data. The input modalities were lifestyle (60/65, 92.3%), sociodemographic (49/65, 75.3%), clinical (29/65, 44.6%), anthropometric (14/65, 21.5%), psychological (20/65, 30.7%), physical (3/65, 4.62%), environmental (10/65, 15.38%), physiological (3/65, 4.62%), and behavioral (2/65, 3.07%). The model outcomes included lifestyle domains in 14 (22% studies; 5 physical activity [<xref ref-type="bibr" rid="ref40">40</xref>,<xref ref-type="bibr" rid="ref44">44</xref>-<xref ref-type="bibr" rid="ref46">46</xref>,<xref ref-type="bibr" rid="ref90">90</xref>], 5 sleep [<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref48">48</xref>,<xref ref-type="bibr" rid="ref86">86</xref>,<xref ref-type="bibr" rid="ref97">97</xref>,<xref ref-type="bibr" rid="ref101">101</xref>], 3 diet [<xref ref-type="bibr" rid="ref62">62</xref>,<xref ref-type="bibr" rid="ref66">66</xref>,<xref ref-type="bibr" rid="ref94">94</xref>], and 1 stress [<xref ref-type="bibr" rid="ref61">61</xref>]) and other health outcomes in 51 (75% studies; with mental health, cancer, cardiovascular diseases, and diabetes being the most frequent categories; refer to <xref ref-type="table" rid="table1">Table 1</xref>).</p><p>Cross-sectional data were acquired in 36 (55%) studies [<xref ref-type="bibr" rid="ref42">42</xref>-<xref ref-type="bibr" rid="ref44">44</xref>,<xref ref-type="bibr" rid="ref51">51</xref>-<xref ref-type="bibr" rid="ref53">53</xref>,<xref ref-type="bibr" rid="ref56">56</xref>-<xref ref-type="bibr" rid="ref58">58</xref>,<xref ref-type="bibr" rid="ref60">60</xref>-<xref ref-type="bibr" rid="ref62">62</xref>,<xref ref-type="bibr" rid="ref65">65</xref>,<xref ref-type="bibr" rid="ref66">66</xref>,<xref ref-type="bibr" rid="ref71">71</xref>-<xref ref-type="bibr" rid="ref74">74</xref>,<xref ref-type="bibr" rid="ref77">77</xref>-<xref ref-type="bibr" rid="ref80">80</xref>,<xref ref-type="bibr" rid="ref84">84</xref>,<xref ref-type="bibr" rid="ref85">85</xref>,<xref ref-type="bibr" rid="ref89">89</xref>,<xref ref-type="bibr" rid="ref92">92</xref>,<xref ref-type="bibr" rid="ref94">94</xref>,<xref ref-type="bibr" rid="ref95">95</xref>,<xref ref-type="bibr" rid="ref97">97</xref>], longitudinal data in 18 (28%) [<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref41">41</xref>,<xref ref-type="bibr" rid="ref50">50</xref>,<xref ref-type="bibr" rid="ref54">54</xref>,<xref ref-type="bibr" rid="ref55">55</xref>,<xref ref-type="bibr" rid="ref59">59</xref>,<xref ref-type="bibr" rid="ref64">64</xref>,<xref ref-type="bibr" rid="ref67">67</xref>-<xref ref-type="bibr" rid="ref69">69</xref>,<xref ref-type="bibr" rid="ref81">81</xref>,<xref ref-type="bibr" rid="ref82">82</xref>,<xref ref-type="bibr" rid="ref96">96</xref>] studies, time-series data in 7 (11%) [<xref ref-type="bibr" rid="ref45">45</xref>,<xref ref-type="bibr" rid="ref46">46</xref>,<xref ref-type="bibr" rid="ref48">48</xref>,<xref ref-type="bibr" rid="ref75">75</xref>,<xref ref-type="bibr" rid="ref76">76</xref>,<xref ref-type="bibr" rid="ref101">101</xref>,<xref ref-type="bibr" rid="ref102">102</xref>] studies, combined longitudinal and time-series data in 1 study [<xref ref-type="bibr" rid="ref90">90</xref>], textual data in 2 studies [<xref ref-type="bibr" rid="ref99">99</xref>,<xref ref-type="bibr" rid="ref100">100</xref>], and combined cross-sectional and geographical data in 1 study [<xref ref-type="bibr" rid="ref103">103</xref>].</p><table-wrap id="t1" position="float"><label>Table 1.</label><caption><p>Summary of the machine learning (ML) workflow from data acquisition to explainability in the included studies.</p></caption><table id="table1" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Study</td><td align="left" valign="bottom">Physical activity</td><td align="left" valign="bottom">Diet</td><td align="left" valign="bottom">Sleep</td><td align="left" valign="bottom">Stress</td><td align="left" valign="bottom">Health outcome</td><td align="left" valign="bottom">Preprocess</td><td align="left" valign="bottom">ML<sup><xref ref-type="table-fn" rid="table1fn1">a</xref></sup> algorithm</td><td align="left" valign="bottom">Model evaluation</td><td align="left" valign="bottom">XAI<sup><xref ref-type="table-fn" rid="table1fn2">b</xref></sup></td></tr></thead><tbody><tr><td align="left" valign="top">Abdul Rahman et al [<xref ref-type="bibr" rid="ref72">72</xref>]</td><td align="left" valign="top">Questionnaire (standardized) and single items (frequency)</td><td align="left" valign="top">Single items (frequency)</td><td align="left" valign="top">Single items (sleep hours)</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Mental health</td><td align="left" valign="top">Missing imputation, Resampling, and dimensionality reduction</td><td align="left" valign="top">RF<sup><xref ref-type="table-fn" rid="table1fn3">c</xref></sup>, ANN<sup><xref ref-type="table-fn" rid="table1fn4">d</xref></sup>, NB<sup><xref ref-type="table-fn" rid="table1fn5">e</xref></sup>, and KNN<sup><xref ref-type="table-fn" rid="table1fn6">f</xref></sup></td><td align="left" valign="top">Hold-out test set</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top">Afrash et al [<xref ref-type="bibr" rid="ref58">58</xref>]</td><td align="left" valign="top">Single items (engagement)</td><td align="left" valign="top">Single items (frequency)</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Cancer</td><td align="left" valign="top">Transformation, missing imputation, and dimensionality reduction</td><td align="left" valign="top">DT<sup><xref ref-type="table-fn" rid="table1fn7">g</xref></sup>, MLPNN<sup><xref ref-type="table-fn" rid="table1fn8">h</xref></sup>, RBFNN<sup><xref ref-type="table-fn" rid="table1fn9">i</xref></sup>, FNN<sup><xref ref-type="table-fn" rid="table1fn10">j</xref></sup>, PNN<sup><xref ref-type="table-fn" rid="table1fn11">k</xref></sup>, and KNN</td><td align="left" valign="top">10-fold cross-validation (final evaluation)</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top">Ai et al [<xref ref-type="bibr" rid="ref93">93</xref>]</td><td align="left" valign="top">Questionnaire (standardized) and single items (frequency)</td><td align="left" valign="top">Questionnaire (nonstandardized)</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Questionnaire (standardized)</td><td align="left" valign="top">Alzheimer disease</td><td align="left" valign="top">Transformation, missing imputation, and dimensionality reduction</td><td align="left" valign="top">RF and SVM<sup><xref ref-type="table-fn" rid="table1fn12">l</xref></sup></td><td align="left" valign="top">Nested cross-validation</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top">Allen [<xref ref-type="bibr" rid="ref87">87</xref>]</td><td align="left" valign="top">Single items (environment)</td><td align="left" valign="top">Single items (environment)</td><td align="left" valign="top">Single items (sleep hours)</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Obesity</td><td align="left" valign="top">Missing imputation and dimensionality reduction</td><td align="left" valign="top">RF and DT</td><td align="left" valign="top">2-fold cross-validation (final evaluation)</td><td align="left" valign="top">LIME<sup><xref ref-type="table-fn" rid="table1fn13">m</xref></sup></td></tr><tr><td align="left" valign="top">Alshuraf et al [<xref ref-type="bibr" rid="ref59">59</xref>]</td><td align="left" valign="top">Sensor (wearable)</td><td align="left" valign="top">Single items (habits)</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Questionnaire (standardized)</td><td align="left" valign="top">Cardiovascular disease</td><td align="left" valign="top">Transformation, missing imputation, and dimensionality reduction</td><td align="left" valign="top">RF, DT, KNN, and NB</td><td align="left" valign="top">Leave-one-out cross-validation (LOOCV)</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top">Birk et al [<xref ref-type="bibr" rid="ref95">95</xref>]</td><td align="left" valign="top">Questionnaire (standardized)</td><td align="left" valign="top">Questionnaire (standardized)</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Diabetes</td><td align="left" valign="top">Resampling and dimensionality reduction</td><td align="left" valign="top">RF</td><td align="left" valign="top">Hold-out test set</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top">B&#x00F4;to et al [<xref ref-type="bibr" rid="ref62">62</xref>]</td><td align="left" valign="top">Single items (engagement)</td><td align="left" valign="top">Single items (habits)</td><td align="left" valign="top">Single items (sleep hours)</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Lifestyle (diet)</td><td align="left" valign="top">Transformation and dimensionality reduction</td><td align="left" valign="top">DT</td><td align="left" valign="top">Not reported</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top">Butkevi&#x010D;i&#x016B;t&#x0117; et al [<xref ref-type="bibr" rid="ref40">40</xref>]</td><td align="left" valign="top">Sensor (wearable)</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Lifestyle (physical activity)</td><td align="left" valign="top">Transformation</td><td align="left" valign="top">RF</td><td align="left" valign="top">5-fold cross-validation (final evaluation)</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top">Cai et al [<xref ref-type="bibr" rid="ref41">41</xref>]</td><td align="left" valign="top">Questionnaire (standardized)</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Successful aging</td><td align="left" valign="top">Transformation and dimensionality reduction</td><td align="left" valign="top">RF, GBM<sup><xref ref-type="table-fn" rid="table1fn14">n</xref></sup>, and ANN</td><td align="left" valign="top">10-fold cross-validation (final evaluation)</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top">Cheung et al [<xref ref-type="bibr" rid="ref90">90</xref>]</td><td align="left" valign="top">Sensor (wearable)</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Single items (stress level)</td><td align="left" valign="top">Lifestyle (physical activity)</td><td align="left" valign="top">Dimensionality reduction</td><td align="left" valign="top">RF and DT</td><td align="left" valign="top">Not reported</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top">Chiang and Dey [<xref ref-type="bibr" rid="ref102">102</xref>]</td><td align="left" valign="top">Sensor (wearable)</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Sensor (wearable)</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Blood pressure</td><td align="left" valign="top">Transformation, missing imputation, and dimensionality reduction</td><td align="left" valign="top">RF, GBM, MLPNN, LSTM-RNN<sup><xref ref-type="table-fn" rid="table1fn15">o</xref></sup>, and SVM</td><td align="left" valign="top">5-fold cross-validation (final evaluation) and online weighted-resampling</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top">Cort&#x00E9;s-Iba&#x00F1;ez et al [<xref ref-type="bibr" rid="ref73">73</xref>]</td><td align="left" valign="top">Questionnaire (standardized) and single items (frequency)</td><td align="left" valign="top">Questionnaire (standardized)</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Cancer</td><td align="left" valign="top">Transformation, missing imputation, resampling, and dimensionality reduction</td><td align="left" valign="top">RF and SVM</td><td align="left" valign="top">Hold-out test set</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top">Cort&#x00E9;s-Iba&#x00F1;ez et al [<xref ref-type="bibr" rid="ref74">74</xref>]</td><td align="left" valign="top">Questionnaire (standardized) and single items (frequency)</td><td align="left" valign="top">Questionnaire (standardized)</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Cancer</td><td align="left" valign="top">Transformation, resampling, and dimensionality reduction</td><td align="left" valign="top">RF, GBM, and SVM</td><td align="left" valign="top">5-fold cross-validation (final evaluation)</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top">Dianati-Nasab et al [<xref ref-type="bibr" rid="ref47">47</xref>]</td><td align="left" valign="top">Single items (engagement)</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Cancer</td><td align="left" valign="top">Missing imputation and dimensionality reduction</td><td align="left" valign="top">RF, DT, XGBoost<sup><xref ref-type="table-fn" rid="table1fn16">p</xref></sup>, and ANN</td><td align="left" valign="top">10-fold cross-validation (final evaluation)</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top">Faruqui et al [<xref ref-type="bibr" rid="ref75">75</xref>]</td><td align="left" valign="top">Single items (frequency)</td><td align="left" valign="top">Single items (type of products)</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Diabetes</td><td align="left" valign="top">Transformation and missing imputation</td><td align="left" valign="top">LSTM-RNN, ANN, and KNN</td><td align="left" valign="top">Hold-out test set</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top">Gu et al [<xref ref-type="bibr" rid="ref60">60</xref>]</td><td align="left" valign="top">Single items (frequency)</td><td align="left" valign="top">Single items (frequency)</td><td align="left" valign="top">Single items (sleep hours)</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Infertility risk in women</td><td align="left" valign="top">Dimensionality reduction</td><td align="left" valign="top">RF, DT, BoostDT<sup><xref ref-type="table-fn" rid="table1fn17">q</xref></sup>, LightGBM<sup><xref ref-type="table-fn" rid="table1fn18">r</xref></sup>, and AdaBoost<sup><xref ref-type="table-fn" rid="table1fn19">s</xref></sup></td><td align="left" valign="top">Hold-out test set</td><td align="left" valign="top">SHAP<sup><xref ref-type="table-fn" rid="table1fn20">t</xref></sup> values</td></tr><tr><td align="left" valign="top">Guthrie et al [<xref ref-type="bibr" rid="ref76">76</xref>]</td><td align="left" valign="top">Single items (frequency)</td><td align="left" valign="top">Single items (type of products)</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Cardiometabolic disease</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">RF</td><td align="left" valign="top">Leave-one-out cross-validation (LOOCV)</td><td align="left" valign="top">SHAP values</td></tr><tr><td align="left" valign="top">Hu et al [<xref ref-type="bibr" rid="ref77">77</xref>]</td><td align="left" valign="top">Single items (frequency)</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Single items (sleep hours)</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Cardiovascular disease</td><td align="left" valign="top">Missing imputation and dimensionality reduction</td><td align="left" valign="top">RF and BART<sup><xref ref-type="table-fn" rid="table1fn21">u</xref></sup></td><td align="left" valign="top">Not reported</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top">Hu et al [<xref ref-type="bibr" rid="ref78">78</xref>]</td><td align="left" valign="top">Single items (frequency)</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Single items (sleep hours)</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Cardiovascular disease</td><td align="left" valign="top">Missing imputation and dimensionality reduction</td><td align="left" valign="top">RF, XGBoost, and BART</td><td align="left" valign="top">5-fold cross-validation (final evaluation)</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top">Huang et al [<xref ref-type="bibr" rid="ref63">63</xref>]</td><td align="left" valign="top">Single items (engagement)</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Single items (sleep quality)</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Cognitive function</td><td align="left" valign="top">Missing imputation and resampling</td><td align="left" valign="top">RF, BoostDT, XGBoost, and LSTM-RNN</td><td align="left" valign="top">Hold-out test set</td><td align="left" valign="top">SHAP values</td></tr><tr><td align="left" valign="top">Jin and Halili [<xref ref-type="bibr" rid="ref67">67</xref>]</td><td align="left" valign="top">Single items (intensity)</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Single items (sleep hours)</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Mental health</td><td align="left" valign="top">Transformation, missing imputation, resampling, and dimensionality reduction</td><td align="left" valign="top">RF, DT, XGBoost, LightGBM, CatBoost<sup><xref ref-type="table-fn" rid="table1fn22">v</xref></sup>, Bagging<sup><xref ref-type="table-fn" rid="table1fn23">w</xref></sup>, HistGBM<sup><xref ref-type="table-fn" rid="table1fn24">x</xref></sup>, SVM, and MLPNN</td><td align="left" valign="top">Hold-out test set</td><td align="left" valign="top">SHAP values</td></tr><tr><td align="left" valign="top">Kim et al [<xref ref-type="bibr" rid="ref91">91</xref>]</td><td align="left" valign="top">Questionnaire (standardized)</td><td align="left" valign="top">Questionnaire (standardized)</td><td align="left" valign="top">Questionnaire (standardized) and Single items (Sleep hours)</td><td align="left" valign="top">Questionnaire (standardized)</td><td align="left" valign="top">Quality of life</td><td align="left" valign="top">Transformation, Resampling</td><td align="left" valign="top">RF, DT, XGBoost, SVM, NB, KNN</td><td align="left" valign="top">6-fold cross-validation (final evaluation)</td><td align="left" valign="top">SHAP values</td></tr><tr><td align="left" valign="top">Kimura et al [<xref ref-type="bibr" rid="ref104">104</xref>]</td><td align="left" valign="top">Sensor (wearable)</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Sensor (wearable)</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Alzheimer disease</td><td align="left" valign="top">Dimensionality reduction</td><td align="left" valign="top">SVM</td><td align="left" valign="top">5-fold cross-validation (final evaluation)</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top">Kiss et al [<xref ref-type="bibr" rid="ref64">64</xref>]</td><td align="left" valign="top">Single items (engagement)</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Questionnaire (standardized) and single items (sleep hours)</td><td align="left" valign="top">Questionnaire (standardized)</td><td align="left" valign="top">Mental health</td><td align="left" valign="top">Transformation, missing imputation, and dimensionality reduction</td><td align="left" valign="top">XGBoost</td><td align="left" valign="top">Nested cross-validation</td><td align="left" valign="top">SHAP values</td></tr><tr><td align="left" valign="top">Li and Song [<xref ref-type="bibr" rid="ref50">50</xref>]</td><td align="left" valign="top">Single items (engagement)</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Cognitive function</td><td align="left" valign="top">Transformation</td><td align="left" valign="top">CNN<sup><xref ref-type="table-fn" rid="table1fn25">y</xref></sup>, Transformer, LSTM-RNN, GRU-Attention<sup><xref ref-type="table-fn" rid="table1fn26">z</xref></sup>, WaveNet, and RNN<sup><xref ref-type="table-fn" rid="table1fn27">aa</xref></sup></td><td align="left" valign="top">10-fold cross-validation (final evaluation)</td><td align="left" valign="top">SHAP values</td></tr><tr><td align="left" valign="top">Lim et al [<xref ref-type="bibr" rid="ref42">42</xref>]</td><td align="left" valign="top">Single items (intensity)</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Osteoarthritis</td><td align="left" valign="top">Transformation, missing imputation, resampling, and dimensionality reduction</td><td align="left" valign="top">FFNN<sup><xref ref-type="table-fn" rid="table1fn28">ab</xref></sup></td><td align="left" valign="top">Hold-out test set</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top">Lim et al [<xref ref-type="bibr" rid="ref10">10</xref>]</td><td align="left" valign="top">Single items (intensity)</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Questionnaire (standardized) and single items (sleep quality)</td><td align="left" valign="top">Single items (Stress level)</td><td align="left" valign="top">Lifestyle (sleep)</td><td align="left" valign="top">Transformation, missing imputation, and dimensionality reduction</td><td align="left" valign="top">RF and DT</td><td align="left" valign="top">Hold-out test set</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top">Lin et al [<xref ref-type="bibr" rid="ref51">51</xref>]</td><td align="left" valign="top">Single items (engagement)</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Loneliness</td><td align="left" valign="top">Transformation, Missing imputation, Dimensionality reduction</td><td align="left" valign="top">RF, DT, SVM, MLP, and KNN</td><td align="left" valign="top">10-fold cross-validation (final evaluation)</td><td align="left" valign="top">SHAP values</td></tr><tr><td align="left" valign="top">Liu et al [<xref ref-type="bibr" rid="ref53">53</xref>]</td><td align="left" valign="top">Questionnaire (standardized)</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Cardiovascular disease</td><td align="left" valign="top">Transformation</td><td align="left" valign="top">RSF<sup><xref ref-type="table-fn" rid="table1fn29">ac</xref></sup></td><td align="left" valign="top">Hold-out test set</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top">Luo et al [<xref ref-type="bibr" rid="ref79">79</xref>]</td><td align="left" valign="top">Single items (frequency)</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Single items (sleep hours)</td><td align="left" valign="top">Single items (stress level)</td><td align="left" valign="top">Social network addiction risk</td><td align="left" valign="top">Transformation and dimensionality reduction</td><td align="left" valign="top">RF</td><td align="left" valign="top">Hold-out test set</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top">Luo et al [<xref ref-type="bibr" rid="ref57">57</xref>]</td><td align="left" valign="top">Single items (intensity)</td><td align="left" valign="top">Questionnaire (standardized)</td><td align="left" valign="top">Single items (sleep hours)</td><td align="left" valign="top">Single items (stress level)</td><td align="left" valign="top">Chronic kidney disease</td><td align="left" valign="top">Missing imputation and dimensionality reduction</td><td align="left" valign="top">GBM</td><td align="left" valign="top">Hold-out test set</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top">Luo et al [<xref ref-type="bibr" rid="ref68">68</xref>]</td><td align="left" valign="top">Single items (intensity)</td><td align="left" valign="top">Single items (habits)</td><td align="left" valign="top">Single items (sleep hours)</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Frailty</td><td align="left" valign="top">Missing imputation</td><td align="left" valign="top">XGBoost</td><td align="left" valign="top">10-fold cross-validation (final evaluation)</td><td align="left" valign="top">SHAP values</td></tr><tr><td align="left" valign="top">Majcherek et al [<xref ref-type="bibr" rid="ref80">80</xref>]</td><td align="left" valign="top">Single items (frequency)</td><td align="left" valign="top">Single items (type of products)</td><td align="left" valign="top">Single items (sleep problems)</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Mental health</td><td align="left" valign="top">Missing imputation</td><td align="left" valign="top">XGBoost</td><td align="left" valign="top">Not reported</td><td align="left" valign="top">SHAP values</td></tr><tr><td align="left" valign="top">Majcherek et al [<xref ref-type="bibr" rid="ref65">65</xref>]</td><td align="left" valign="top">Single items (engagement)</td><td align="left" valign="top">Single items (habits)</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Diabetes</td><td align="left" valign="top">Resampling</td><td align="left" valign="top">RF, DT, AdaBoost, CatBoost, HistGBM, LightGBM, XGBoost, KNN, NB, and Nearest Centroid</td><td align="left" valign="top">Hold-out test set</td><td align="left" valign="top">SHAP values</td></tr><tr><td align="left" valign="top">Matta et al [<xref ref-type="bibr" rid="ref48">48</xref>]</td><td align="left" valign="top">Sensor (wearable)</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Lifestyle (sleep)</td><td align="left" valign="top">Transformation</td><td align="left" valign="top">MLP</td><td align="left" valign="top">Hold-out test set</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top">Moon and Woo [<xref ref-type="bibr" rid="ref89">89</xref>]</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Single items (habits)</td><td align="left" valign="top">Single items (sleep quality)</td><td align="left" valign="top">Single items (stress level)</td><td align="left" valign="top">Mental health</td><td align="left" valign="top">Transformation, missing imputation, resampling, and dimensionality reduction</td><td align="left" valign="top">RF and ANN</td><td align="left" valign="top">Not reported</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top">Morris et al [<xref ref-type="bibr" rid="ref88">88</xref>]</td><td align="left" valign="top">Questionnaire (standardized) and single items (environment)</td><td align="left" valign="top">Questionnaire (standardized) and single items (environment)</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Questionnaire (standardized)</td><td align="left" valign="top">Cardiovascular disease</td><td align="left" valign="top">Missing imputation</td><td align="left" valign="top">RF and ANN</td><td align="left" valign="top">10-fold cross-validation (final evaluation)</td><td align="left" valign="top">SHAP values</td></tr><tr><td align="left" valign="top">Mousavi et al [<xref ref-type="bibr" rid="ref66">66</xref>]</td><td align="left" valign="top">Single items (engagement)</td><td align="left" valign="top">Single items (frequency)</td><td align="left" valign="top">Single items (sleep hours)</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Lifestyle (diet)</td><td align="left" valign="top">Dimensionality reduction</td><td align="left" valign="top">FFNN</td><td align="left" valign="top">Hold-out test set</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top">Mun and Geng [<xref ref-type="bibr" rid="ref81">81</xref>]</td><td align="left" valign="top">Single items (frequency)</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Single items (sleep hours)</td><td align="left" valign="top">Questionnaire (standardized) and sensor (wearable)</td><td align="left" valign="top">Fatigue</td><td align="left" valign="top">Transformation, missing imputation, and dimensionality reduction</td><td align="left" valign="top">RF</td><td align="left" valign="top">10-fold cross-validation (final evaluation)</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top">Nichols et al [<xref ref-type="bibr" rid="ref61">61</xref>]</td><td align="left" valign="top">Questionnaire (standardized)</td><td align="left" valign="top">Questionnaire (standardized)</td><td align="left" valign="top">Questionnaire (standardized)</td><td align="left" valign="top">Questionnaire (standardized)</td><td align="left" valign="top">Lifestyle (stress)</td><td align="left" valign="top">Transformation, missing imputation, resampling, and dimensionality reduction</td><td align="left" valign="top">SVM</td><td align="left" valign="top">Hold-out test set</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top">Oladeji et al [<xref ref-type="bibr" rid="ref99">99</xref>]</td><td align="left" valign="top">Words (Google Trends)</td><td align="left" valign="top">Words (Google Trends)</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Obesity</td><td align="left" valign="top">Dimensionality reduction</td><td align="left" valign="top">RF, GBM, and SVM</td><td align="left" valign="top">Out-of-sample</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top">Park et al [<xref ref-type="bibr" rid="ref49">49</xref>]</td><td align="left" valign="top">Single items (intensity)</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Adverse health event</td><td align="left" valign="top">Dimensionality reduction</td><td align="left" valign="top">XGBoost</td><td align="left" valign="top">Hold-out test set</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top">Park and Edington [<xref ref-type="bibr" rid="ref82">82</xref>]</td><td align="left" valign="top">Single items (frequency)</td><td align="left" valign="top">Single items (type of products)</td><td align="left" valign="top">Single items (sleep hours)</td><td align="left" valign="top">Single items (stress level)</td><td align="left" valign="top">Diabetes</td><td align="left" valign="top">Missing imputation and resampling</td><td align="left" valign="top">MLPNN</td><td align="left" valign="top">Hold-out test set</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top">Park [<xref ref-type="bibr" rid="ref83">83</xref>]</td><td align="left" valign="top">Single items (frequency)</td><td align="left" valign="top">Questionnaire (standardized)</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Visceral fat</td><td align="left" valign="top">Transformation, missing imputation, and dimensionality reduction</td><td align="left" valign="top">RF, XGBoost, and ANN</td><td align="left" valign="top">Hold-out test set</td><td align="left" valign="top">SHAP values</td></tr><tr><td align="left" valign="top">Pereira et al [<xref ref-type="bibr" rid="ref92">92</xref>]</td><td align="left" valign="top">Questionnaire (standardized)</td><td align="left" valign="top">Questionnaire (standardized)</td><td align="left" valign="top">Questionnaire (standardized)</td><td align="left" valign="top">Questionnaire (standardized)</td><td align="left" valign="top">Mental health</td><td align="left" valign="top">Transformation and missing imputation</td><td align="left" valign="top">RF, XGBoost, and SVM</td><td align="left" valign="top">10-fold cross-validation (final evaluation)</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top">Puterman et al [<xref ref-type="bibr" rid="ref69">69</xref>]</td><td align="left" valign="top">Single items (intensity)</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Single items (sleep problems)</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Mortality</td><td align="left" valign="top">Transformation, missing imputation, and dimensionality reduction</td><td align="left" valign="top">RSF</td><td align="left" valign="top">Hold-out test set</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top">Qasrawi et al [<xref ref-type="bibr" rid="ref70">70</xref>]</td><td align="left" valign="top">Single items (intensity)</td><td align="left" valign="top">Single items (habits)</td><td align="left" valign="top">Single items (sleep hours)</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Mental health</td><td align="left" valign="top">Missing imputation and dimensionality reduction</td><td align="left" valign="top">RF, DT, XGBoost, SVM, ANN, KNN</td><td align="left" valign="top">10-fold cross-validation (final evaluation)</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top">Recenti et al [<xref ref-type="bibr" rid="ref43">43</xref>]</td><td align="left" valign="top">Single items (frequency)</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Lifestyle (physical activity)</td><td align="left" valign="top">Missing imputation and resampling</td><td align="left" valign="top">RF, GBM, and AdaBoost</td><td align="left" valign="top">10-fold cross-validation (final evaluation)</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top">Recenti et al [<xref ref-type="bibr" rid="ref44">44</xref>]</td><td align="left" valign="top">Single items (frequency)</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Diabetes</td><td align="left" valign="top">Missing imputation and resampling</td><td align="left" valign="top">RF, GBM, and AdaBoost</td><td align="left" valign="top">10-fold cross-validation (final evaluation)</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top">Ren et al [<xref ref-type="bibr" rid="ref52">52</xref>]</td><td align="left" valign="top">Single items (engagement)</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Cognitive function</td><td align="left" valign="top">Missing imputation, Resampling</td><td align="left" valign="top">RF, XGBoost, SVM</td><td align="left" valign="top">Hold-out test set</td><td align="left" valign="top">SHAP values</td></tr><tr><td align="left" valign="top">Ruiz et al [<xref ref-type="bibr" rid="ref54">54</xref>]</td><td align="left" valign="top">Single items (engagement)</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Depression</td><td align="left" valign="top">Not reported</td><td align="left" valign="top">DT</td><td align="left" valign="top">Not reported</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top">Sandri et al [<xref ref-type="bibr" rid="ref94">94</xref>]</td><td align="left" valign="top">Questionnaire (standardized)</td><td align="left" valign="top">Questionnaire (standardized)</td><td align="left" valign="top">Questionnaire (standardized)</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Lifestyle (diet)</td><td align="left" valign="top">Transformation and resampling</td><td align="left" valign="top">RF, DT, XGBoost, CatBoost, HistGBM, and FFNN</td><td align="left" valign="top">Hold-out test set</td><td align="left" valign="top">SHAP values</td></tr><tr><td align="left" valign="top">Sathyanarayana et al [<xref ref-type="bibr" rid="ref101">101</xref>]</td><td align="left" valign="top">Sensor (wearable)</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Sensor (wearable)</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Lifestyle (sleep)</td><td align="left" valign="top">Missing imputation</td><td align="left" valign="top">MLPNN, CNN, SETRNN<sup><xref ref-type="table-fn" rid="table1fn30">ad</xref></sup>, and LSTM-RNN</td><td align="left" valign="top">Hold-out test set</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top">Shi et al [<xref ref-type="bibr" rid="ref84">84</xref>]</td><td align="left" valign="top">Single items (frequency)</td><td align="left" valign="top">Single items (frequency)</td><td align="left" valign="top">Single items (sleep hours)</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Osteoporosis</td><td align="left" valign="top">Transformation, missing imputation, resampling, and dimensionality reduction</td><td align="left" valign="top">RF, DT, SVM, and KNN</td><td align="left" valign="top">Hold-out test set</td><td align="left" valign="top">SHAP values</td></tr><tr><td align="left" valign="top">Staudenmayer et al [<xref ref-type="bibr" rid="ref45">45</xref>]</td><td align="left" valign="top">Sensor (wearable)</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Lifestyle (physical activity)</td><td align="left" valign="top">Transformation</td><td align="left" valign="top">RF, DT, ANN, and SVM</td><td align="left" valign="top">Leave-one-out cross-validation (LOOCV)</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top">Stemmer et al [<xref ref-type="bibr" rid="ref100">100</xref>]</td><td align="left" valign="top">Words (Twitter)</td><td align="left" valign="top">Words (Twitter)</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Inflammatory bowel disease</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">RF, GBM, AdaBoost, and SVM</td><td align="left" valign="top">Hold-out test set</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top">Su et al [<xref ref-type="bibr" rid="ref56">56</xref>]</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Questionnaire (standardized)</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Resilience</td><td align="left" valign="top">Dimensionality reduction</td><td align="left" valign="top">RF, DT, and XGBoost</td><td align="left" valign="top">Not reported</td><td align="left" valign="top">SHAP values</td></tr><tr><td align="left" valign="top">Wallace et al [<xref ref-type="bibr" rid="ref96">96</xref>]</td><td align="left" valign="top">Questionnaire (standardized)</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Questionnaire (standardized) and single items (sleep hours)</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Mortality</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">RSF</td><td align="left" valign="top">Not reported</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top">Wallace et al [<xref ref-type="bibr" rid="ref55">55</xref>]</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Single items (sleep hours) and sensor (polysomnography)</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Mortality</td><td align="left" valign="top">Missing imputation and dimensionality reduction</td><td align="left" valign="top">RF</td><td align="left" valign="top">External dataset</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top">Wang et al [<xref ref-type="bibr" rid="ref97">97</xref>]</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Questionnaire (standardized)</td><td align="left" valign="top">Questionnaire (standardized)</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Lifestyle (sleep)</td><td align="left" valign="top">Missing imputation, resampling, and dimensionality reduction</td><td align="left" valign="top">GBM, LightGBM, SVM, MLPNN, and KNN</td><td align="left" valign="top">10-fold cross-validation (final evaluation)</td><td align="left" valign="top">SHAP values</td></tr><tr><td align="left" valign="top">Xin and Ren [<xref ref-type="bibr" rid="ref85">85</xref>]</td><td align="left" valign="top">Single items (frequency)</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Single items (Sleep hours)</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Mental health</td><td align="left" valign="top">Dimensionality reduction</td><td align="left" valign="top">RF</td><td align="left" valign="top">Hold-out test set</td><td align="left" valign="top">SHAP values</td></tr><tr><td align="left" valign="top">Zhang et al [<xref ref-type="bibr" rid="ref86">86</xref>]</td><td align="left" valign="top">Single items (frequency)</td><td align="left" valign="top">Single items (habits)</td><td align="left" valign="top">Questionnaire (standardized)</td><td align="left" valign="top">Single items (stress level)</td><td align="left" valign="top">Lifestyle (sleep)</td><td align="left" valign="top">Resampling</td><td align="left" valign="top">RF, DT, XGBoost, SVM, ANN, and KNN</td><td align="left" valign="top">External dataset</td><td align="left" valign="top">SHAP values</td></tr><tr><td align="left" valign="top">Zhou et al [<xref ref-type="bibr" rid="ref46">46</xref>]</td><td align="left" valign="top">Sensor (wearable)</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Lifestyle (physical activity)</td><td align="left" valign="top">Transformation</td><td align="left" valign="top">SVM</td><td align="left" valign="top">Out-of-sample</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top">Zhou et al [<xref ref-type="bibr" rid="ref98">98</xref>]</td><td align="left" valign="top">Sensor (phone)</td><td align="left" valign="top">Sensor (phone)</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Obesity</td><td align="left" valign="top">Missing imputation and dimensionality reduction</td><td align="left" valign="top">RF, GRF<sup><xref ref-type="table-fn" rid="table1fn31">ae</xref></sup>, and ANN</td><td align="left" valign="top">10-fold cross-validation (final evaluation)</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top">Zhou et al [<xref ref-type="bibr" rid="ref71">71</xref>]</td><td align="left" valign="top">Single items (intensity)</td><td align="left" valign="top">Single items (habits)</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">Psoriasis</td><td align="left" valign="top">Resampling</td><td align="left" valign="top">XGBoost</td><td align="left" valign="top">Hold-out test set</td><td align="left" valign="top">SHAP values</td></tr></tbody></table><table-wrap-foot><fn id="table1fn1"><p><sup>a</sup>ML: machine learning.</p></fn><fn id="table1fn2"><p><sup>b</sup>XAI: explainable artificial intelligence.</p></fn><fn id="table1fn3"><p><sup>c</sup>RF: random forest.</p></fn><fn id="table1fn4"><p><sup>d</sup>ANN: artificial neural network.</p></fn><fn id="table1fn5"><p><sup>e</sup>NB: naive Bayes.</p></fn><fn id="table1fn6"><p><sup>f</sup>KNN: k-nearest neighbor.</p></fn><fn id="table1fn7"><p><sup>g</sup>DT: decision tree.</p></fn><fn id="table1fn8"><p><sup>h</sup>MLPNN: multilayer perceptron neural network.</p></fn><fn id="table1fn9"><p><sup>i</sup>RBFNN: radial basis function neural network.</p></fn><fn id="table1fn10"><p><sup>j</sup>FNN: fuzzy neural network.</p></fn><fn id="table1fn11"><p><sup>k</sup>PNN: probabilistic neural network.</p></fn><fn id="table1fn12"><p><sup>l</sup>SVM: support vector machine.</p></fn><fn id="table1fn13"><p><sup>m</sup>LIME: local interpretable model-agnostic explanations.</p></fn><fn id="table1fn14"><p><sup>n</sup>GBM: gradient boosting.</p></fn><fn id="table1fn15"><p><sup>o</sup>LST-RNN: long short-term memory recurrent neural network.</p></fn><fn id="table1fn16"><p><sup>p</sup>XGBoost: extreme gradient boosting.</p></fn><fn id="table1fn17"><p><sup>q</sup>BoostDT: boost decision tree.</p></fn><fn id="table1fn18"><p><sup>r</sup>LightGBM: light gradient boosting machine.</p></fn><fn id="table1fn19"><p><sup>s</sup>AdaBoost: adaptive boosting.</p></fn><fn id="table1fn20"><p><sup>t</sup>SHAP: Shapley Additive Explanations.</p></fn><fn id="table1fn21"><p><sup>u</sup>BART: Bayesian additive regression trees.</p></fn><fn id="table1fn22"><p><sup>v</sup>CatBoost:<bold> </bold>categorical boosting.</p></fn><fn id="table1fn23"><p><sup>w</sup>Bagging: bootstrap aggregating.</p></fn><fn id="table1fn24"><p><sup>x</sup>HistGBM: histogram-based gradient boosting machine. </p></fn><fn id="table1fn25"><p><sup>y</sup>CNN: convolutional neural network.</p></fn><fn id="table1fn26"><p><sup>z</sup>GRU-Attention: gated recurrent unit with attention.</p></fn><fn id="table1fn27"><p><sup>aa</sup>RNN: recurrent neural network.</p></fn><fn id="table1fn28"><p><sup>ab</sup>FFNN: feed-forward neural network.</p></fn><fn id="table1fn29"><p><sup>ac</sup>RSF: random survival forest.</p></fn><fn id="table1fn30"><p><sup>ad</sup>SETRNN: simple Elman-type recurrent neural network.</p></fn><fn id="table1fn31"><p><sup>ae</sup>GRF: generalized random forest.</p></fn></table-wrap-foot></table-wrap><fig position="float" id="figure4"><label>Figure 4.</label><caption><p>Stacked bar chart summarizing the data acquisition methodology for each lifestyle component.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="humanfactors_v13i1e78648_fig04.png"/></fig></sec><sec id="s3-3"><title>Preprocessing</title><p>The preprocessing phase was divided into variable transformation, missing imputation, resampling, and dimensionality reduction. At least one of these preprocessing phases was reported by 59 (90.76%) studies (refer to <xref ref-type="table" rid="table1">Table 1</xref> and Table S4 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref> for more details).</p><p>There were 26 (40%) studies that reported normalization or other arithmetic or statistical transformations of variables before the modeling phase [<xref ref-type="bibr" rid="ref40">40</xref>,<xref ref-type="bibr" rid="ref41">41</xref>,<xref ref-type="bibr" rid="ref45">45</xref>,<xref ref-type="bibr" rid="ref48">48</xref>,<xref ref-type="bibr" rid="ref50">50</xref>,<xref ref-type="bibr" rid="ref51">51</xref>,<xref ref-type="bibr" rid="ref53">53</xref>,<xref ref-type="bibr" rid="ref58">58</xref>,<xref ref-type="bibr" rid="ref59">59</xref>,<xref ref-type="bibr" rid="ref62">62</xref>,<xref ref-type="bibr" rid="ref64">64</xref>,<xref ref-type="bibr" rid="ref67">67</xref>,<xref ref-type="bibr" rid="ref69">69</xref>,<xref ref-type="bibr" rid="ref73">73</xref>-<xref ref-type="bibr" rid="ref75">75</xref>,<xref ref-type="bibr" rid="ref79">79</xref>,<xref ref-type="bibr" rid="ref81">81</xref>,<xref ref-type="bibr" rid="ref83">83</xref>,<xref ref-type="bibr" rid="ref84">84</xref>,<xref ref-type="bibr" rid="ref89">89</xref>,<xref ref-type="bibr" rid="ref91">91</xref>-<xref ref-type="bibr" rid="ref94">94</xref>,<xref ref-type="bibr" rid="ref102">102</xref>]. Six (9.23%) studies recoded categorical variables into quantitative variables, 5 used one-hot encoding [<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref53">53</xref>,<xref ref-type="bibr" rid="ref64">64</xref>,<xref ref-type="bibr" rid="ref67">67</xref>,<xref ref-type="bibr" rid="ref102">102</xref>], and 1 used principal component analysis with quantile transformer scaler [<xref ref-type="bibr" rid="ref42">42</xref>].</p><p>Missing data imputation was reported in 37 (56.92%) studies. Twelve papers simply removed cases with missing data [<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref42">42</xref>-<xref ref-type="bibr" rid="ref44">44</xref>,<xref ref-type="bibr" rid="ref61">61</xref>,<xref ref-type="bibr" rid="ref64">64</xref>,<xref ref-type="bibr" rid="ref77">77</xref>,<xref ref-type="bibr" rid="ref78">78</xref>,<xref ref-type="bibr" rid="ref80">80</xref>,<xref ref-type="bibr" rid="ref93">93</xref>,<xref ref-type="bibr" rid="ref98">98</xref>,<xref ref-type="bibr" rid="ref101">101</xref>], while others applied cutoff percentages for missing values (eg, 10% [<xref ref-type="bibr" rid="ref87">87</xref>], 30 % [<xref ref-type="bibr" rid="ref73">73</xref>], or &#x003E;50% [<xref ref-type="bibr" rid="ref58">58</xref>,<xref ref-type="bibr" rid="ref72">72</xref>]), and 1 study removed observations with missing values in the output [<xref ref-type="bibr" rid="ref102">102</xref>]. Techniques included single imputation (mean, median, or mode) [<xref ref-type="bibr" rid="ref51">51</xref>,<xref ref-type="bibr" rid="ref52">52</xref>,<xref ref-type="bibr" rid="ref58">58</xref>,<xref ref-type="bibr" rid="ref59">59</xref>,<xref ref-type="bibr" rid="ref70">70</xref>,<xref ref-type="bibr" rid="ref83">83</xref>,<xref ref-type="bibr" rid="ref88">88</xref>,<xref ref-type="bibr" rid="ref92">92</xref>], multiple imputation by chained equations [<xref ref-type="bibr" rid="ref57">57</xref>,<xref ref-type="bibr" rid="ref63">63</xref>,<xref ref-type="bibr" rid="ref72">72</xref>,<xref ref-type="bibr" rid="ref73">73</xref>], k-nearest neighbor [<xref ref-type="bibr" rid="ref89">89</xref>,<xref ref-type="bibr" rid="ref102">102</xref>], regression-based algorithm [<xref ref-type="bibr" rid="ref57">57</xref>,<xref ref-type="bibr" rid="ref81">81</xref>], random forest (RF)&#x2013;based multiple imputation [<xref ref-type="bibr" rid="ref55">55</xref>,<xref ref-type="bibr" rid="ref69">69</xref>,<xref ref-type="bibr" rid="ref84">84</xref>], the MissForest algorithm [<xref ref-type="bibr" rid="ref67">67</xref>,<xref ref-type="bibr" rid="ref68">68</xref>], imputation based on peers with similar health profile group [<xref ref-type="bibr" rid="ref82">82</xref>], imputation using training data [<xref ref-type="bibr" rid="ref104">104</xref>], and replacement of missing values with the last available data [<xref ref-type="bibr" rid="ref75">75</xref>].</p><p>Resampling techniques were reported in 21 (32.30%) papers. Eighteen studies balanced the datasets using methods such as using the minority class as a reference, undersampling the majority class [<xref ref-type="bibr" rid="ref42">42</xref>,<xref ref-type="bibr" rid="ref61">61</xref>], or the synthetic minority oversampling technique (SMOTE) [<xref ref-type="bibr" rid="ref43">43</xref>,<xref ref-type="bibr" rid="ref44">44</xref>,<xref ref-type="bibr" rid="ref52">52</xref>,<xref ref-type="bibr" rid="ref60">60</xref>,<xref ref-type="bibr" rid="ref63">63</xref>,<xref ref-type="bibr" rid="ref67">67</xref>,<xref ref-type="bibr" rid="ref71">71</xref>,<xref ref-type="bibr" rid="ref72">72</xref>,<xref ref-type="bibr" rid="ref84">84</xref>,<xref ref-type="bibr" rid="ref86">86</xref>,<xref ref-type="bibr" rid="ref89">89</xref>,<xref ref-type="bibr" rid="ref91">91</xref>,<xref ref-type="bibr" rid="ref94">94</xref>,<xref ref-type="bibr" rid="ref95">95</xref>,<xref ref-type="bibr" rid="ref97">97</xref>]. One paper compared the results of SMOTE against the adaptive synthetic algorithm [<xref ref-type="bibr" rid="ref65">65</xref>]. Finally, 1 study stabilized variations in underrepresented outcome classes using bootstrap resampling [<xref ref-type="bibr" rid="ref82">82</xref>]. Regarding cancer studies where cases were fewer than controls, 2 different strategies were applied to the same dataset: sample-size equalization by randomly grouping cancer-free participants based on the number of cancer survivors [<xref ref-type="bibr" rid="ref74">74</xref>], while another study matched cases and controls by sex, age, and education level, then selected a random sample resulting in 50% cases and 50% controls [<xref ref-type="bibr" rid="ref73">73</xref>].</p><p>Dimensionality reduction was used in 38 (58.46%) studies using 3 approaches. The first approach involved assessing the relationship between features and outcomes by removing redundant information [<xref ref-type="bibr" rid="ref55">55</xref>,<xref ref-type="bibr" rid="ref61">61</xref>,<xref ref-type="bibr" rid="ref64">64</xref>,<xref ref-type="bibr" rid="ref70">70</xref>,<xref ref-type="bibr" rid="ref83">83</xref>,<xref ref-type="bibr" rid="ref85">85</xref>,<xref ref-type="bibr" rid="ref87">87</xref>,<xref ref-type="bibr" rid="ref93">93</xref>,<xref ref-type="bibr" rid="ref98">98</xref>,<xref ref-type="bibr" rid="ref99">99</xref>]. Other methods included factor analysis [<xref ref-type="bibr" rid="ref10">10</xref>] and principal component analysis [<xref ref-type="bibr" rid="ref42">42</xref>,<xref ref-type="bibr" rid="ref59">59</xref>,<xref ref-type="bibr" rid="ref69">69</xref>]. The second approach optimized models to achieve lower prediction error [<xref ref-type="bibr" rid="ref58">58</xref>,<xref ref-type="bibr" rid="ref66">66</xref>,<xref ref-type="bibr" rid="ref104">104</xref>]. The third approach involved automatic selection of predictors during model training [<xref ref-type="bibr" rid="ref41">41</xref>,<xref ref-type="bibr" rid="ref49">49</xref>,<xref ref-type="bibr" rid="ref57">57</xref>,<xref ref-type="bibr" rid="ref62">62</xref>,<xref ref-type="bibr" rid="ref72">72</xref>-<xref ref-type="bibr" rid="ref74">74</xref>,<xref ref-type="bibr" rid="ref77">77</xref>,<xref ref-type="bibr" rid="ref78">78</xref>,<xref ref-type="bibr" rid="ref81">81</xref>,<xref ref-type="bibr" rid="ref90">90</xref>,<xref ref-type="bibr" rid="ref95">95</xref>,<xref ref-type="bibr" rid="ref102">102</xref>]. For more information, refer to Table S4 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>.</p></sec><sec id="s3-4"><title>SL Models</title><sec id="s3-4-1"><title>Models Overview</title><p>In this section, the core components of ML models are described, beginning with problem formulation and algorithm families, followed by evaluation components. Depending on the purpose of the ML analysis, papers were grouped as classification or regression when the objective was prediction, and as feature selection when the goal was explanation [<xref ref-type="bibr" rid="ref19">19</xref>]. Most studies (46/65, 70.77%) focused on classification, 9 (13.83%) on regression, 2 (3.1%) on both classification and regression, and 8 (12.30%) on feature selection.</p><p>Six families of algorithms emerged from the studies: tree-based, deep learning, support vector machines, k-nearest neighbors, na&#x00EF;ve Bayes, and nearest centroid. The approach adopted across 40 studies was a multimodel approach, with 29 of them incorporating algorithms from diverse algorithmic families. <xref ref-type="fig" rid="figure5">Figure 5</xref> provides a comprehensive taxonomy of the specific algorithms implemented. The following subsections describe the application of specific algorithms within the 3 most used families (tree-based, deep learning, and support vector machines) in relation to the type of data used.</p><fig position="float" id="figure5"><label>Figure 5.</label><caption><p>Machine learning families and algorithms taxonomy. BART: Bayesian additive regression trees; CNN: convolutional neural network; DT: decision tree; FFNN: feed-forward neural network; FNN: fuzzy neural network; GB: gradient boosting; GRU-attention: gated recurrent unit with attention; KNN: k-nearest neighbor; LSTM-RNN: long short-term memory recurrent neural network; MLPNN: multilayer perceptron neural network; NB: naive Bayes; NS: not specified; PNN: probabilistic neural network; RBFNN: radial basis function neural network; RF: random forest; SETRNN: simple Elman-type recurrent neural network; SVM Ln: support vector machine with linear kernel; SVM RBF: support vector machine with a radial basis function.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="humanfactors_v13i1e78648_fig05.png"/></fig></sec><sec id="s3-4-2"><title>Tree-Based Algorithms</title><p>Tree-based algorithms were applied in 55 (84.61%) studies, covering all data types. RF was used in 45 (69.23%) out of 55 studies. Specifically, RF was implemented in 27 cross-sectional studies [<xref ref-type="bibr" rid="ref40">40</xref>,<xref ref-type="bibr" rid="ref43">43</xref>,<xref ref-type="bibr" rid="ref44">44</xref>,<xref ref-type="bibr" rid="ref47">47</xref>,<xref ref-type="bibr" rid="ref51">51</xref>-<xref ref-type="bibr" rid="ref53">53</xref>,<xref ref-type="bibr" rid="ref56">56</xref>,<xref ref-type="bibr" rid="ref60">60</xref>,<xref ref-type="bibr" rid="ref65">65</xref>,<xref ref-type="bibr" rid="ref70">70</xref>,<xref ref-type="bibr" rid="ref72">72</xref>-<xref ref-type="bibr" rid="ref74">74</xref>,<xref ref-type="bibr" rid="ref77">77</xref>-<xref ref-type="bibr" rid="ref79">79</xref>,<xref ref-type="bibr" rid="ref84">84</xref>-<xref ref-type="bibr" rid="ref87">87</xref>,<xref ref-type="bibr" rid="ref89">89</xref>,<xref ref-type="bibr" rid="ref91">91</xref>-<xref ref-type="bibr" rid="ref95">95</xref>], 11 longitudinal studies [<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref41">41</xref>,<xref ref-type="bibr" rid="ref55">55</xref>,<xref ref-type="bibr" rid="ref59">59</xref>,<xref ref-type="bibr" rid="ref63">63</xref>,<xref ref-type="bibr" rid="ref67">67</xref>,<xref ref-type="bibr" rid="ref69">69</xref>,<xref ref-type="bibr" rid="ref81">81</xref>,<xref ref-type="bibr" rid="ref83">83</xref>,<xref ref-type="bibr" rid="ref88">88</xref>,<xref ref-type="bibr" rid="ref96">96</xref>], 3 time-series studies [<xref ref-type="bibr" rid="ref45">45</xref>,<xref ref-type="bibr" rid="ref76">76</xref>,<xref ref-type="bibr" rid="ref102">102</xref>], 2 textual studies [<xref ref-type="bibr" rid="ref99">99</xref>,<xref ref-type="bibr" rid="ref100">100</xref>], 1 study with both cross-sectional and geographical data [<xref ref-type="bibr" rid="ref98">98</xref>], and 1 study with both longitudinal and time-series data [<xref ref-type="bibr" rid="ref90">90</xref>].</p><p>Different versions of the gradient boosting algorithm were performed in 28 studies, including gradient boosting machines, extreme gradient boosting, adaptive boosting, and light gradient boosting machine [<xref ref-type="bibr" rid="ref41">41</xref>,<xref ref-type="bibr" rid="ref43">43</xref>,<xref ref-type="bibr" rid="ref44">44</xref>,<xref ref-type="bibr" rid="ref47">47</xref>,<xref ref-type="bibr" rid="ref49">49</xref>,<xref ref-type="bibr" rid="ref52">52</xref>,<xref ref-type="bibr" rid="ref56">56</xref>,<xref ref-type="bibr" rid="ref57">57</xref>,<xref ref-type="bibr" rid="ref60">60</xref>,<xref ref-type="bibr" rid="ref63">63</xref>-<xref ref-type="bibr" rid="ref65">65</xref>,<xref ref-type="bibr" rid="ref67">67</xref>,<xref ref-type="bibr" rid="ref68">68</xref>,<xref ref-type="bibr" rid="ref70">70</xref>,<xref ref-type="bibr" rid="ref71">71</xref>,<xref ref-type="bibr" rid="ref74">74</xref>,<xref ref-type="bibr" rid="ref78">78</xref>,<xref ref-type="bibr" rid="ref80">80</xref>,<xref ref-type="bibr" rid="ref83">83</xref>,<xref ref-type="bibr" rid="ref86">86</xref>,<xref ref-type="bibr" rid="ref91">91</xref>,<xref ref-type="bibr" rid="ref92">92</xref>,<xref ref-type="bibr" rid="ref94">94</xref>,<xref ref-type="bibr" rid="ref97">97</xref>,<xref ref-type="bibr" rid="ref99">99</xref>,<xref ref-type="bibr" rid="ref100">100</xref>,<xref ref-type="bibr" rid="ref102">102</xref>]. Finally, decision tree algorithms were implemented in 19 studies [<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref45">45</xref>,<xref ref-type="bibr" rid="ref47">47</xref>,<xref ref-type="bibr" rid="ref51">51</xref>,<xref ref-type="bibr" rid="ref54">54</xref>,<xref ref-type="bibr" rid="ref56">56</xref>,<xref ref-type="bibr" rid="ref58">58</xref>-<xref ref-type="bibr" rid="ref60">60</xref>,<xref ref-type="bibr" rid="ref62">62</xref>,<xref ref-type="bibr" rid="ref65">65</xref>,<xref ref-type="bibr" rid="ref67">67</xref>,<xref ref-type="bibr" rid="ref70">70</xref>,<xref ref-type="bibr" rid="ref84">84</xref>,<xref ref-type="bibr" rid="ref86">86</xref>,<xref ref-type="bibr" rid="ref87">87</xref>,<xref ref-type="bibr" rid="ref90">90</xref>,<xref ref-type="bibr" rid="ref91">91</xref>,<xref ref-type="bibr" rid="ref94">94</xref>], and Bayesian additive regression trees in 2 studies [<xref ref-type="bibr" rid="ref77">77</xref>,<xref ref-type="bibr" rid="ref78">78</xref>] (<xref ref-type="table" rid="table1">Table 1</xref>; <xref ref-type="fig" rid="figure5">Figure 5</xref>).</p></sec><sec id="s3-4-3"><title>Deep Learning Algorithms</title><p>Neural networks (NNs) are considered the cornerstone of deep learning algorithms. Various NN architectures were applied in 24 (36.92%) of the reviewed studies. A multilayer perceptron neural network was used in cross-sectional [<xref ref-type="bibr" rid="ref51">51</xref>,<xref ref-type="bibr" rid="ref58">58</xref>,<xref ref-type="bibr" rid="ref97">97</xref>], longitudinal [<xref ref-type="bibr" rid="ref67">67</xref>,<xref ref-type="bibr" rid="ref82">82</xref>], and time-series data [<xref ref-type="bibr" rid="ref48">48</xref>,<xref ref-type="bibr" rid="ref101">101</xref>,<xref ref-type="bibr" rid="ref102">102</xref>]. Long short-term memory recurrent neural network was applied to longitudinal [<xref ref-type="bibr" rid="ref50">50</xref>,<xref ref-type="bibr" rid="ref63">63</xref>] and time-series data [<xref ref-type="bibr" rid="ref75">75</xref>,<xref ref-type="bibr" rid="ref101">101</xref>,<xref ref-type="bibr" rid="ref102">102</xref>]. Feed-forward neural networks were used for cross-sectional data [<xref ref-type="bibr" rid="ref42">42</xref>,<xref ref-type="bibr" rid="ref66">66</xref>,<xref ref-type="bibr" rid="ref94">94</xref>]. Convolutional neural networks were used to analyze time-series [<xref ref-type="bibr" rid="ref101">101</xref>] and cross-sectional data [<xref ref-type="bibr" rid="ref50">50</xref>]. Simple Elman-type recurrent neural networks were applied in a time-series study [<xref ref-type="bibr" rid="ref101">101</xref>]. Radial basis function neural networks, fuzzy neural networks (FNNs), and probabilistic neural networks were used in a cross-sectional study [<xref ref-type="bibr" rid="ref58">58</xref>]. In addition, Transformer, gated recurrent unit with attention, WaveNet, and RNNs were used to analyze longitudinal data [<xref ref-type="bibr" rid="ref50">50</xref>]. In contrast, 11 studies did not specify the artificial neural network architecture used [<xref ref-type="bibr" rid="ref41">41</xref>,<xref ref-type="bibr" rid="ref45">45</xref>,<xref ref-type="bibr" rid="ref47">47</xref>,<xref ref-type="bibr" rid="ref70">70</xref>,<xref ref-type="bibr" rid="ref72">72</xref>,<xref ref-type="bibr" rid="ref75">75</xref>,<xref ref-type="bibr" rid="ref83">83</xref>,<xref ref-type="bibr" rid="ref86">86</xref>,<xref ref-type="bibr" rid="ref88">88</xref>,<xref ref-type="bibr" rid="ref89">89</xref>,<xref ref-type="bibr" rid="ref98">98</xref>] (<xref ref-type="table" rid="table1">Table 1</xref>; <xref ref-type="fig" rid="figure5">Figure 5</xref>).</p></sec><sec id="s3-4-4"><title>Support Vector Machine Algorithms</title><p>Support vector machine (SVM) algorithms were used in 19 (27.08%) studies, applied across various data types. SVM was implemented in 11 cross-sectional studies, 2 longitudinal studies, 3 time-series studies, and 2 studies that analyzed textual data. Configurations included support vector machine with a radial basis function [<xref ref-type="bibr" rid="ref61">61</xref>,<xref ref-type="bibr" rid="ref70">70</xref>,<xref ref-type="bibr" rid="ref102">102</xref>,<xref ref-type="bibr" rid="ref104">104</xref>] or a support vector machine with linear kernel [<xref ref-type="bibr" rid="ref51">51</xref>,<xref ref-type="bibr" rid="ref73">73</xref>,<xref ref-type="bibr" rid="ref93">93</xref>,<xref ref-type="bibr" rid="ref100">100</xref>]. Eleven studies did not report the type of kernel used [<xref ref-type="bibr" rid="ref45">45</xref>,<xref ref-type="bibr" rid="ref46">46</xref>,<xref ref-type="bibr" rid="ref52">52</xref>,<xref ref-type="bibr" rid="ref67">67</xref>,<xref ref-type="bibr" rid="ref74">74</xref>,<xref ref-type="bibr" rid="ref84">84</xref>,<xref ref-type="bibr" rid="ref86">86</xref>,<xref ref-type="bibr" rid="ref91">91</xref>,<xref ref-type="bibr" rid="ref92">92</xref>,<xref ref-type="bibr" rid="ref97">97</xref>,<xref ref-type="bibr" rid="ref99">99</xref>] (<xref ref-type="table" rid="table1">Table 1</xref>; <xref ref-type="fig" rid="figure5">Figure 5</xref>).</p></sec></sec><sec id="s3-5"><title>Evaluation</title><p>Final model evaluation procedures were explicitly reported in 57 (87.69%) reviewed studies, with the hold-out test set being the most applied strategy. These included a hold-out test set [<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref42">42</xref>,<xref ref-type="bibr" rid="ref48">48</xref>,<xref ref-type="bibr" rid="ref49">49</xref>,<xref ref-type="bibr" rid="ref52">52</xref>,<xref ref-type="bibr" rid="ref53">53</xref>,<xref ref-type="bibr" rid="ref57">57</xref>,<xref ref-type="bibr" rid="ref60">60</xref>,<xref ref-type="bibr" rid="ref61">61</xref>,<xref ref-type="bibr" rid="ref63">63</xref>,<xref ref-type="bibr" rid="ref65">65</xref>-<xref ref-type="bibr" rid="ref67">67</xref>,<xref ref-type="bibr" rid="ref69">69</xref>,<xref ref-type="bibr" rid="ref71">71</xref>-<xref ref-type="bibr" rid="ref73">73</xref>,<xref ref-type="bibr" rid="ref75">75</xref>,<xref ref-type="bibr" rid="ref79">79</xref>,<xref ref-type="bibr" rid="ref82">82</xref>-<xref ref-type="bibr" rid="ref85">85</xref>,<xref ref-type="bibr" rid="ref94">94</xref>,<xref ref-type="bibr" rid="ref95">95</xref>,<xref ref-type="bibr" rid="ref100">100</xref>,<xref ref-type="bibr" rid="ref101">101</xref>], k-fold cross-validation (final evaluation) [<xref ref-type="bibr" rid="ref40">40</xref>,<xref ref-type="bibr" rid="ref41">41</xref>,<xref ref-type="bibr" rid="ref43">43</xref>,<xref ref-type="bibr" rid="ref44">44</xref>,<xref ref-type="bibr" rid="ref47">47</xref>,<xref ref-type="bibr" rid="ref50">50</xref>,<xref ref-type="bibr" rid="ref51">51</xref>,<xref ref-type="bibr" rid="ref58">58</xref>,<xref ref-type="bibr" rid="ref68">68</xref>,<xref ref-type="bibr" rid="ref70">70</xref>,<xref ref-type="bibr" rid="ref74">74</xref>,<xref ref-type="bibr" rid="ref78">78</xref>,<xref ref-type="bibr" rid="ref81">81</xref>,<xref ref-type="bibr" rid="ref87">87</xref>,<xref ref-type="bibr" rid="ref88">88</xref>,<xref ref-type="bibr" rid="ref91">91</xref>,<xref ref-type="bibr" rid="ref92">92</xref>,<xref ref-type="bibr" rid="ref97">97</xref>,<xref ref-type="bibr" rid="ref98">98</xref>,<xref ref-type="bibr" rid="ref104">104</xref>], nested cross-validation [<xref ref-type="bibr" rid="ref64">64</xref>,<xref ref-type="bibr" rid="ref93">93</xref>], leave-one-out cross-validation (for small datasets with n&#x003C;150) [<xref ref-type="bibr" rid="ref45">45</xref>,<xref ref-type="bibr" rid="ref59">59</xref>,<xref ref-type="bibr" rid="ref76">76</xref>]. Two studies used external datasets for model performance assessment [<xref ref-type="bibr" rid="ref55">55</xref>,<xref ref-type="bibr" rid="ref86">86</xref>]. For time-series data, 2 studies divided the dataset based on the time of acquisition, keeping an out-of-sample dataset for model evaluation [<xref ref-type="bibr" rid="ref46">46</xref>,<xref ref-type="bibr" rid="ref99">99</xref>], while 1 study [<xref ref-type="bibr" rid="ref102">102</xref>] used 5-fold cross-validation in an offline setting followed by an online weighted resampling methodology to address drift.</p><p>Among the 11 studies that addressed regression problems, the reported evaluation metrics included mean absolute error [<xref ref-type="bibr" rid="ref44">44</xref>,<xref ref-type="bibr" rid="ref75">75</xref>,<xref ref-type="bibr" rid="ref87">87</xref>,<xref ref-type="bibr" rid="ref102">102</xref>], mean squared error [<xref ref-type="bibr" rid="ref44">44</xref>,<xref ref-type="bibr" rid="ref68">68</xref>,<xref ref-type="bibr" rid="ref75">75</xref>], root-mean-square error [<xref ref-type="bibr" rid="ref44">44</xref>,<xref ref-type="bibr" rid="ref45">45</xref>,<xref ref-type="bibr" rid="ref68">68</xref>,<xref ref-type="bibr" rid="ref78">78</xref>,<xref ref-type="bibr" rid="ref98">98</xref>,<xref ref-type="bibr" rid="ref99">99</xref>,<xref ref-type="bibr" rid="ref102">102</xref>], mean absolute percentage error [<xref ref-type="bibr" rid="ref102">102</xref>], and coefficient of determination (R<sup>2</sup>) [<xref ref-type="bibr" rid="ref44">44</xref>,<xref ref-type="bibr" rid="ref68">68</xref>,<xref ref-type="bibr" rid="ref79">79</xref>,<xref ref-type="bibr" rid="ref81">81</xref>,<xref ref-type="bibr" rid="ref98">98</xref>,<xref ref-type="bibr" rid="ref99">99</xref>].</p><p>For classification problems, reported evaluation metrics included specificity and sensitivity (recall) [<xref ref-type="bibr" rid="ref41">41</xref>-<xref ref-type="bibr" rid="ref44">44</xref>,<xref ref-type="bibr" rid="ref47">47</xref>,<xref ref-type="bibr" rid="ref48">48</xref>,<xref ref-type="bibr" rid="ref58">58</xref>,<xref ref-type="bibr" rid="ref63">63</xref>,<xref ref-type="bibr" rid="ref66">66</xref>,<xref ref-type="bibr" rid="ref72">72</xref>,<xref ref-type="bibr" rid="ref76">76</xref>,<xref ref-type="bibr" rid="ref82">82</xref>,<xref ref-type="bibr" rid="ref85">85</xref>,<xref ref-type="bibr" rid="ref86">86</xref>,<xref ref-type="bibr" rid="ref91">91</xref>,<xref ref-type="bibr" rid="ref93">93</xref>,<xref ref-type="bibr" rid="ref95">95</xref>,<xref ref-type="bibr" rid="ref104">104</xref>], precision and recall [<xref ref-type="bibr" rid="ref40">40</xref>-<xref ref-type="bibr" rid="ref43">43</xref>,<xref ref-type="bibr" rid="ref48">48</xref>,<xref ref-type="bibr" rid="ref61">61</xref>,<xref ref-type="bibr" rid="ref70">70</xref>,<xref ref-type="bibr" rid="ref80">80</xref>,<xref ref-type="bibr" rid="ref86">86</xref>,<xref ref-type="bibr" rid="ref100">100</xref>,<xref ref-type="bibr" rid="ref101">101</xref>], the confusion matrix [<xref ref-type="bibr" rid="ref42">42</xref>,<xref ref-type="bibr" rid="ref48">48</xref>,<xref ref-type="bibr" rid="ref80">80</xref>], error rate as the proportion of misclassified observations (1 &#x2013; accuracy) [<xref ref-type="bibr" rid="ref48">48</xref>,<xref ref-type="bibr" rid="ref58">58</xref>,<xref ref-type="bibr" rid="ref72">72</xref>,<xref ref-type="bibr" rid="ref90">90</xref>], Cohen &#x03BA; [<xref ref-type="bibr" rid="ref58">58</xref>,<xref ref-type="bibr" rid="ref72">72</xref>], <italic>F</italic><sub>1</sub>-score [<xref ref-type="bibr" rid="ref41">41</xref>,<xref ref-type="bibr" rid="ref43">43</xref>,<xref ref-type="bibr" rid="ref49">49</xref>,<xref ref-type="bibr" rid="ref59">59</xref>,<xref ref-type="bibr" rid="ref70">70</xref>,<xref ref-type="bibr" rid="ref80">80</xref>,<xref ref-type="bibr" rid="ref86">86</xref>,<xref ref-type="bibr" rid="ref91">91</xref>,<xref ref-type="bibr" rid="ref100">100</xref>,<xref ref-type="bibr" rid="ref101">101</xref>,<xref ref-type="bibr" rid="ref104">104</xref>], and model training time [<xref ref-type="bibr" rid="ref58">58</xref>]. The most frequently used metrics were accuracy [<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref41">41</xref>-<xref ref-type="bibr" rid="ref45">45</xref>,<xref ref-type="bibr" rid="ref47">47</xref>-<xref ref-type="bibr" rid="ref49">49</xref>,<xref ref-type="bibr" rid="ref58">58</xref>,<xref ref-type="bibr" rid="ref59">59</xref>,<xref ref-type="bibr" rid="ref61">61</xref>,<xref ref-type="bibr" rid="ref63">63</xref>,<xref ref-type="bibr" rid="ref66">66</xref>,<xref ref-type="bibr" rid="ref70">70</xref>,<xref ref-type="bibr" rid="ref72">72</xref>,<xref ref-type="bibr" rid="ref80">80</xref>,<xref ref-type="bibr" rid="ref82">82</xref>,<xref ref-type="bibr" rid="ref83">83</xref>,<xref ref-type="bibr" rid="ref85">85</xref>,<xref ref-type="bibr" rid="ref86">86</xref>,<xref ref-type="bibr" rid="ref88">88</xref>,<xref ref-type="bibr" rid="ref91">91</xref>,<xref ref-type="bibr" rid="ref93">93</xref>,<xref ref-type="bibr" rid="ref101">101</xref>] and area under the receiver operating characteristic curve [<xref ref-type="bibr" rid="ref41">41</xref>-<xref ref-type="bibr" rid="ref43">43</xref>,<xref ref-type="bibr" rid="ref46">46</xref>-<xref ref-type="bibr" rid="ref49">49</xref>,<xref ref-type="bibr" rid="ref58">58</xref>,<xref ref-type="bibr" rid="ref59">59</xref>,<xref ref-type="bibr" rid="ref63">63</xref>,<xref ref-type="bibr" rid="ref70">70</xref>,<xref ref-type="bibr" rid="ref72">72</xref>-<xref ref-type="bibr" rid="ref74">74</xref>,<xref ref-type="bibr" rid="ref76">76</xref>,<xref ref-type="bibr" rid="ref83">83</xref>,<xref ref-type="bibr" rid="ref85">85</xref>,<xref ref-type="bibr" rid="ref86">86</xref>,<xref ref-type="bibr" rid="ref91">91</xref>,<xref ref-type="bibr" rid="ref93">93</xref>,<xref ref-type="bibr" rid="ref95">95</xref>,<xref ref-type="bibr" rid="ref100">100</xref>,<xref ref-type="bibr" rid="ref101">101</xref>,<xref ref-type="bibr" rid="ref104">104</xref>] (Table S5 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). Additionally, 1 epidemiologic study used the Brier score to assess cardiovascular mortality [<xref ref-type="bibr" rid="ref53">53</xref>].</p></sec><sec id="s3-6"><title>Explainability</title><p>To enhance explainability, 22 (33.84%) studies implemented specific XAI methods to clarify the contribution of each predictor and the direction of the relationship with the outcome. Of these, 21 studies used Shapley Additive Explanations (SHAP) values, while 1 used local interpretable model-agnostic explanations (LIME). As shown in <xref ref-type="fig" rid="figure6">Figure 6</xref>, XAI methods, particularly SHAP values, have been applied across different health domains, showing a remarkable increase in use in 2025. The most common visualization methods were beeswarm and bar plots, with the contribution of each feature ranked along the y-axis, placing the most important feature at the top of the plot. The number of features plotted ranges from 6 to 50, with 20 being the most common (refer to <xref ref-type="table" rid="table2">Table 2</xref>).</p><fig position="float" id="figure6"><label>Figure 6.</label><caption><p>Bar plot depicting the application of explainable artificial intelligence (XAI) algorithms in different years per health outcome (N=22). LIME: local interpretable model-agnostic explanations; SHAP: Shapley Additive Explanations.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="humanfactors_v13i1e78648_fig06.png"/></fig><table-wrap id="t2" position="float"><label>Table 2.</label><caption><p>Summary of explainable artificial intelligence use by health outcome and healthy lifestyle components.</p></caption><table id="table2" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Study</td><td align="left" valign="bottom">Health outcome</td><td align="left" valign="bottom">Total number of features (features ranked)</td><td align="left" valign="bottom">Healthy lifestyle components (category, position, features ranked)</td><td align="left" valign="bottom">XAI<sup><xref ref-type="table-fn" rid="table2fn1">a</xref></sup> (visualization)</td></tr></thead><tbody><tr><td align="left" valign="top">Allen [<xref ref-type="bibr" rid="ref4">4</xref>]</td><td align="left" valign="top">Obesity</td><td align="left" valign="top">64 (10)</td><td align="left" valign="top">Physical activity (physical inactivity, 1, 10); diet (food insecurity, unranked, n/a); sleep (sleep hours, unranked, n/a); stress (n/ac<sup><xref ref-type="table-fn" rid="table2fn2">b</xref></sup>, n/a<sup><xref ref-type="table-fn" rid="table2fn3">c</xref></sup>, n/a).</td><td align="left" valign="top">LIME<sup><xref ref-type="table-fn" rid="table2fn4">d</xref></sup> (waterfall plot)</td></tr><tr><td align="left" valign="top">Gu et al [<xref ref-type="bibr" rid="ref16">16</xref>]</td><td align="left" valign="top">Infertility risk in women</td><td align="left" valign="top">39 (10)</td><td align="left" valign="top">Physical activity (physical activity health score, unranked, n/a); diet (diet health score, 10, 10); sleep (sleep health score, unranked, n/a); stress (n/ac, n/a, n/a).</td><td align="left" valign="top">SHAP<sup><xref ref-type="table-fn" rid="table2fn5">e</xref></sup> values (beeswarm plot, bar plot, and dependency plot)</td></tr><tr><td align="left" valign="top">Guthrie et al [<xref ref-type="bibr" rid="ref17">17</xref>]</td><td align="left" valign="top">Cardiometabolic disease</td><td align="left" valign="top">13 (13)</td><td align="left" valign="top">Physical activity (minutes of physical activity, 8, 13); diet (plant-based meal, 6, 13); sleep (n/ac, n/a, n/a); stress (n/ac, n/a, n/a).</td><td align="left" valign="top">SHAP values (beeswarm plot)</td></tr><tr><td align="left" valign="top">Huang et al [<xref ref-type="bibr" rid="ref20">20</xref>]</td><td align="left" valign="top">Cognitive function</td><td align="left" valign="top">20 (20)</td><td align="left" valign="top">Physical activity (exercise, 10, 20); diet (n/ac, n/a, n/a); sleep (sleep quality, 8, 20); stress (n/ac, n/a, n/a).</td><td align="left" valign="top">SHAP values (beeswarm plot and bar plot)</td></tr><tr><td align="left" valign="top">Jin and Halili [<xref ref-type="bibr" rid="ref21">21</xref>]</td><td align="left" valign="top">Mental health</td><td align="left" valign="top">21 (21)</td><td align="left" valign="top">Physical activity (intensity, unranked, n/a); diet (n/ac, n/a, n/a); sleep (sleep hours, 1, 21); stress (n/ac, n/a, n/a).</td><td align="left" valign="top">SHAP values (bar plot)</td></tr><tr><td align="left" valign="top">Kim et al [<xref ref-type="bibr" rid="ref22">22</xref>]</td><td align="left" valign="top">Quality of life</td><td align="left" valign="top">21 (20)</td><td align="left" valign="top">Physical activity (transport-related, 4, 20; physical activity score, 7, 20); diet (eating index, 15, 20); sleep (sleep quality, 2, 20; sleep hours, 6, 20); stress (stress level, 1, 20).</td><td align="left" valign="top">SHAP values (beeswarm plot)</td></tr><tr><td align="left" valign="top">Kiss et al [<xref ref-type="bibr" rid="ref24">24</xref>]</td><td align="left" valign="top">Mental health</td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top">SHAP values (bar plot)</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top">Positive affect: 231 (20)</td><td align="left" valign="top">Physical activity (doing outdoor activities, 3, 20; duration of sitting, 6, 20; frequency of walking, 7, 20); diet (n/ac, n/a, n/a); sleep (sleep disorder, 8, 20); stress (coping strategies, 9, 20).</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top">Perceived stress: 228 (20)</td><td align="left" valign="top">Physical activity (engagement, 12, 20); diet (n/ac, n/a, n/a); sleep (sleep hours, 7, 20); stress (coping strategies, 5, 20).</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top">Anxiety: 228 (20)</td><td align="left" valign="top">Physical activity (engagement, unranked, n/a); diet (n/ac, n/a, n/a); sleep (sleep hours, 15, 20); stress (coping strategies, 10, 20).</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top">Depressive symptoms: 240 (20)</td><td align="left" valign="top">Physical activity (engagement, 14, 20); diet (n/ac, n/a, n/a); sleep (sleep hours, 16, 20); stress (coping strategies, 9, 20).</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top">Li and Song [<xref ref-type="bibr" rid="ref25">25</xref>]</td><td align="left" valign="top">Cognitive function</td><td align="left" valign="top">20 (20)</td><td align="left" valign="top">Physical activity (sport social capital index, 3, 20); diet (n/ac, n/a, n/a); sleep (n/ac, n/a, n/a); stress (n/ac, n/a, n/a).</td><td align="left" valign="top">SHAP values (beeswarm plot, heat map, temporal analysis, and dependency plot)</td></tr><tr><td align="left" valign="top">Lin et al [<xref ref-type="bibr" rid="ref28">28</xref>]</td><td align="left" valign="top">Loneliness</td><td align="left" valign="top">15 (15)</td><td align="left" valign="top">Physical activity (exercise, 7, 15); diet (n/ac, n/a, n/a); sleep (n/ac, n/a, n/a); stress (n/ac, n/a, n/a).</td><td align="left" valign="top">SHAP values (beeswarm plot)</td></tr><tr><td align="left" valign="top">Luo et al [<xref ref-type="bibr" rid="ref33">33</xref>]</td><td align="left" valign="top">Frailty</td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top">SHAP values (beeswarm plot and dependency plot)</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top">US cohort: 121 (20)</td><td align="left" valign="top">Physical activity (play sports and exercise, 8, 20; moderate physical activity, 16, 20); diet (n/ac, n/a, n/a); sleep (sleep problems, 4, 20); stress (n/ac, n/a, n/a).</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top">UK cohort: 125 (20)</td><td align="left" valign="top">Physical activity (vigorous physical activity, 4, 20; moderate physical activity, 5, 20); diet (fruit consumption, 19, 20); sleep (sleep problems, 2, 20; sleep duration, 6, 20); stress (n/ac, n/a, n/a).</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top">China cohort: 94 (20)</td><td align="left" valign="top">Physical activity (n/ac, n/a, n/a); diet (n/ac, n/a, n/a); sleep (sleep problems, 5, 20; sleep duration, 8, 20); stress (n/ac, n/a, n/a).</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top">Majcherek et al [<xref ref-type="bibr" rid="ref34">34</xref>]</td><td align="left" valign="top">Mental health</td><td align="left" valign="top">26 (24)</td><td align="left" valign="top">Physical activity (sport, 6, 24; walking time, 11, 24); diet (vegetable portion, 13, 24; fruit portion, 14, 24); sleep (n/ac, n/a, n/a); stress (n/ac, n/a, n/a).</td><td align="left" valign="top">SHAP values (dependency plot)</td></tr><tr><td align="left" valign="top">Majcherek et al [<xref ref-type="bibr" rid="ref35">35</xref>]</td><td align="left" valign="top">Diabetes</td><td align="left" valign="top">22 (6)</td><td align="left" valign="top">Physical activity (regular physical activity, unranked, n/a); diet (habits, unranked, n/a); sleep (n/ac, n/a, n/a); stress (n/ac, n/a, n/a).</td><td align="left" valign="top">SHAP values (dependency plot)</td></tr><tr><td align="left" valign="top">Morris et al [<xref ref-type="bibr" rid="ref38">38</xref>]</td><td align="left" valign="top">Cardiovascular disease</td><td align="left" valign="top">50 (50)</td><td align="left" valign="top">Physical activity (availability of outdoor activities, 5, 50); diet (available favorable food stores, 14, 50); sleep (n/ac, n/a, n/a); stress (global stress, 18, 50).</td><td align="left" valign="top">SHAP values (bar plot)</td></tr><tr><td align="left" valign="top">Park et al [<xref ref-type="bibr" rid="ref43">43</xref>]</td><td align="left" valign="top">Visceral fat</td><td align="left" valign="top">32 (20)</td><td align="left" valign="top">Physical activity (frequency, unranked, n/a); diet (high rice consumption, 2, 20; Asian-style balanced diet, 6, 20); sleep (n/ac, n/a, n/a); stress (n/ac, n/a, n/a).</td><td align="left" valign="top">SHAP values (beeswarm plot and bar plot)</td></tr><tr><td align="left" valign="top">Ren et al [<xref ref-type="bibr" rid="ref51">51</xref>]</td><td align="left" valign="top">Cognitive function</td><td align="left" valign="top">39 (20)</td><td align="left" valign="top">Physical activity (exercise, 16, 20); diet (n/ac, n/a, n/a); sleep (n/ac, n/a, n/a); stress (n/ac, n/a, n/a).</td><td align="left" valign="top">SHAP values (beeswarm plot, bar plot, and force plot)</td></tr><tr><td align="left" valign="top">Sandri et al [<xref ref-type="bibr" rid="ref53">53</xref>]</td><td align="left" valign="top">Lifestyle (diet)</td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top">SHAP values (beeswarm plot)</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top">Mediterranean diet: 41 (20)</td><td align="left" valign="top">Physical activity (sport, 8, 20); diet (fish consumption, 1, 20); sleep (sleep quality, unranked, n/a); stress (n/ac, n/a, n/a).</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top">Intermittent fasting: 41 (20)</td><td align="left" valign="top">Physical activity (sport, 3, 20); diet (fish consumption, 1, 20); sleep (sleep quality, 14, 20); stress (n/ac, n/a, n/a).</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top">Vegan diet: 41 (20)</td><td align="left" valign="top">Physical activity (sport, 5, 20); diet (fish consumption, 1, 20); sleep (sleep quality, 9, 20); stress (n/ac, n/a, n/a).</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top">Vegetarian diet: 41 (20)</td><td align="left" valign="top">Physical activity (sport, 5, 20); diet (fish consumption, 1, 20); sleep (sleep quality, unranked, n/a); stress (n/ac, n/a, n/a).</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top">Shi et al [<xref ref-type="bibr" rid="ref55">55</xref>]</td><td align="left" valign="top">Osteoporosis</td><td align="left" valign="top">45 (20)</td><td align="left" valign="top">Physical activity (physical activity health score, 16, 20); diet (diet health score, unranked, n/a); sleep (sleep health score, 5, 20); stress (n/ac, n/a, n/a).</td><td align="left" valign="top">SHAP values (beeswarm plot, waterfall plot, and force plot)</td></tr><tr><td align="left" valign="top">Su et al [<xref ref-type="bibr" rid="ref58">58</xref>]</td><td align="left" valign="top">Resilience</td><td align="left" valign="top">12 (4)</td><td align="left" valign="top">Physical activity (n/ac, n/a, n/a); diet (n/ac, n/a, n/a); sleep (sleep disturbance, 3, 4); stress (n/ac, n/a, n/a).</td><td align="left" valign="top">SHAP values (beeswarm plot, bar plot, and dependency plot)</td></tr><tr><td align="left" valign="top">Wang et al [<xref ref-type="bibr" rid="ref60">60</xref>]</td><td align="left" valign="top">Lifestyle (sleep)</td><td align="left" valign="top">7 (7)</td><td align="left" valign="top">Physical activity (n/ac, n/a, n/a); diet (nutritional status, 3, 7); sleep (outcome, n/a, n/a); stress (n/ac, n/a, n/a).</td><td align="left" valign="top">SHAP values (beeswarm plot, bar plot, and waterfall plot)</td></tr><tr><td align="left" valign="top">Xin and Ren [<xref ref-type="bibr" rid="ref62">62</xref>]</td><td align="left" valign="top">Mental health</td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top">SHAP values (beeswarm plot and bar plot)</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top">Rural older adults: 55 (20)</td><td align="left" valign="top">Physical activity (exercise, 19, 20); diet (n/ac, n/a, n/a); sleep (sleep hours, 13, 20); stress (n/ac, n/a, n/a).</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top">Urban older adults: 55 (16)</td><td align="left" valign="top">Physical activity (exercise, unranked, n/a); diet (n/ac, n/a, n/a); sleep (sleep hours, 6, 16); stress (n/ac, n/a, n/a).</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top">Zhang et al [<xref ref-type="bibr" rid="ref63">63</xref>]</td><td align="left" valign="top">Lifestyle (sleep)</td><td align="left" valign="top">20 (10)</td><td align="left" valign="top">Physical activity (sedentary time, 5, 10); diet (vegetable consumption, 3, 10); sleep (outcome, n/a, n/a); stress (stress score, 1, 10).</td><td align="left" valign="top">SHAP values (beeswarm plot and dependency plot)</td></tr><tr><td align="left" valign="top">Zhou et al [<xref ref-type="bibr" rid="ref63">63</xref>]</td><td align="left" valign="top">Psoriasis</td><td align="left" valign="top">150 (20)</td><td align="left" valign="top">Physical activity (intensity, 17, 20); diet (habits, unranked, n/a); sleep (n/ac, n/a, n/a); stress (n/ac, n/a, n/a).</td><td align="left" valign="top">SHAP values (beeswarm plot)</td></tr></tbody></table><table-wrap-foot><fn id="table2fn1"><p><sup>a</sup>XAI: explainable artificial intelligence. </p></fn><fn id="table2fn2"><p><sup>b</sup>n/ac: not applicable.</p></fn><fn id="table2fn3"><p><sup>c</sup>n/a: not available.</p></fn><fn id="table2fn4"><p><sup>d</sup>LIME: local interpretable model-agnostic explanations. </p></fn><fn id="table2fn5"><p><sup>e</sup>SHAP: Shapley Additive Explanations.</p></fn></table-wrap-foot></table-wrap><p>Because the nonlifestyle features included in each model vary substantially across studies, the ranking reported in <xref ref-type="table" rid="table2">Table 2</xref> should be interpreted in relative terms. When a lifestyle behavior appears among the top-ranked features, this indicates that it contributed more strongly to the model than nonlifestyle variables included in the analysis. Conversely, lifestyle components appearing in lower positions acted as secondary predictors.</p><p>In a study on cardiometabolic disease [<xref ref-type="bibr" rid="ref76">76</xref>], the ML solution was first explained at the individual participant level to provide specific behavioral feedback, and then at the group level to reveal the ranking of features for succeeding in behavioral changes. In both models, physical activity and diet variables were among the top contributors. However, in another study [<xref ref-type="bibr" rid="ref65">65</xref>], neither regular physical activity nor diet habits were among the top 6 variables for predicting diabetes in adults.</p><p>In 4 mental health studies [<xref ref-type="bibr" rid="ref64">64</xref>,<xref ref-type="bibr" rid="ref67">67</xref>,<xref ref-type="bibr" rid="ref80">80</xref>,<xref ref-type="bibr" rid="ref85">85</xref>], SHAP values were used to rank the contribution of each feature. In 3 of the 4 studies, lifestyle variables were among the top contributors. In [<xref ref-type="bibr" rid="ref80">80</xref>], physical activity and fruit and vegetable consumption; in [<xref ref-type="bibr" rid="ref64">64</xref>], sleep variables were the top predictors of stress in young adolescents during the COVID-19 pandemic; and in [<xref ref-type="bibr" rid="ref85">85</xref>], sleep duration was identified as important for predicting depression. However, in [<xref ref-type="bibr" rid="ref67">67</xref>], the intensity of physical activity was unranked because it was excluded from the XAI analysis during a feature selection step prior to modeling. In the same study, sleep hours were the most important variable for predicting depression among adults. Regarding mental health studies, psychological resilience was assessed among medical students [<xref ref-type="bibr" rid="ref56">56</xref>], with sleep disturbance being a key factor affecting their resilience.</p><p>Three studies focusing on older adults in China had cognitive function as their outcome [<xref ref-type="bibr" rid="ref50">50</xref>,<xref ref-type="bibr" rid="ref52">52</xref>,<xref ref-type="bibr" rid="ref63">63</xref>]. In these studies, physical activity variables were ranked as top predictors. Additionally, in 1 of these studies [<xref ref-type="bibr" rid="ref63">63</xref>], sleep quality was ranked as the eighth top feature out of 20. Furthermore, when loneliness was assessed among older adults from China [<xref ref-type="bibr" rid="ref51">51</xref>], exercise was ranked as the seventh variable out of 15.</p><p>In a study predicting quality of life [<xref ref-type="bibr" rid="ref91">91</xref>], stress, sleep quality, and physical activity emerged as the strongest predictors, with the eating index appearing in the top 15 variables.</p><p>Two studies focused on sleep as the specific outcome. In [<xref ref-type="bibr" rid="ref86">86</xref>], the SHAP values ranked stress score, vegetable consumption, and sedentary time among the top 5 variables for predicting sleep disturbance. In [<xref ref-type="bibr" rid="ref97">97</xref>], nutritional status was the third most important variable for predicting the risk of sleep disorders in older adults.</p><p>In [<xref ref-type="bibr" rid="ref88">88</xref>], &#x201C;favorable&#x201D; food stores and global stress were identified as the top variables for predicting incidence of cardiovascular disease, with the availability of outdoor activities ranking in the top 5. In a longitudinal study investigating the association of diet with long-term reduction in waist circumference, SHAP values highlighted the importance of high-quality components in reducing visceral fat [<xref ref-type="bibr" rid="ref83">83</xref>]. This study also measured exercise with a single item of frequency, which was not included in the top ranking. Regarding a diet study [<xref ref-type="bibr" rid="ref94">94</xref>], the adoption of different diets in the Spanish population was assessed, with fish consumption positioned as the most important variable for all diets studied (Mediterranean, intermittent fasting, vegan, and vegetarian). In the same study, practicing sport was ranked among the top variables across the different diets. However, sleep quality was only included in the ranking for intermittent fasting and the vegan diet.</p><p>Physical inactivity emerged as the most important feature in explaining county-level obesity using LIME [<xref ref-type="bibr" rid="ref87">87</xref>]. In this study, the food environment and insufficient sleep, both measured as single items, were not included as top predictors of obesity prevalence.</p><p>In a cross-national study assessing frailty [<xref ref-type="bibr" rid="ref68">68</xref>], sleep variables were among the 20 most important variables across all the cohorts studied. Physical activity was included in the US and UK cohorts and was also ranked in the top 20 variables. In the UK cohort, fruit consumption was the 19th out of 20 key contributors to frailty.</p><p>One study on osteoporosis [<xref ref-type="bibr" rid="ref84">84</xref>] used the Life&#x2019;s Essential 8 scores for physical activity, diet, and sleep. Sleep and physical activity scores were among the 20 most important variables, but the diet health score was unranked. Similarly, the Life&#x2019;s Essential 8 scores were used to determine infertility risk in women [<xref ref-type="bibr" rid="ref60">60</xref>], with the diet score being the only one ranked among the top 10 variables.</p><p>Finally, 1 study combined lifestyle factors with metabolites associated with psoriasis [<xref ref-type="bibr" rid="ref71">71</xref>], with physical activity intensity ranked among the 20 key factors out of 150 variables, whereas dietary habits were not ranked.</p></sec><sec id="s3-7"><title>Software to Implement ML Models</title><p>Of the included papers in the review, 23 (35.38%) used R software (R Core Team) [<xref ref-type="bibr" rid="ref105">105</xref>] for data analysis (<xref ref-type="table" rid="table3">Table 3</xref>). The R packages used were data.table for data manipulation, tidyverse [<xref ref-type="bibr" rid="ref106">106</xref>] as a general package for data science, Multivariate Imputation by Chained Equations [<xref ref-type="bibr" rid="ref107">107</xref>] for missing data imputation, missMDA for performing multiple imputation with principal component analysis, FactoMineR for exploratory data analysis and principal component analysis, Boruta [<xref ref-type="bibr" rid="ref108">108</xref>] for feature selection through a wrapper algorithm, caret (Classification and Regression Training) [<xref ref-type="bibr" rid="ref109">109</xref>] for creating models, randomForest for RF analysis, randomForestSCR for RF for survival, regression, and classification analysis, rpart for recursive partitioning and regression trees, xgboost for extreme gradient boosting, bartMachine for Bayesian additive regression trees, kernlab and e1071 for support vector machines, survival for survival analysis, lime for local interpretable model-agnostic explanations, and finally, SuperLearner [<xref ref-type="bibr" rid="ref110">110</xref>] to choose the optimal learner for a given prediction problem with a k-fold cross-validation algorithm.</p><table-wrap id="t3" position="float"><label>Table 3.</label><caption><p>Softwares used in the reviewed studies to perform machine learning (ML) algorithms.</p></caption><table id="table3" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Software used</td><td align="left" valign="bottom">Number of studies</td><td align="left" valign="bottom">Study references</td></tr></thead><tbody><tr><td align="left" valign="top">R (R Core Team)</td><td align="left" valign="top">n=23</td><td align="left" valign="top">[<xref ref-type="bibr" rid="ref41">41</xref>,<xref ref-type="bibr" rid="ref45">45</xref>-<xref ref-type="bibr" rid="ref47">47</xref>,<xref ref-type="bibr" rid="ref49">49</xref>,<xref ref-type="bibr" rid="ref54">54</xref>,<xref ref-type="bibr" rid="ref55">55</xref>,<xref ref-type="bibr" rid="ref69">69</xref>,<xref ref-type="bibr" rid="ref72">72</xref>-<xref ref-type="bibr" rid="ref74">74</xref>,<xref ref-type="bibr" rid="ref77">77</xref>,<xref ref-type="bibr" rid="ref78">78</xref>,<xref ref-type="bibr" rid="ref80">80</xref>,<xref ref-type="bibr" rid="ref87">87</xref>,<xref ref-type="bibr" rid="ref90">90</xref>,<xref ref-type="bibr" rid="ref93">93</xref>,<xref ref-type="bibr" rid="ref95">95</xref>-<xref ref-type="bibr" rid="ref97">97</xref>,<xref ref-type="bibr" rid="ref99">99</xref>,<xref ref-type="bibr" rid="ref101">101</xref>,<xref ref-type="bibr" rid="ref111">111</xref>]</td></tr><tr><td align="left" valign="top">Python (Python Software Foundation)</td><td align="left" valign="top">n=24</td><td align="left" valign="top">[<xref ref-type="bibr" rid="ref42">42</xref>,<xref ref-type="bibr" rid="ref50">50</xref>,<xref ref-type="bibr" rid="ref52">52</xref>,<xref ref-type="bibr" rid="ref53">53</xref>,<xref ref-type="bibr" rid="ref56">56</xref>,<xref ref-type="bibr" rid="ref58">58</xref>,<xref ref-type="bibr" rid="ref61">61</xref>,<xref ref-type="bibr" rid="ref64">64</xref>,<xref ref-type="bibr" rid="ref65">65</xref>,<xref ref-type="bibr" rid="ref67">67</xref>,<xref ref-type="bibr" rid="ref70">70</xref>,<xref ref-type="bibr" rid="ref76">76</xref>,<xref ref-type="bibr" rid="ref79">79</xref>,<xref ref-type="bibr" rid="ref81">81</xref>,<xref ref-type="bibr" rid="ref83">83</xref>,<xref ref-type="bibr" rid="ref84">84</xref>,<xref ref-type="bibr" rid="ref86">86</xref>,<xref ref-type="bibr" rid="ref88">88</xref>,<xref ref-type="bibr" rid="ref89">89</xref>,<xref ref-type="bibr" rid="ref91">91</xref>,<xref ref-type="bibr" rid="ref98">98</xref>,<xref ref-type="bibr" rid="ref100">100</xref>,<xref ref-type="bibr" rid="ref102">102</xref>,<xref ref-type="bibr" rid="ref104">104</xref>]</td></tr><tr><td align="left" valign="top">R and Python</td><td align="left" valign="top">n=4</td><td align="left" valign="top">[<xref ref-type="bibr" rid="ref57">57</xref>,<xref ref-type="bibr" rid="ref63">63</xref>,<xref ref-type="bibr" rid="ref68">68</xref>,<xref ref-type="bibr" rid="ref71">71</xref>]</td></tr><tr><td align="left" valign="top">SPSS (IBM Corp)</td><td align="left" valign="top">n=2</td><td align="left" valign="top">[<xref ref-type="bibr" rid="ref62">62</xref>,<xref ref-type="bibr" rid="ref92">92</xref>]</td></tr><tr><td align="left" valign="top">MATLAB (The MathWorks Inc)</td><td align="left" valign="top">n=2</td><td align="left" valign="top">[<xref ref-type="bibr" rid="ref48">48</xref>,<xref ref-type="bibr" rid="ref66">66</xref>]</td></tr><tr><td align="left" valign="top">KNIME [<xref ref-type="bibr" rid="ref112">112</xref>]</td><td align="left" valign="top">n=2</td><td align="left" valign="top">[<xref ref-type="bibr" rid="ref43">43</xref>,<xref ref-type="bibr" rid="ref44">44</xref>]</td></tr></tbody></table></table-wrap><p>In contrast, 24 (36.92%) studies developed the models in Python (Python Software Foundation), using the following libraries: Scikit-learn, used in all studies for predictive data analysis; pandas, for manipulating tabular data; NumPy, for mathematical functions; Keras and TensorFlow, for implementing deep learning; lightGBM, for performing light gradient boosting machine; SHAP, to explain ML solutions; creme, for online ML; Bayesian optimization, as a global optimization package to find the maximum value of an unknown function in as few iterations as possible; imbalanced-learn, to combine either undersample or oversample methods; and TextBlob, emoji, nltk, and profanity, for processing and analyzing textual data<italic>.</italic></p><p>Finally, 4 studies used both Python and R, and 6 studies used other software programs such as SPSS, MATLAB, and KNIME. Eight papers did not report the software used [<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref40">40</xref>,<xref ref-type="bibr" rid="ref59">59</xref>,<xref ref-type="bibr" rid="ref60">60</xref>,<xref ref-type="bibr" rid="ref75">75</xref>,<xref ref-type="bibr" rid="ref82">82</xref>,<xref ref-type="bibr" rid="ref85">85</xref>,<xref ref-type="bibr" rid="ref94">94</xref>].</p></sec></sec><sec id="s4" sec-type="discussion"><title>Discussion</title><sec id="s4-1"><title>Overview</title><p>This scoping review of 65 studies provides the current state of the application of supervised ML algorithms for the analysis of lifestyle data. The increase in studies in this field since 2019 indicates that it is a noteworthy area of study. The diversity in the sample origin, alongside the accessibility to new AI tools and novel methods for monitoring health outcomes (eg, wearables), denotes global attention to lifestyle. This section addresses the methodological shortcomings found in the reviewed studies.</p></sec><sec id="s4-2"><title>About Data Acquisition</title><p>In relation to lifestyle data, we found that most studies adopted a multidomain approach, integrating more than just a single component. This strategy enhances and facilitates a more comprehensive understanding of health problems related to the 4 lifestyle domains considered in this review: physical activity, diet, sleep, and stress. The distribution of lifestyle domains identified here was similar to that reported in a previous scoping meta-review [<xref ref-type="bibr" rid="ref113">113</xref>], although we observe that sleep has gained prominence in recent years, now reaching a level comparable to diet. Although these results highlight the growing recognition of the interrelated nature of lifestyle behaviors, the imbalance in the distribution of these factors limits the capacity of current studies to fully model and understand the interaction among the 4 lifestyle components and their combined effects on health.</p><p>Concerning the data acquisition process, over half of the studies acquired their own data. This acquisition process implies control over variables and reduces the time required for cleaning [<xref ref-type="bibr" rid="ref114">114</xref>]. Interestingly, both self-acquired datasets and those sourced from private or public health repositories demonstrated gender parity in the analyzed datasets. However, we detected a major limitation in this part of the process regarding the data acquisition methodology. In most studies, data were collected through single items, such as regular physical activity (response &#x201C;yes&#x201D; or &#x201C;no&#x201D;) [<xref ref-type="bibr" rid="ref58">58</xref>] or usual time of waking up and going to bed [<xref ref-type="bibr" rid="ref62">62</xref>], resulting in low representativeness of the construct being measured. The result of this acquisition method is high heterogeneity in measures, which hinders their generalizability. Therefore, the quality of data must be one of the challenges to be addressed, and specifically, the consistency in measures [<xref ref-type="bibr" rid="ref115">115</xref>,<xref ref-type="bibr" rid="ref116">116</xref>].</p><p>Nevertheless, the current accessibility and precision of health sensors such as wearables [<xref ref-type="bibr" rid="ref117">117</xref>] and the Internet of Things [<xref ref-type="bibr" rid="ref118">118</xref>] may contribute to transferability and actionability in the population [<xref ref-type="bibr" rid="ref119">119</xref>]. The growth in technology allows the integration of different data forms as well as more objective measures of lifestyle, substantially reducing the impact of retrospective bias by tracking real-time data in an ecological situation [<xref ref-type="bibr" rid="ref120">120</xref>]. Therefore, merging questionnaires and sensor data may be the key to identifying relationships between lifestyle measurements and personalizing interventions or changes in specific behaviors. This integration would include physiological, psychological, and behavioral factors, which are the most common analysis types in the ML community to extract clinical insights [<xref ref-type="bibr" rid="ref121">121</xref>].</p></sec><sec id="s4-3"><title>About Characteristics of ML Models</title><p>Regarding the analysis of ML, 2 different approaches emerged in the reviewed studies: 1 focused on prediction through classification and regression problems, and the other focused on interpretability through feature selection. The first is already an acknowledged approach, while the second typically constitutes an important component of the ML process, specifically during the preprocessing stage. However, feature selection studies do not use model evaluation metrics, which can limit their statistical validity and the generalizability of results. Remarkably, the family of ML algorithms most closely related to feature selection is tree-based because it provides indices of the importance of each variable. Although most papers in this scoping review combined different families of algorithms and compared their results, the most common model family was tree-based, which was applied for each data typology identified. Specifically, RF is the most used algorithm, which may be due to its robustness in handling missing values, the consideration of complex interaction in the data [<xref ref-type="bibr" rid="ref122">122</xref>], and its lower sensitivity to variable scales [<xref ref-type="bibr" rid="ref123">123</xref>]. Despite the benefits of RF, the underusage of DL algorithms represents a critical missed opportunity for robustly analyzing complex and multimodal data. In this review, DL algorithms were underused for lifestyle data. This result may reflect a gap in expertise or access to computational resources among lifestyle researchers, potentially limiting the application of more complex models. With ongoing advances in computational power and algorithmic efficiency, it is expected that the use of DL algorithms will become more widespread in the near future [<xref ref-type="bibr" rid="ref124">124</xref>].</p><p>Regarding the preprocessing stage, most studies detailed some phases of the process, but there is no consensus on the description of this stage of ML. Variable transformation is a crucial step for certain algorithms, particularly for SVM and specific architectures of DL that exhibit sensitivity to the raw form of the variables. In this review, 12 out of 19 studies that performed the SVM algorithm, and 13 out of 26 studies focused on DL, reported variable transformation. Additionally, it is worth noting that these algorithms cannot handle missing values, requiring imputation before the modeling phase. Among the SVM studies, 11 out of 19 reported techniques for missing imputation, and 17 out of 26 DL studies explicitly addressed this. In contrast, tree-based algorithms are less sensitive to variable scales and missing values, yet incorporating these feature engineering steps could enhance model performance [<xref ref-type="bibr" rid="ref123">123</xref>]. It is noteworthy that the preprocessing steps, specifically how missing values are addressed, have been identified as a potential concern for transparency. This procedural aspect could introduce sampling biases, thereby influencing the generalizability and comprehension of the dataset context [<xref ref-type="bibr" rid="ref125">125</xref>].</p><p>Resampling techniques, aiming to balance the dataset, are commonly implemented in classification problems. SMOTE has been the most widely used technique in this review, especially because it achieves better results than a simple undersampling of the majority class. In the health domain, imbalanced datasets are common, and SMOTE oversamples the minority class with synthetic examples and randomly undersamples the majority class to balance the dataset [<xref ref-type="bibr" rid="ref126">126</xref>].</p><p>Finally, dimensionality reduction enables capturing the most relevant information for the outcome while eliminating noise and redundant information. In this review, dimensionality reduction was the most frequent preprocessing step, appearing in 38 studies. Notably, not only could SVM and DL models benefit from removing irrelevant predictors, but also in tree-based algorithms, dimensionality reduction minimizes model complexity, resource consumption, and data acquisition costs [<xref ref-type="bibr" rid="ref123">123</xref>].</p><p>The division of the original dataset is an essential step for assessing the performance of the ML solution. In this review, 8 studies did not report how they split their data to assess the model, which denotes a lack of generalization of their results. This omission represents a common issue in ML research that should be carefully addressed to minimize bias [<xref ref-type="bibr" rid="ref127">127</xref>]. Train and test division, also known as &#x201C;hold out,&#x201D; is a method with considerable variability due to the use of a unique random data distribution [<xref ref-type="bibr" rid="ref127">127</xref>]. Therefore, other methods might be more suitable. For example, leave-one-out cross-validation, which trains the model on &#x201C;n &#x2013; 1&#x201D; observations and makes predictions on the remaining one. Although effective for small datasets, it is computationally intensive with large datasets [<xref ref-type="bibr" rid="ref128">128</xref>]. K-fold cross-validation involves randomly dividing the original dataset into k groups. K-fold cross-validation not only offers computational advantage over leave-one-out, but also gives more accurate estimations due to the bias-variance trade-off [<xref ref-type="bibr" rid="ref128">128</xref>]. In time-series data, only 1 paper [<xref ref-type="bibr" rid="ref102">102</xref>] introduced a different form of data split, considering the dependencies of the entire series. Ideally, this type of data should be treated with a method called rolling forecast origin resampling, which estimates the model with historical data and evaluates it with the most recent data [<xref ref-type="bibr" rid="ref129">129</xref>]. In other words, the training set should ideally comprise observations that occurred before those in the test set; however, this method was not found in this review.</p><p>Regarding the evaluation of ML models, the choice of metrics depends on the nature of the problem, whether regression or classification. Specific evaluation metrics tailored to each problem are crucial for correct evaluation, aligning with the priorities and needs of each field. For instance, in medical studies where the cost of treatment in terms of health is high, it becomes crucial to identify true patients over false positives. In contrast, if the treatment has minimal side effects and has demonstrated benefits, sensitivity might not be as important as specificity. It is worth highlighting that in the field of data science, precision and recall are more commonly used, whereas in medical fields, specificity and sensitivity are more prevalent [<xref ref-type="bibr" rid="ref18">18</xref>]. These differences may cause misunderstandings between the 2 domains.</p></sec><sec id="s4-4"><title>About Explainability Methods</title><p>Regarding model explainability, 22 studies incorporated a dedicated step in the ML process for explainability. SHAP values and LIME were the only XAI methods applied to lifestyle data, and these 2 methods were the most common in a recent systematic review on XAI methods [<xref ref-type="bibr" rid="ref130">130</xref>]. XAI-related studies in this review were published since 2019, with a notable increase in the number of publications in 2025, comprising half of the papers. This exponential growth was also found in [<xref ref-type="bibr" rid="ref27">27</xref>,<xref ref-type="bibr" rid="ref28">28</xref>], where the trend in published papers occurred between 2016 and 2022. Thus, our review demonstrates this exponential distribution in the health and behavioral sciences, where XAI methods are gaining prominence.</p><p>Although tree-based algorithms, especially decision trees, are known for facilitating interpretation, SHAP values can be applied to any type of model [<xref ref-type="bibr" rid="ref131">131</xref>]. The adoption of XAI in lifestyle studies remains low (33.84%). One possible explanation for this is that explainability algorithms are often not integrated into a standard ML pipeline, thereby increasing the technical complexity of the workflow. However, some efforts are being made by R and Python developers to incorporate XAI algorithms into pipelines using libraries such as H2O [<xref ref-type="bibr" rid="ref132">132</xref>].</p><p>In this review, lifestyle components (physical activity, diet, sleep, and stress) consistently appeared among the top-ranked features in models using XAI techniques, highlighting their substantive contribution relative to nonlifestyle variables. These findings align with prior research emphasizing the integration of diverse lifestyle components [<xref ref-type="bibr" rid="ref133">133</xref>,<xref ref-type="bibr" rid="ref134">134</xref>]. However, the level of interpretability achieved also depends on the quality of data used in the models, which in some studies did not meet expected standards. For instance, in a study where the focus was on obesity, the diet component was not among the top-ranked features [<xref ref-type="bibr" rid="ref87">87</xref>]. In this county-level study, a food environment index was measured as a single item, potentially inadequately representing the diet component of lifestyle.</p><p>Therefore, integrating XAI methods into the ML process could enable tailored interventions based on model results, provided that measures are collected accurately. Furthermore, the adoption of XAI algorithms contributes to increased trust and verification of the fairness of the models. This approach can also facilitate the translation of findings to stakeholders and health systems, thereby enhancing transparency, promoting the adoption of models in society, and supporting informed decision-making [<xref ref-type="bibr" rid="ref27">27</xref>].</p></sec><sec id="s4-5"><title>About the Software for Implementing ML Models</title><p>Competition between Python and R for ML software dominance in data science is currently intense. Both Python and R are freely distributed, object-oriented software with large and active communities. Python, as a programming language, offers specific implementations through libraries tailored for statistical analysis, including ML and DL. In contrast, R is a statistical software that integrates fundamental statistics into its base functionalities. While Python requires libraries for each stage of analysis, its well-established libraries streamline the process. On the other hand, R faces challenges due to its heterogeneous libraries, which hinder replicability and require expertise in varying syntax across packages. To address this concern, the meta-package tidymodels (Max Kuhn and Hadley Wickham) resolves these issues by integrating all necessary packages for each ML step, using a unified syntax. Additionally, tidymodels integrates user-friendly interfaces and promotes good methodological practice, thereby preventing user errors [<xref ref-type="bibr" rid="ref135">135</xref>]. Conversely, Python presents a preferable environment for DL with the TensorFlow and PyTorch frameworks. In this regard, the possibility of developing ML projects on powerful computational cloud-based platforms, such as Google Colaboratory (also referred to as Google Colab) [<xref ref-type="bibr" rid="ref136">136</xref>], offers Python a remarkable advantage over R local environments.</p></sec><sec id="s4-6"><title>Methodological and Reporting Guidelines and Checklist</title><p>Based on the review&#x2019;s results and to enhance transparency and replicability in multidisciplinary sciences [<xref ref-type="bibr" rid="ref137">137</xref>], we provide comprehensive methodological and reporting guidelines and a checklist for ML projects. Although various studies have proposed guidelines and checklists [<xref ref-type="bibr" rid="ref138">138</xref>,<xref ref-type="bibr" rid="ref139">139</xref>], the rapid expansion of ML algorithms in health domains necessitates iterative evaluation to incorporate new steps into the ML research workflow. The guidelines and checklist (<xref ref-type="supplementary-material" rid="app3">Checklist 2</xref>) are based on the 5 stages of the ML workflow, as depicted in <xref ref-type="fig" rid="figure2">Figure 2</xref>, with added software tools.</p><sec id="s4-6-1"><title>Data Acquisition</title><p>The integration of multidomain data enhances the comprehension of real-world problems. Using appropriate methods to collect data ensures representativeness. We recommend the use of standardized questionnaires and validated sensors. Regarding health repositories, we recommend providing information about data characteristics such as gender distribution, sample size, and variable descriptions [<xref ref-type="bibr" rid="ref140">140</xref>].</p></sec><sec id="s4-6-2"><title>Preprocessing</title><p>Reporting the preprocessing methods used in the data analysis is particularly crucial for ensuring replicability. While preprocessing contributes to improving data quality, different preprocessing methods can lead to different results. We propose the following recommendations for each preprocessing step, although not all steps need to be performed in every ML project.</p><sec id="s4-6-2-1"><title>Transformation</title><p>Categorical data should be encoded using methods such as one-hot encoding and dummy variables. Continuous data should be transformed using normalization or rescaling of features with different units to ensure algorithm performance, particularly for those sensitive to the raw form of variables [<xref ref-type="bibr" rid="ref123">123</xref>].</p></sec><sec id="s4-6-2-2"><title>Missing Imputation</title><p>Some algorithms cannot handle missing data and require imputation before modeling. Depending on the number of observations and the data distribution, imputation with the mean, median, or mode is typical. For time-series data, imputation with the last or next observation is preferred, though rolling statistics imputation or interpolation may offer better solutions [<xref ref-type="bibr" rid="ref141">141</xref>].</p></sec><sec id="s4-6-2-3"><title>Resampling</title><p>Imbalanced datasets can bias models, resulting in poor performance on underrepresented classes [<xref ref-type="bibr" rid="ref142">142</xref>]. While SMOTE is an effective technique for handling imbalanced datasets, it is not without its limitations. However, when the class imbalance ratio is extremely high, SMOTE can potentially bias the model performance by overfitting the minority class. This issue is particularly pronounced in datasets containing noise, as synthetic observations may replicate these artifacts. To mitigate these challenges, recent studies have proposed tree algorithms, which have shown effectiveness in handling class imbalance [<xref ref-type="bibr" rid="ref143">143</xref>]. Furthermore, due to their robustness, the use of tree-based algorithms is increasingly recommended when working with class imbalance [<xref ref-type="bibr" rid="ref144">144</xref>].</p></sec><sec id="s4-6-2-4"><title>Dimensionality Reduction</title><p>Removing noise from the dataset and retaining features directly related to the outcome can enhance both data acquisition and modeling efficiency. Removing correlated features is particularly beneficial [<xref ref-type="bibr" rid="ref123">123</xref>].</p></sec></sec></sec><sec id="s4-7"><title>Modeling</title><p>Our guidelines focused on SL algorithms for classification and regression problems. The choice of algorithms depends on the measurement of the outcome. We recommend using multiple algorithms to compare results and select the best fit, given that there is significant variability across problems [<xref ref-type="bibr" rid="ref145">145</xref>]. Additionally, comparing different families of algorithms is also advisable, as some improvements exist within the same family. When it comes to replicability and transparency, reporting algorithm hyperparameters is crucial in ML problems, as different configurations can yield varying results [<xref ref-type="bibr" rid="ref146">146</xref>].</p></sec><sec id="s4-8"><title>Evaluation</title><p>Avoiding overfitting requires dividing the original dataset appropriately. This step is fundamental in ML implementation and should be considered in every study to ensure that the extracted insights are reliable and generalizable. This division depends on data typology; we identified 3 different typologies relevant at this stage, defined by whether time is an implicit factor in the data acquisition process.</p><sec id="s4-8-1"><title>Cross-Sectional</title><p>Data are collected at a single point in time, with no temporal dependencies. Leave-one-out cross-validation is effective for small datasets (n&#x003C;150) typically seen in life sciences; the computational complexity increases [<xref ref-type="bibr" rid="ref147">147</xref>]. K-fold cross-validation is recommended for large datasets to balance the bias-variance trade-off [<xref ref-type="bibr" rid="ref128">128</xref>]. Cross-validation with bootstrap resampling can also be used to evaluate the performance of the models and estimate CIs of performance metrics [<xref ref-type="bibr" rid="ref148">148</xref>].</p></sec><sec id="s4-8-2"><title>Longitudinal</title><p>In longitudinal studies, researchers collect repeated measures, potentially with dependencies between observations and high correlation that can bias the model [<xref ref-type="bibr" rid="ref135">135</xref>]. Data should be divided by grouping individual participants&#x2019; information. The methods used are similar to those for cross-sectional data, but with consideration of partitioning.</p></sec><sec id="s4-8-3"><title>Time Series</title><p>Time series data are a sequence of data points in chronological order. Rolling forecast origin resampling is suitable for this data [<xref ref-type="bibr" rid="ref129">129</xref>]. The training set should include observations occurring before those in the test set.</p></sec><sec id="s4-8-4"><title>Evaluation Metrics</title><p>Appropriate metrics should be selected based on the type of ML problem (regression or classification) [<xref ref-type="bibr" rid="ref149">149</xref>] and the characteristics of the study field [<xref ref-type="bibr" rid="ref18">18</xref>]. It is also recommended to compute evaluation metrics repeatedly across cross-validation samples and to apply nonparametric tests, such as the Wilcoxon signed-rank test and the Friedman test, to assess model performance [<xref ref-type="bibr" rid="ref149">149</xref>]. For imbalanced datasets, performance metrics such as balanced accuracy and <italic>F</italic><sub>1</sub>-score are recommended. For example, in an imbalanced dataset, a model may achieve high accuracy by predominantly predicting the majority class. In contrast, balanced accuracy assigns equal weight to each class regardless of its frequency, providing a more informative evaluation of model performance [<xref ref-type="bibr" rid="ref150">150</xref>].</p></sec></sec><sec id="s4-9"><title>Explainability</title><sec id="s4-9-1"><title>Explainability Overview</title><p>Reporting the method of explainability used in the ML projects is essential. It is important to distinguish between interpretability and explainability. While explainability refers to understanding the effect of each feature on the original model, interpretability involves deriving actionable insights from the model&#x2019;s prediction. Although tree-based methods include importance metrics, they do not indicate the direction of relationships with the outcome. Incorporating explainable resources such as SHAP values [<xref ref-type="bibr" rid="ref151">151</xref>] or LIME [<xref ref-type="bibr" rid="ref152">152</xref>] enhances the interpretability of the results, providing both actionability and transparency, and transforming black boxes into glass box models. The H2O package in R offers XAI algorithms that are compatible with the framework tidymodels, enabling a unified workflow for modeling and explainability. For a more detailed taxonomy of XAI packages in R, we refer the reader to [<xref ref-type="bibr" rid="ref153">153</xref>].</p><p>Additionally, the choice of appropriate visualization methods and the number of features displayed are crucial for ensuring comprehensive results and supporting fine-grained decision-making. Regarding the number of features, we recommend visualizing at least the top 20 features whenever possible, as this allows a broader understanding of the contribution of the most important variables. Furthermore, future studies should report all model features used in the ML analysis, not only the top-ranked ones, to ensure full transparency and allow readers to verify which HL components were excluded or had low impact in the model. Based on SHAP values, we propose the following XAI visualization techniques [<xref ref-type="bibr" rid="ref94">94</xref>,<xref ref-type="bibr" rid="ref154">154</xref>]:</p></sec><sec id="s4-9-2"><title>Beeswarm Plot</title><p>This is the most common summary plot, where features are ranked on the y-axis from most to least contribution by their mean absolute SHAP value. The x-axis represents the SHAP values, which express the change in the log-odds (or model output), resulting in a positive or negative contribution for a specific observation. Each dot represents an observation in the dataset, and the color is indicative of the original value for that observation. Higher values are displayed as red and lower values as blue. The vertical dotted line represents the zero SHAP contribution. Contributions to the right assign a positive effect, and those to the left assign a negative effect.</p></sec><sec id="s4-9-3"><title>Dependency Plots</title><p>Scatter plots that show the effect a single feature has on the model&#x2019;s predictions. Each point represents an instance&#x2019;s feature value and its corresponding SHAP value. This plot provides a detailed and clear explanation of the direction and magnitude of the relationship (whether linear or nonlinear) between the feature and the outcome.</p></sec><sec id="s4-9-4"><title>Bar Plot</title><p>This plot provides information on the global feature importance. Features are ordered on the y-axis from the highest to the lowest average contribution to the outcome.</p></sec><sec id="s4-9-5"><title>Waterfall Plot</title><p>This plot is a local explanation that illustrates the contribution of each feature in transforming the expected value <inline-formula><mml:math id="ieqn1"><mml:mstyle><mml:mrow><mml:mstyle displaystyle="false"><mml:mi>E</mml:mi><mml:mo stretchy="false">[</mml:mo><mml:mi>f</mml:mi><mml:mo stretchy="false">(</mml:mo><mml:mi>x</mml:mi><mml:mo stretchy="false">)</mml:mo><mml:mo stretchy="false">]</mml:mo></mml:mstyle></mml:mrow></mml:mstyle></mml:math></inline-formula> into the final prediction <inline-formula><mml:math id="ieqn2"><mml:mstyle><mml:mrow><mml:mstyle displaystyle="false"><mml:mi>f</mml:mi><mml:mo stretchy="false">(</mml:mo><mml:mi>x</mml:mi><mml:mo stretchy="false">)</mml:mo></mml:mstyle></mml:mrow></mml:mstyle></mml:math></inline-formula> for a specific instance. Each row represents a feature&#x2019;s contribution; positive contributions are red, while negative contributions are blue.</p></sec><sec id="s4-9-6"><title>Force Plot</title><p>This plot is a local explanation that shows the effect and the direction of the most impactful features for a given observation.</p></sec></sec><sec id="s4-10"><title>Software</title><p>Python and R were the most widely used software in the review. However, the variety of libraries can complicate the process. To address this, the metapackage &#x201C;tidymodels&#x201D; provides unified syntax, enhancing replicability [<xref ref-type="bibr" rid="ref135">135</xref>]. For DL, Python offers a more powerful environment thanks to PyTorch and TensorFlow frameworks and the possibility of developing analyses on cloud services such as Google Colab. Furthermore, we encourage researchers to make their code publicly available in open repositories such as GitHub.</p></sec><sec id="s4-11"><title>Limitations</title><p>At the level of the review itself, some limitations emerge. Although time-series data were frequently used in the analysis of lifestyle behaviors, the primary focus of this review was on the methodological framework of supervised ML, rather than on specific time-series modeling approaches. Future research should specifically address this gap by examining the current use of time-series models applied to wearable data to better capture human behavior. Moreover, the exclusion of UL algorithms limits the scope of ML algorithms covered in this review. For example, cluster analysis has been used to classify children according to their eating behaviors and identify features related to obesity [<xref ref-type="bibr" rid="ref155">155</xref>], with findings suggesting that interventions such as reducing eating speed may help prevent childhood obesity. This scoping review focuses on supervised ML approaches, but future research could examine the current application of UL in lifestyle data. Finally, a further limitation of this review is that the search strategy prioritized studies using the umbrella term &#x201C;healthy lifestyle.&#x201D; While this approach captured a representative sample of research explicitly conceptualized as HL, it may have excluded multidimensional studies examining combinations of physical activity, diet, sleep, or stress that did not use this terminology. Although an interaction block was incorporated to address the interconnectedness among these domains, we acknowledge that some multidomain research may not have been retrieved due to the specificity of the search string.</p></sec><sec id="s4-12"><title>Conclusion</title><p>This review has identified several limitations within the studies reviewed that need to be addressed. First, ensuring data quality remains a significant challenge that must be addressed by carefully selecting data acquisition methods to build reliable and robust models. Second, the evaluation process is crucial for preventing overfitting, and using hold-out cross-validation can lead to high variance partitioning. Therefore, it is recommended to implement k-fold cross-validation at various stages, such as during validation; for time-series data, rolling forecast origin resampling is recommended [<xref ref-type="bibr" rid="ref129">129</xref>].</p><p>In conclusion, this scoping review provides a comprehensive analysis of lifestyle using ML models and serves as a guideline for future research. While the relationship between lifestyle and health is well-established, ongoing efforts are needed to refine how we measure lifestyle to create robust models. It is essential to focus not only on model performance but also on data representativeness, which is closely related to the granularity established during data collection. Although RF algorithms are prominent in lifestyle data analysis, it is recommended to compare their performance with other algorithms within and across families. Future research should also incorporate SHAP values to enhance interpretability within the ML workflow. Additionally, the <italic>tidymodels</italic> metapackage (R software) with H2O for XAI can assist researchers in evaluating process quality with unified syntax, thereby contributing to replicability.</p></sec></sec></body><back><ack><p>This work was supported by the Catalonian Government through a FI-SDUR grant (ref 2023FISDU_00217).</p></ack><notes><sec><title>Funding</title><p>This work was supported by grants PID2019-107473RB-C21 and PID2022-141403NB-I00, funded by MCIN/AEI/10.13039/501100011033/FEDER, UE, and 2021SGR-00806, funded by the Catalonian Government. Additional funding was provided by the Catalonian Government through an FI-SDUR grant (ref 2023FISDU_00217).</p></sec><sec><title>Data Availability</title><p>The datasets generated or analyzed during this study are available in the</p><p>CORA Repositori de Dades de Recerca repository [<xref ref-type="bibr" rid="ref31">31</xref>].</p></sec></notes><fn-group><fn fn-type="con"><p>TE contributed to conceptualization, validation, formal analysis, investigation, data curation, writing of the original draft, and visualization. LC contributed to conceptualization, writing (review and editing), supervision, project administration, and funding acquisition. CA contributed to validation and writing (review and editing). JML contributed to conceptualization, methodology, writing (review and editing), supervision, project administration, and funding acquisition.</p></fn><fn fn-type="conflict"><p>None declared.</p></fn></fn-group><glossary><title>Abbrevations</title><def-list><def-item><term id="abb1">AI</term><def><p>artificial intelligence</p></def></def-item><def-item><term id="abb2">DASS</term><def><p>Depression Anxiety Stress Scale</p></def></def-item><def-item><term id="abb3">FFQ</term><def><p>Food Frequency Questionnaire</p></def></def-item><def-item><term id="abb4">FNN</term><def><p>fuzzy neural network</p></def></def-item><def-item><term id="abb5">GPAQ</term><def><p>Global Physical Activity Questionnaire</p></def></def-item><def-item><term id="abb6">HL</term><def><p>healthy lifestyle</p></def></def-item><def-item><term id="abb7">IMS-PAQ</term><def><p>Indian Migration Study Physical Activity Questionnaire</p></def></def-item><def-item><term id="abb8">INPLASY</term><def><p>International Platform of Registered Systematic Review and Meta-Analysis Protocols</p></def></def-item><def-item><term id="abb9">IPAQ</term><def><p>International Physical Activity Questionnaire</p></def></def-item><def-item><term id="abb10">LIME</term><def><p>local interpretable model-agnostic explanations</p></def></def-item><def-item><term id="abb11">ML</term><def><p>machine learning</p></def></def-item><def-item><term id="abb12">NN</term><def><p>neural network</p></def></def-item><def-item><term id="abb13">NutSo-HH</term><def><p>Nutritional and Social Healthy Habits Scale</p></def></def-item><def-item><term id="abb14">PRESS</term><def><p>Peer Review of Electronic Search Strategies</p></def></def-item><def-item><term id="abb15">PRISMA-S</term><def><p>Preferred Reporting Items for Systematic Reviews and Meta-Analyses&#x2013;Search extension</p></def></def-item><def-item><term id="abb16">PRISMA-ScR</term><def><p>Preferred Reporting Items for Systematic Reviews and Meta-Analyses extension for Scoping Reviews</p></def></def-item><def-item><term id="abb17">RF</term><def><p>random forest</p></def></def-item><def-item><term id="abb18">SHAP</term><def><p>Shapley Additive Explanation</p></def></def-item><def-item><term id="abb19">SL</term><def><p>supervised learning</p></def></def-item><def-item><term id="abb20">SMOTE</term><def><p>synthetic minority oversampling technique</p></def></def-item><def-item><term id="abb21">SQUASH</term><def><p>Short Questionnaire to Assess Health-Enhancing Physical Activity</p></def></def-item><def-item><term id="abb22">SVM</term><def><p>support vector machine</p></def></def-item><def-item><term id="abb23">UL</term><def><p>unsupervised learning</p></def></def-item><def-item><term id="abb24">XAI</term><def><p>explainable artificial intelligence</p></def></def-item></def-list></glossary><ref-list><title>References</title><ref id="ref1"><label>1</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Furihata</surname><given-names>R</given-names> </name><name name-style="western"><surname>Konno</surname><given-names>C</given-names> </name><name name-style="western"><surname>Suzuki</surname><given-names>M</given-names> </name><etal/></person-group><article-title>Unhealthy lifestyle factors and depressive symptoms: a Japanese general adult population survey</article-title><source>J Affect Disord</source><year>2018</year><month>07</month><volume>234</volume><fpage>156</fpage><lpage>161</lpage><pub-id pub-id-type="doi">10.1016/j.jad.2018.02.093</pub-id><pub-id pub-id-type="medline">29529548</pub-id></nlm-citation></ref><ref id="ref2"><label>2</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Nudelman</surname><given-names>G</given-names> </name><name name-style="western"><surname>Shiloh</surname><given-names>S</given-names> </name></person-group><article-title>Connectionism and behavioral clusters: differential patterns in predicting expectations to engage in health behaviors</article-title><source>Ann Behav Med</source><year>2018</year><month>09</month><day>13</day><volume>52</volume><issue>10</issue><fpage>890</fpage><lpage>901</lpage><pub-id pub-id-type="doi">10.1093/abm/kax063</pub-id><pub-id pub-id-type="medline">30212846</pub-id></nlm-citation></ref><ref id="ref3"><label>3</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Nudelman</surname><given-names>G</given-names> </name><name name-style="western"><surname>Shiloh</surname><given-names>S</given-names> </name></person-group><article-title>Mapping health behaviors: constructing and validating a common-sense taxonomy of health behaviors</article-title><source>Soc Sci Med</source><year>2015</year><month>12</month><volume>146</volume><fpage>1</fpage><lpage>10</lpage><pub-id pub-id-type="doi">10.1016/j.socscimed.2015.10.004</pub-id><pub-id pub-id-type="medline">26473449</pub-id></nlm-citation></ref><ref id="ref4"><label>4</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kaminsky</surname><given-names>LA</given-names> </name><name name-style="western"><surname>German</surname><given-names>C</given-names> </name><name name-style="western"><surname>Imboden</surname><given-names>M</given-names> </name><name name-style="western"><surname>Ozemek</surname><given-names>C</given-names> </name><name name-style="western"><surname>Peterman</surname><given-names>JE</given-names> </name><name name-style="western"><surname>Brubaker</surname><given-names>PH</given-names> </name></person-group><article-title>The importance of healthy lifestyle behaviors in the prevention of cardiovascular disease</article-title><source>Prog Cardiovasc Dis</source><year>2022</year><month>01</month><volume>70</volume><fpage>8</fpage><lpage>15</lpage><pub-id pub-id-type="doi">10.1016/j.pcad.2021.12.001</pub-id></nlm-citation></ref><ref id="ref5"><label>5</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Braun</surname><given-names>C</given-names> </name><name name-style="western"><surname>Foreyt</surname><given-names>JP</given-names> </name><name name-style="western"><surname>Johnston</surname><given-names>CA</given-names> </name></person-group><article-title>Stress: a core lifestyle issue</article-title><source>Am J Lifestyle Med</source><year>2016</year><volume>10</volume><issue>4</issue><fpage>235</fpage><lpage>238</lpage><pub-id pub-id-type="doi">10.1177/1559827616642400</pub-id><pub-id pub-id-type="medline">30202277</pub-id></nlm-citation></ref><ref id="ref6"><label>6</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Wong</surname><given-names>VWH</given-names> </name><name name-style="western"><surname>Ho</surname><given-names>FYY</given-names> </name><name name-style="western"><surname>Shi</surname><given-names>NK</given-names> </name><name name-style="western"><surname>Sarris</surname><given-names>J</given-names> </name><name name-style="western"><surname>Chung</surname><given-names>KF</given-names> </name><name name-style="western"><surname>Yeung</surname><given-names>WF</given-names> </name></person-group><article-title>Lifestyle medicine for depression: a meta-analysis of randomized controlled trials</article-title><source>J Affect Disord</source><year>2021</year><month>04</month><volume>284</volume><fpage>203</fpage><lpage>216</lpage><pub-id pub-id-type="doi">10.1016/j.jad.2021.02.012</pub-id></nlm-citation></ref><ref id="ref7"><label>7</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Sagner</surname><given-names>M</given-names> </name><name name-style="western"><surname>Katz</surname><given-names>D</given-names> </name><name name-style="western"><surname>Egger</surname><given-names>G</given-names> </name><etal/></person-group><article-title>Lifestyle medicine potential for reversing a world of chronic disease epidemics: from cell to community</article-title><source>Int J Clin Pract</source><year>2014</year><month>11</month><volume>68</volume><issue>11</issue><fpage>1289</fpage><lpage>1292</lpage><pub-id pub-id-type="doi">10.1111/ijcp.12509</pub-id></nlm-citation></ref><ref id="ref8"><label>8</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Cerf</surname><given-names>ME</given-names> </name></person-group><article-title>Healthy lifestyles and noncommunicable diseases: nutrition, the life&#x2010;course, and health promotion</article-title><source>Lifestyle Medicine</source><year>2021</year><month>04</month><access-date>2026-02-20</access-date><volume>2</volume><issue>2</issue><fpage>e31</fpage><comment><ext-link ext-link-type="uri" xlink:href="https://onlinelibrary.wiley.com/toc/26883740/2/2">https://onlinelibrary.wiley.com/toc/26883740/2/2</ext-link></comment><pub-id pub-id-type="doi">10.1002/lim2.31</pub-id></nlm-citation></ref><ref id="ref9"><label>9</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Gurrin</surname><given-names>C</given-names> </name><name name-style="western"><surname>Smeaton</surname><given-names>AF</given-names> </name><name name-style="western"><surname>Doherty</surname><given-names>AR</given-names> </name></person-group><article-title>LifeLogging: personal big data</article-title><source>Foundations and Trends&#x00AE; in Information Retrieval</source><year>2014</year><month>06</month><day>16</day><volume>8</volume><issue>1</issue><fpage>1</fpage><lpage>125</lpage><pub-id pub-id-type="doi">10.1561/1500000033</pub-id></nlm-citation></ref><ref id="ref10"><label>10</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lim</surname><given-names>J</given-names> </name><name name-style="western"><surname>Jeong</surname><given-names>CY</given-names> </name><name name-style="western"><surname>Lim</surname><given-names>JM</given-names> </name><etal/></person-group><article-title>Assessing sleep quality using mobile EMAs: opportunities, practical consideration, and challenges</article-title><source>IEEE Access</source><year>2022</year><volume>10</volume><fpage>2063</fpage><lpage>2076</lpage><pub-id pub-id-type="doi">10.1109/ACCESS.2021.3140074</pub-id></nlm-citation></ref><ref id="ref11"><label>11</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kline</surname><given-names>A</given-names> </name><name name-style="western"><surname>Wang</surname><given-names>H</given-names> </name><name name-style="western"><surname>Li</surname><given-names>Y</given-names> </name><etal/></person-group><article-title>Multimodal machine learning in precision health: a scoping review</article-title><source>NPJ Digit Med</source><year>2022</year><month>11</month><day>7</day><volume>5</volume><issue>1</issue><fpage>171</fpage><pub-id pub-id-type="doi">10.1038/s41746-022-00712-8</pub-id><pub-id pub-id-type="medline">36344814</pub-id></nlm-citation></ref><ref id="ref12"><label>12</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Beam</surname><given-names>AL</given-names> </name><name name-style="western"><surname>Kohane</surname><given-names>IS</given-names> </name></person-group><article-title>Big data and machine learning in health care</article-title><source>JAMA</source><year>2018</year><month>04</month><day>3</day><volume>319</volume><issue>13</issue><fpage>1317</fpage><lpage>1318</lpage><pub-id pub-id-type="doi">10.1001/jama.2017.18391</pub-id><pub-id pub-id-type="medline">29532063</pub-id></nlm-citation></ref><ref id="ref13"><label>13</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Maleki</surname><given-names>F</given-names> </name><name name-style="western"><surname>Ovens</surname><given-names>K</given-names> </name><name name-style="western"><surname>Najafian</surname><given-names>K</given-names> </name><name name-style="western"><surname>Forghani</surname><given-names>B</given-names> </name><name name-style="western"><surname>Reinhold</surname><given-names>C</given-names> </name><name name-style="western"><surname>Forghani</surname><given-names>R</given-names> </name></person-group><article-title>Overview of machine learning part 1</article-title><source>Neuroimaging Clin N Am</source><year>2020</year><month>11</month><volume>30</volume><issue>4</issue><fpage>e17</fpage><lpage>e32</lpage><pub-id pub-id-type="doi">10.1016/j.nic.2020.08.007</pub-id></nlm-citation></ref><ref id="ref14"><label>14</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Secinaro</surname><given-names>S</given-names> </name><name name-style="western"><surname>Calandra</surname><given-names>D</given-names> </name><name name-style="western"><surname>Secinaro</surname><given-names>A</given-names> </name><name name-style="western"><surname>Muthurangu</surname><given-names>V</given-names> </name><name name-style="western"><surname>Biancone</surname><given-names>P</given-names> </name></person-group><article-title>The role of artificial intelligence in healthcare: a structured literature review</article-title><source>BMC Med Inform Decis Mak</source><year>2021</year><month>04</month><day>10</day><volume>21</volume><issue>1</issue><fpage>125</fpage><pub-id pub-id-type="doi">10.1186/s12911-021-01488-9</pub-id><pub-id pub-id-type="medline">33836752</pub-id></nlm-citation></ref><ref id="ref15"><label>15</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Breiman</surname><given-names>L</given-names> </name></person-group><article-title>Statistical modeling: the two cultures (with comments and a rejoinder by the author)</article-title><source>Statist Sci</source><year>2001</year><month>08</month><day>1</day><volume>16</volume><issue>3</issue><pub-id pub-id-type="doi">10.1214/ss/1009213726</pub-id></nlm-citation></ref><ref id="ref16"><label>16</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Choi</surname><given-names>RY</given-names> </name><name name-style="western"><surname>Coyner</surname><given-names>AS</given-names> </name><name name-style="western"><surname>Kalpathy-Cramer</surname><given-names>J</given-names> </name><name name-style="western"><surname>Chiang</surname><given-names>MF</given-names> </name><name name-style="western"><surname>Campbell</surname><given-names>JP</given-names> </name></person-group><article-title>Introduction to machine learning, neural networks, and deep learning</article-title><source>Transl Vis Sci Technol</source><year>2020</year><month>02</month><day>27</day><volume>9</volume><issue>2</issue><fpage>14</fpage><pub-id pub-id-type="doi">10.1167/tvst.9.2.14</pub-id><pub-id pub-id-type="medline">32704420</pub-id></nlm-citation></ref><ref id="ref17"><label>17</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Efron</surname><given-names>B</given-names> </name></person-group><article-title>Prediction, estimation, and attribution</article-title><source>Int Statistical Rev</source><year>2020</year><month>12</month><access-date>2026-02-20</access-date><volume>88</volume><issue>S1</issue><comment><ext-link ext-link-type="uri" xlink:href="https://onlinelibrary.wiley.com/toc/17515823/88/S1">https://onlinelibrary.wiley.com/toc/17515823/88/S1</ext-link></comment><pub-id pub-id-type="doi">10.1111/insr.12409</pub-id></nlm-citation></ref><ref id="ref18"><label>18</label><nlm-citation citation-type="book"><person-group person-group-type="author"><name name-style="western"><surname>Bruce</surname><given-names>PC</given-names> </name><name name-style="western"><surname>Bruce</surname><given-names>A</given-names> </name><name name-style="western"><surname>Gedeck</surname><given-names>P</given-names> </name></person-group><source>Estad&#x00ED;stica Pr&#x00E1;ctica Para Ciencia de Datos Con R y Python: M&#x00E1;s de 50 Conceptos Esenciales</source><year>2022</year><edition>2</edition><publisher-name>Marcombo</publisher-name><pub-id pub-id-type="other">978-84-267-3443-3</pub-id></nlm-citation></ref><ref id="ref19"><label>19</label><nlm-citation citation-type="book"><person-group person-group-type="author"><name name-style="western"><surname>James</surname><given-names>G</given-names> </name><name name-style="western"><surname>Witten</surname><given-names>D</given-names> </name><name name-style="western"><surname>Hastie</surname><given-names>T</given-names> </name><name name-style="western"><surname>Learning</surname><given-names>TRS</given-names> </name></person-group><source>An Introduction to Statistical Learning</source><year>2021</year><publisher-name>Springer</publisher-name><fpage>15</fpage><lpage>57</lpage><pub-id pub-id-type="doi">10.1007/978-1-0716-1418-1_2</pub-id><pub-id pub-id-type="other">978-1-0716-1417-4</pub-id></nlm-citation></ref><ref id="ref20"><label>20</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Saqib</surname><given-names>K</given-names> </name><name name-style="western"><surname>Khan</surname><given-names>AF</given-names> </name><name name-style="western"><surname>Butt</surname><given-names>ZA</given-names> </name></person-group><article-title>Machine learning methods for predicting postpartum depression: scoping review</article-title><source>JMIR Ment Health</source><year>2021</year><month>11</month><day>24</day><volume>8</volume><issue>11</issue><fpage>e29838</fpage><pub-id pub-id-type="doi">10.2196/29838</pub-id><pub-id pub-id-type="medline">34822337</pub-id></nlm-citation></ref><ref id="ref21"><label>21</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Shatte</surname><given-names>ABR</given-names> </name><name name-style="western"><surname>Hutchinson</surname><given-names>DM</given-names> </name><name name-style="western"><surname>Teague</surname><given-names>SJ</given-names> </name></person-group><article-title>Machine learning in mental health: a scoping review of methods and applications</article-title><source>Psychol Med</source><year>2019</year><month>07</month><volume>49</volume><issue>9</issue><fpage>1426</fpage><lpage>1448</lpage><pub-id pub-id-type="doi">10.1017/S0033291719000151</pub-id><pub-id pub-id-type="medline">30744717</pub-id></nlm-citation></ref><ref id="ref22"><label>22</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Ono</surname><given-names>S</given-names> </name><name name-style="western"><surname>Goto</surname><given-names>T</given-names> </name></person-group><article-title>Introduction to supervised machine learning in clinical epidemiology</article-title><source>Ann Clin Epidemiol</source><year>2022</year><volume>4</volume><issue>3</issue><fpage>63</fpage><lpage>71</lpage><pub-id pub-id-type="doi">10.37737/ace.22009</pub-id><pub-id pub-id-type="medline">38504945</pub-id></nlm-citation></ref><ref id="ref23"><label>23</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Bi</surname><given-names>Q</given-names> </name><name name-style="western"><surname>Goodman</surname><given-names>KE</given-names> </name><name name-style="western"><surname>Kaminsky</surname><given-names>J</given-names> </name><name name-style="western"><surname>Lessler</surname><given-names>J</given-names> </name></person-group><article-title>What is machine learning? A primer for the epidemiologist</article-title><source>Am J Epidemiol</source><year>2019</year><month>12</month><day>31</day><volume>188</volume><issue>12</issue><fpage>2222</fpage><lpage>2239</lpage><pub-id pub-id-type="doi">10.1093/aje/kwz189</pub-id><pub-id pub-id-type="medline">31509183</pub-id></nlm-citation></ref><ref id="ref24"><label>24</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Aggarwal</surname><given-names>A</given-names> </name><name name-style="western"><surname>Tam</surname><given-names>CC</given-names> </name><name name-style="western"><surname>Wu</surname><given-names>D</given-names> </name><name name-style="western"><surname>Li</surname><given-names>X</given-names> </name><name name-style="western"><surname>Qiao</surname><given-names>S</given-names> </name></person-group><article-title>Artificial intelligence-based chatbots for promoting health behavioral changes: systematic review</article-title><source>J Med Internet Res</source><year>2023</year><month>02</month><day>24</day><volume>25</volume><fpage>e40789</fpage><pub-id pub-id-type="doi">10.2196/40789</pub-id><pub-id pub-id-type="medline">36826990</pub-id></nlm-citation></ref><ref id="ref25"><label>25</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Goh</surname><given-names>YS</given-names> </name><name name-style="western"><surname>Ow Yong</surname><given-names>JQY</given-names> </name><name name-style="western"><surname>Chee</surname><given-names>BQH</given-names> </name><name name-style="western"><surname>Kuek</surname><given-names>JHL</given-names> </name><name name-style="western"><surname>Ho</surname><given-names>CSH</given-names> </name></person-group><article-title>Machine learning in health promotion and behavioral change: scoping review</article-title><source>J Med Internet Res</source><year>2022</year><month>06</month><day>2</day><volume>24</volume><issue>6</issue><fpage>e35831</fpage><pub-id pub-id-type="doi">10.2196/35831</pub-id><pub-id pub-id-type="medline">35653177</pub-id></nlm-citation></ref><ref id="ref26"><label>26</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lai</surname><given-names>X</given-names> </name><name name-style="western"><surname>Chen</surname><given-names>J</given-names> </name><name name-style="western"><surname>Lai</surname><given-names>Y</given-names> </name><etal/></person-group><article-title>Using large language models to enhance exercise recommendations and physical activity in clinical and healthy populations: scoping review</article-title><source>JMIR Med Inform</source><year>2025</year><month>05</month><day>27</day><volume>13</volume><fpage>e59309</fpage><pub-id pub-id-type="doi">10.2196/59309</pub-id><pub-id pub-id-type="medline">40424584</pub-id></nlm-citation></ref><ref id="ref27"><label>27</label><nlm-citation citation-type="other"><person-group person-group-type="author"><name name-style="western"><surname>Mersha</surname><given-names>M</given-names> </name><name name-style="western"><surname>Wood</surname><given-names>J</given-names> </name><name name-style="western"><surname>AlShami</surname><given-names>A</given-names> </name><name name-style="western"><surname>Kalita</surname><given-names>J</given-names> </name><name name-style="western"><surname>Lam</surname><given-names>K</given-names> </name></person-group><article-title>Explainable artificial intelligence: a survey of needs, techniques, applications, and future direction</article-title><source>arXiv</source><comment>Preprint posted online on  Aug 30, 2024</comment><pub-id pub-id-type="doi">10.48550/ARXIV.2409.00265</pub-id></nlm-citation></ref><ref id="ref28"><label>28</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Ali</surname><given-names>S</given-names> </name><name name-style="western"><surname>Abuhmed</surname><given-names>T</given-names> </name><name name-style="western"><surname>El-Sappagh</surname><given-names>S</given-names> </name><etal/></person-group><article-title>Explainable artificial intelligence (XAI): what we know and what is left to attain trustworthy artificial intelligence</article-title><source>Information Fusion</source><year>2023</year><month>11</month><volume>99</volume><fpage>101805</fpage><pub-id pub-id-type="doi">10.1016/j.inffus.2023.101805</pub-id></nlm-citation></ref><ref id="ref29"><label>29</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Munn</surname><given-names>Z</given-names> </name><name name-style="western"><surname>Peters</surname><given-names>MDJ</given-names> </name><name name-style="western"><surname>Stern</surname><given-names>C</given-names> </name><name name-style="western"><surname>Tufanaru</surname><given-names>C</given-names> </name><name name-style="western"><surname>McArthur</surname><given-names>A</given-names> </name><name name-style="western"><surname>Aromataris</surname><given-names>E</given-names> </name></person-group><article-title>Systematic review or scoping review? Guidance for authors when choosing between a systematic or scoping review approach</article-title><source>BMC Med Res Methodol</source><year>2018</year><month>11</month><day>19</day><volume>18</volume><issue>1</issue><fpage>143</fpage><pub-id pub-id-type="doi">10.1186/s12874-018-0611-x</pub-id><pub-id pub-id-type="medline">30453902</pub-id></nlm-citation></ref><ref id="ref30"><label>30</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Tricco</surname><given-names>AC</given-names> </name><name name-style="western"><surname>Lillie</surname><given-names>E</given-names> </name><name name-style="western"><surname>Zarin</surname><given-names>W</given-names> </name><etal/></person-group><article-title>PRISMA Extension for Scoping Reviews (PRISMA-ScR): checklist and explanation</article-title><source>Ann Intern Med</source><year>2018</year><month>10</month><day>2</day><volume>169</volume><issue>7</issue><fpage>467</fpage><lpage>473</lpage><pub-id pub-id-type="doi">10.7326/M18-0850</pub-id><pub-id pub-id-type="medline">30178033</pub-id></nlm-citation></ref><ref id="ref31"><label>31</label><nlm-citation citation-type="web"><person-group person-group-type="author"><name name-style="western"><surname>Estrella</surname><given-names>T</given-names> </name><name name-style="western"><surname>Alfonso</surname><given-names>C</given-names> </name><name name-style="western"><surname>Capdevila</surname><given-names>L</given-names> </name><name name-style="western"><surname>Losilla</surname><given-names>JM</given-names> </name></person-group><article-title>Machine learning for the analysis of healthy lifestyle data: a scoping review protocol</article-title><source>Universitat Aut&#x00F2;noma de Barcelona</source><year>2023</year><month>03</month><access-date>2026-02-20</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://portalrecerca.uab.cat/en/publications/machine-learning-for-the-analysis-of-healthy-lifestyle-data-a-sco/">https://portalrecerca.uab.cat/en/publications/machine-learning-for-the-analysis-of-healthy-lifestyle-data-a-sco/</ext-link></comment></nlm-citation></ref><ref id="ref32"><label>32</label><nlm-citation citation-type="report"><person-group person-group-type="author"><name name-style="western"><surname>Estrella</surname><given-names>T</given-names> </name><name name-style="western"><surname>Capdevila</surname><given-names>L</given-names> </name><name name-style="western"><surname>Alfonso</surname><given-names>C</given-names> </name><name name-style="western"><surname>Losilla</surname><given-names>JM</given-names> </name></person-group><article-title>Replication data for machine learning for the analysis of healthy lifestyle data: a scoping review</article-title><year>2024</year><publisher-name>CORA.Repositori de Dades de Recerca</publisher-name><pub-id pub-id-type="doi">10.34810/DATA1088</pub-id></nlm-citation></ref><ref id="ref33"><label>33</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>McGowan</surname><given-names>J</given-names> </name><name name-style="western"><surname>Sampson</surname><given-names>M</given-names> </name><name name-style="western"><surname>Salzwedel</surname><given-names>DM</given-names> </name><name name-style="western"><surname>Cogo</surname><given-names>E</given-names> </name><name name-style="western"><surname>Foerster</surname><given-names>V</given-names> </name><name name-style="western"><surname>Lefebvre</surname><given-names>C</given-names> </name></person-group><article-title>PRESS Peer Review of Electronic Search Strategies: 2015 guideline statement</article-title><source>J Clin Epidemiol</source><year>2016</year><month>07</month><volume>75</volume><fpage>40</fpage><lpage>46</lpage><pub-id pub-id-type="doi">10.1016/j.jclinepi.2016.01.021</pub-id><pub-id pub-id-type="medline">27005575</pub-id></nlm-citation></ref><ref id="ref34"><label>34</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Rethlefsen</surname><given-names>ML</given-names> </name><name name-style="western"><surname>Kirtley</surname><given-names>S</given-names> </name><name name-style="western"><surname>Waffenschmidt</surname><given-names>S</given-names> </name><etal/></person-group><article-title>PRISMA-S: an extension to the PRISMA Statement for reporting literature searches in systematic reviews</article-title><source>Syst Rev</source><year>2021</year><month>01</month><day>26</day><volume>10</volume><issue>1</issue><fpage>39</fpage><pub-id pub-id-type="doi">10.1186/s13643-020-01542-z</pub-id><pub-id pub-id-type="medline">33499930</pub-id></nlm-citation></ref><ref id="ref35"><label>35</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Loef</surname><given-names>M</given-names> </name><name name-style="western"><surname>Walach</surname><given-names>H</given-names> </name></person-group><article-title>The combined effects of healthy lifestyle behaviors on all cause mortality: a systematic review and meta-analysis</article-title><source>Prev Med</source><year>2012</year><month>09</month><volume>55</volume><issue>3</issue><fpage>163</fpage><lpage>170</lpage><pub-id pub-id-type="doi">10.1016/j.ypmed.2012.06.017</pub-id><pub-id pub-id-type="medline">22735042</pub-id></nlm-citation></ref><ref id="ref36"><label>36</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Yu</surname><given-names>J</given-names> </name><name name-style="western"><surname>Feng</surname><given-names>Q</given-names> </name><name name-style="western"><surname>Kim</surname><given-names>JH</given-names> </name><name name-style="western"><surname>Zhu</surname><given-names>Y</given-names> </name></person-group><article-title>Combined effect of healthy lifestyle factors and risks of colorectal adenoma, colorectal cancer, and colorectal cancer mortality: systematic review and meta-analysis</article-title><source>Front Oncol</source><year>2022</year><month>07</month><day>22</day><volume>12</volume><fpage>827019</fpage><pub-id pub-id-type="doi">10.3389/fonc.2022.827019</pub-id></nlm-citation></ref><ref id="ref37"><label>37</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lippman</surname><given-names>D</given-names> </name><name name-style="western"><surname>Stump</surname><given-names>M</given-names> </name><name name-style="western"><surname>Veazey</surname><given-names>E</given-names> </name><etal/></person-group><article-title>Foundations of lifestyle medicine and its evolution</article-title><source>Mayo Clin Proc Innov Qual Outcomes</source><year>2024</year><month>02</month><volume>8</volume><issue>1</issue><fpage>97</fpage><lpage>111</lpage><pub-id pub-id-type="doi">10.1016/j.mayocpiqo.2023.11.004</pub-id><pub-id pub-id-type="medline">38304165</pub-id></nlm-citation></ref><ref id="ref38"><label>38</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Sayburn</surname><given-names>A</given-names> </name></person-group><article-title>Lifestyle medicine: a new medical specialty?</article-title><source>BMJ</source><year>2018</year><month>10</month><day>25</day><fpage>k4442</fpage><pub-id pub-id-type="doi">10.1136/bmj.k4442</pub-id></nlm-citation></ref><ref id="ref39"><label>39</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Fleig</surname><given-names>L</given-names> </name><name name-style="western"><surname>Ngo</surname><given-names>J</given-names> </name><name name-style="western"><surname>Roman</surname><given-names>B</given-names> </name><etal/></person-group><article-title>Beyond single behaviour theory: adding cross&#x2010;behaviour cognitions to the health action process approach</article-title><source>British J Health Psychol</source><year>2015</year><month>11</month><access-date>2026-02-20</access-date><volume>20</volume><issue>4</issue><fpage>824</fpage><lpage>841</lpage><comment><ext-link ext-link-type="uri" xlink:href="https://bpspsychub.onlinelibrary.wiley.com/toc/20448287/20/4">https://bpspsychub.onlinelibrary.wiley.com/toc/20448287/20/4</ext-link></comment><pub-id pub-id-type="doi">10.1111/bjhp.12144</pub-id></nlm-citation></ref><ref id="ref40"><label>40</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Butkevi&#x010D;i&#x016B;t&#x0117;</surname><given-names>E</given-names> </name><name name-style="western"><surname>Bikul&#x010D;ien&#x0117;</surname><given-names>L</given-names> </name><name name-style="western"><surname>&#x017D;vironien&#x0117;</surname><given-names>A</given-names> </name></person-group><article-title>Physiological state evaluation in working environment using expert system and random forest machine learning algorithm</article-title><source>Healthcare (Basel)</source><year>2023</year><month>01</month><day>11</day><volume>11</volume><issue>2</issue><fpage>220</fpage><pub-id pub-id-type="doi">10.3390/healthcare11020220</pub-id><pub-id pub-id-type="medline">36673588</pub-id></nlm-citation></ref><ref id="ref41"><label>41</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Cai</surname><given-names>T</given-names> </name><name name-style="western"><surname>Long</surname><given-names>J</given-names> </name><name name-style="western"><surname>Kuang</surname><given-names>J</given-names> </name><name name-style="western"><surname>You</surname><given-names>F</given-names> </name><name name-style="western"><surname>Zou</surname><given-names>T</given-names> </name><name name-style="western"><surname>Wu</surname><given-names>L</given-names> </name></person-group><article-title>Applying machine learning methods to develop a successful aging maintenance prediction model based on physical fitness tests</article-title><source>Geriatrics Gerontology Int</source><year>2020</year><month>06</month><volume>20</volume><issue>6</issue><fpage>637</fpage><lpage>642</lpage><pub-id pub-id-type="doi">10.1111/ggi.13926</pub-id></nlm-citation></ref><ref id="ref42"><label>42</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lim</surname><given-names>J</given-names> </name><name name-style="western"><surname>Kim</surname><given-names>J</given-names> </name><name name-style="western"><surname>Cheon</surname><given-names>S</given-names> </name></person-group><article-title>A deep neural network-based method for early detection of osteoarthritis using statistical data</article-title><source>Int J Environ Res Public Health</source><year>2019</year><month>04</month><day>10</day><volume>16</volume><issue>7</issue><fpage>1281</fpage><pub-id pub-id-type="doi">10.3390/ijerph16071281</pub-id><pub-id pub-id-type="medline">30974803</pub-id></nlm-citation></ref><ref id="ref43"><label>43</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Recenti</surname><given-names>M</given-names> </name><name name-style="western"><surname>Ricciardi</surname><given-names>C</given-names> </name><name name-style="western"><surname>Edmunds</surname><given-names>KJ</given-names> </name><etal/></person-group><article-title>Healthy aging within an image: using muscle radiodensitometry and lifestyle factors to predict diabetes and hypertension</article-title><source>IEEE J Biomed Health Inform</source><year>2021</year><month>06</month><volume>25</volume><issue>6</issue><fpage>2103</fpage><lpage>2112</lpage><pub-id pub-id-type="doi">10.1109/JBHI.2020.3044158</pub-id><pub-id pub-id-type="medline">33306475</pub-id></nlm-citation></ref><ref id="ref44"><label>44</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Recenti</surname><given-names>M</given-names> </name><name name-style="western"><surname>Ricciardi</surname><given-names>C</given-names> </name><name name-style="western"><surname>Edmunds</surname><given-names>K</given-names> </name><name name-style="western"><surname>Jacob</surname><given-names>D</given-names> </name><name name-style="western"><surname>Gambacorta</surname><given-names>M</given-names> </name><name name-style="western"><surname>Gargiulo</surname><given-names>P</given-names> </name></person-group><article-title>Testing soft tissue radiodensity parameters interplay with age and self-reported physical activity</article-title><source>Eur J Transl Myol</source><year>2021</year><month>07</month><day>12</day><volume>31</volume><issue>3</issue><fpage>9929</fpage><pub-id pub-id-type="doi">10.4081/ejtm.2021.9929</pub-id><pub-id pub-id-type="medline">34251162</pub-id></nlm-citation></ref><ref id="ref45"><label>45</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Staudenmayer</surname><given-names>J</given-names> </name><name name-style="western"><surname>He</surname><given-names>S</given-names> </name><name name-style="western"><surname>Hickey</surname><given-names>A</given-names> </name><name name-style="western"><surname>Sasaki</surname><given-names>J</given-names> </name><name name-style="western"><surname>Freedson</surname><given-names>P</given-names> </name></person-group><article-title>Methods to estimate aspects of physical activity and sedentary behavior from high-frequency wrist accelerometer measurements</article-title><source>J Appl Physiol</source><year>2015</year><month>08</month><day>15</day><volume>119</volume><issue>4</issue><fpage>396</fpage><lpage>403</lpage><pub-id pub-id-type="doi">10.1152/japplphysiol.00026.2015</pub-id></nlm-citation></ref><ref id="ref46"><label>46</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Zhou</surname><given-names>M</given-names> </name><name name-style="western"><surname>Fukuoka</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Goldberg</surname><given-names>K</given-names> </name><name name-style="western"><surname>Vittinghoff</surname><given-names>E</given-names> </name><name name-style="western"><surname>Aswani</surname><given-names>A</given-names> </name></person-group><article-title>Applying machine learning to predict future adherence to physical activity programs</article-title><source>BMC Med Inform Decis Mak</source><year>2019</year><month>08</month><day>22</day><volume>19</volume><issue>1</issue><fpage>169</fpage><pub-id pub-id-type="doi">10.1186/s12911-019-0890-0</pub-id><pub-id pub-id-type="medline">31438926</pub-id></nlm-citation></ref><ref id="ref47"><label>47</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Dianati-Nasab</surname><given-names>M</given-names> </name><name name-style="western"><surname>Salimifard</surname><given-names>K</given-names> </name><name name-style="western"><surname>Mohammadi</surname><given-names>R</given-names> </name><etal/></person-group><article-title>Machine learning algorithms to uncover risk factors of breast cancer: insights from a large case-control study</article-title><source>Front Oncol</source><year>2023</year><volume>13</volume><fpage>1276232</fpage><pub-id pub-id-type="doi">10.3389/fonc.2023.1276232</pub-id><pub-id pub-id-type="medline">38425674</pub-id></nlm-citation></ref><ref id="ref48"><label>48</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Matta</surname><given-names>SC</given-names> </name><name name-style="western"><surname>Sankari</surname><given-names>Z</given-names> </name><name name-style="western"><surname>Rihana</surname><given-names>S</given-names> </name></person-group><article-title>Heart rate variability analysis using neural network models for automatic detection of lifestyle activities</article-title><source>Biomed SIGNAL Process CONTROL</source><year>2018</year><month>04</month><volume>42</volume><fpage>145</fpage><lpage>157</lpage><pub-id pub-id-type="doi">10.1016/j.bspc.2018.01.016</pub-id></nlm-citation></ref><ref id="ref49"><label>49</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Park</surname><given-names>H</given-names> </name><name name-style="western"><surname>Jung</surname><given-names>SY</given-names> </name><name name-style="western"><surname>Han</surname><given-names>MK</given-names> </name><etal/></person-group><article-title>Lowering barriers to health risk assessments in promoting personalized health management</article-title><source>J Pers Med</source><year>2024</year><month>03</month><day>18</day><volume>14</volume><issue>3</issue><fpage>316</fpage><pub-id pub-id-type="doi">10.3390/jpm14030316</pub-id><pub-id pub-id-type="medline">38541058</pub-id></nlm-citation></ref><ref id="ref50"><label>50</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Li</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Song</surname><given-names>H</given-names> </name></person-group><article-title>The association between sports social capital and cognitive health: a longitudinal study of middle-aged and elderly adults in China</article-title><source>SSM Popul Health</source><year>2025</year><month>06</month><volume>30</volume><fpage>101778</fpage><pub-id pub-id-type="doi">10.1016/j.ssmph.2025.101778</pub-id><pub-id pub-id-type="medline">40212736</pub-id></nlm-citation></ref><ref id="ref51"><label>51</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lin</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Li</surname><given-names>C</given-names> </name><name name-style="western"><surname>Wang</surname><given-names>X</given-names> </name><name name-style="western"><surname>Li</surname><given-names>H</given-names> </name></person-group><article-title>Development of a machine learning-based risk assessment model for loneliness among elderly Chinese: a cross-sectional study based on Chinese longitudinal healthy longevity survey</article-title><source>BMC Geriatr</source><year>2024</year><month>11</month><day>14</day><volume>24</volume><issue>1</issue><pub-id pub-id-type="doi">10.1186/s12877-024-05443-x</pub-id></nlm-citation></ref><ref id="ref52"><label>52</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Ren</surname><given-names>H</given-names> </name><name name-style="western"><surname>Zheng</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Li</surname><given-names>C</given-names> </name><etal/></person-group><article-title>Using machine learning to predict cognitive decline in older adults from the Chinese longitudinal healthy longevity survey: model development and validation study</article-title><source>JMIR Aging</source><year>2025</year><month>04</month><day>30</day><volume>8</volume><fpage>e67437</fpage><pub-id pub-id-type="doi">10.2196/67437</pub-id><pub-id pub-id-type="medline">40305830</pub-id></nlm-citation></ref><ref id="ref53"><label>53</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Liu</surname><given-names>X</given-names> </name><name name-style="western"><surname>Luo</surname><given-names>Z</given-names> </name><name name-style="western"><surname>Jing</surname><given-names>F</given-names> </name><etal/></person-group><article-title>Estimating cardiovascular mortality in patients with hypertension using machine learning: the role of depression classification based on lifestyle and physical activity</article-title><source>J Psychosom Res</source><year>2025</year><month>02</month><volume>189</volume><fpage>112030</fpage><pub-id pub-id-type="doi">10.1016/j.jpsychores.2024.112030</pub-id><pub-id pub-id-type="medline">39752763</pub-id></nlm-citation></ref><ref id="ref54"><label>54</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Am&#x00FA; Ruiz</surname><given-names>FA</given-names> </name><name name-style="western"><surname>Gonzalez Bustamante</surname><given-names>DA</given-names> </name><name name-style="western"><surname>Ortiz Gonz&#x00E1;lez</surname><given-names>K</given-names> </name><name name-style="western"><surname>Sandoval</surname><given-names>KM</given-names> </name></person-group><article-title>&#x00C1;rbol de clasificaci&#x00F3;n para la identificaci&#x00F3;n de s&#x00ED;ntomas asociados a la depresi&#x00F3;n en estudiantes de una universidad p&#x00FA;blica (Classification tree for the identification of symptoms associated with depression in students of a public university)</article-title><source>Retos</source><year>2024</year><volume>52</volume><fpage>104</fpage><lpage>114</lpage><pub-id pub-id-type="doi">10.47197/retos.v52.100138</pub-id></nlm-citation></ref><ref id="ref55"><label>55</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Wallace</surname><given-names>ML</given-names> </name><name name-style="western"><surname>Coleman</surname><given-names>TS</given-names> </name><name name-style="western"><surname>Mentch</surname><given-names>LK</given-names> </name><etal/></person-group><article-title>Physiological sleep measures predict time to 15&#x2010;year mortality in community adults: application of a novel machine learning framework</article-title><source>J Sleep Res</source><year>2021</year><month>12</month><volume>30</volume><issue>6</issue><fpage>e13386</fpage><pub-id pub-id-type="doi">10.1111/jsr.13386</pub-id><pub-id pub-id-type="medline">33991144</pub-id></nlm-citation></ref><ref id="ref56"><label>56</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Su</surname><given-names>W</given-names> </name><name name-style="western"><surname>Jia</surname><given-names>H</given-names> </name><name name-style="western"><surname>Chang</surname><given-names>W</given-names> </name><etal/></person-group><article-title>The secrets of medical students&#x2019; psychological resilience: a dual perspective of machine learning and path analysis</article-title><source>Int J Med Inform</source><year>2026</year><month>01</month><volume>205</volume><fpage>106111</fpage><pub-id pub-id-type="doi">10.1016/j.ijmedinf.2025.106111</pub-id></nlm-citation></ref><ref id="ref57"><label>57</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Luo</surname><given-names>W</given-names> </name><name name-style="western"><surname>Gong</surname><given-names>L</given-names> </name><name name-style="western"><surname>Chen</surname><given-names>X</given-names> </name><etal/></person-group><article-title>Lifestyle and chronic kidney disease: a machine learning modeling study</article-title><source>Front Nutr</source><year>2022</year><volume>9</volume><fpage>918576</fpage><pub-id pub-id-type="doi">10.3389/fnut.2022.918576</pub-id><pub-id pub-id-type="medline">35938107</pub-id></nlm-citation></ref><ref id="ref58"><label>58</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Afrash</surname><given-names>MR</given-names> </name><name name-style="western"><surname>Bayani</surname><given-names>A</given-names> </name><name name-style="western"><surname>Shanbehzadeh</surname><given-names>M</given-names> </name><name name-style="western"><surname>Bahadori</surname><given-names>M</given-names> </name><name name-style="western"><surname>Kazemi-Arpanahi</surname><given-names>H</given-names> </name></person-group><article-title>Developing the breast cancer risk prediction system using hybrid machine learning algorithms</article-title><source>J Educ Health Promot</source><year>2022</year><volume>11</volume><fpage>272</fpage><pub-id pub-id-type="doi">10.4103/jehp.jehp_42_22</pub-id><pub-id pub-id-type="medline">36325225</pub-id></nlm-citation></ref><ref id="ref59"><label>59</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Alshurafa</surname><given-names>N</given-names> </name><name name-style="western"><surname>Sideris</surname><given-names>C</given-names> </name><name name-style="western"><surname>Pourhomayoun</surname><given-names>M</given-names> </name><name name-style="western"><surname>Kalantarian</surname><given-names>H</given-names> </name><name name-style="western"><surname>Sarrafzadeh</surname><given-names>M</given-names> </name><name name-style="western"><surname>Eastwood</surname><given-names>JA</given-names> </name></person-group><article-title>Remote health monitoring outcome success prediction using baseline and first month intervention data</article-title><source>IEEE J Biomed Health Inform</source><year>2017</year><month>03</month><volume>21</volume><issue>2</issue><fpage>507</fpage><lpage>514</lpage><pub-id pub-id-type="doi">10.1109/JBHI.2016.2518673</pub-id><pub-id pub-id-type="medline">26780823</pub-id></nlm-citation></ref><ref id="ref60"><label>60</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Gu</surname><given-names>X</given-names> </name><name name-style="western"><surname>Li</surname><given-names>Q</given-names> </name><name name-style="western"><surname>Wang</surname><given-names>X</given-names> </name></person-group><article-title>Using Life&#x2019;s Essential 8 and heavy metal exposure to determine infertility risk in American women: a machine learning prediction model based on the SHAP method</article-title><source>Front Endocrinol (Lausanne)</source><year>2025</year><volume>16</volume><fpage>1586828</fpage><pub-id pub-id-type="doi">10.3389/fendo.2025.1586828</pub-id><pub-id pub-id-type="medline">40687585</pub-id></nlm-citation></ref><ref id="ref61"><label>61</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Nichols</surname><given-names>ES</given-names> </name><name name-style="western"><surname>Pathak</surname><given-names>HS</given-names> </name><name name-style="western"><surname>Bgeginski</surname><given-names>R</given-names> </name><etal/></person-group><article-title>Machine learning-based predictive modeling of resilience to stressors in pregnant women during COVID-19: a prospective cohort study</article-title><source>PLoS ONE</source><year>2022</year><volume>17</volume><issue>8</issue><fpage>e0272862</fpage><pub-id pub-id-type="doi">10.1371/journal.pone.0272862</pub-id><pub-id pub-id-type="medline">35951588</pub-id></nlm-citation></ref><ref id="ref62"><label>62</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>B&#x00F4;to</surname><given-names>JM</given-names> </name><name name-style="western"><surname>Marreiros</surname><given-names>A</given-names> </name><name name-style="western"><surname>Diogo</surname><given-names>P</given-names> </name><etal/></person-group><article-title>Health behaviours as predictors of the Mediterranean diet adherence: a decision tree approach</article-title><source>Public Health Nutr</source><year>2022</year><month>07</month><volume>25</volume><issue>7</issue><fpage>1864</fpage><lpage>1876</lpage><pub-id pub-id-type="doi">10.1017/S1368980021003293</pub-id><pub-id pub-id-type="medline">34369348</pub-id></nlm-citation></ref><ref id="ref63"><label>63</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Huang</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Huang</surname><given-names>Z</given-names> </name><name name-style="western"><surname>Yang</surname><given-names>Q</given-names> </name><etal/></person-group><article-title>Predicting mild cognitive impairment among Chinese older adults: a longitudinal study based on long short-term memory networks and machine learning</article-title><source>Front AGING Neurosci</source><year>2023</year><volume>15</volume><pub-id pub-id-type="doi">10.3389/fnagi.2023.1283243</pub-id></nlm-citation></ref><ref id="ref64"><label>64</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kiss</surname><given-names>O</given-names> </name><name name-style="western"><surname>Alzueta</surname><given-names>E</given-names> </name><name name-style="western"><surname>Yuksel</surname><given-names>D</given-names> </name><etal/></person-group><article-title>The pandemic&#x2019;s toll on young adolescents: prevention and intervention targets to preserve their mental health</article-title><source>J Adolesc Health</source><year>2022</year><month>03</month><volume>70</volume><issue>3</issue><fpage>387</fpage><lpage>395</lpage><pub-id pub-id-type="doi">10.1016/j.jadohealth.2021.11.023</pub-id><pub-id pub-id-type="medline">35090817</pub-id></nlm-citation></ref><ref id="ref65"><label>65</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Majcherek</surname><given-names>D</given-names> </name><name name-style="western"><surname>Ciesielski</surname><given-names>A</given-names> </name><name name-style="western"><surname>Sobczak</surname><given-names>P</given-names> </name></person-group><article-title>AI-driven analysis of diabetes risk determinants in U.S. adults: exploring disease prevalence and health factors</article-title><source>PLoS ONE</source><year>2025</year><volume>20</volume><issue>9</issue><fpage>e0328655</fpage><pub-id pub-id-type="doi">10.1371/journal.pone.0328655</pub-id><pub-id pub-id-type="medline">40901823</pub-id></nlm-citation></ref><ref id="ref66"><label>66</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Mousavi</surname><given-names>H</given-names> </name><name name-style="western"><surname>Karandish</surname><given-names>M</given-names> </name><name name-style="western"><surname>Jamshidnezhad</surname><given-names>A</given-names> </name><name name-style="western"><surname>Hadianfard</surname><given-names>AM</given-names> </name></person-group><article-title>Determining the effective factors in predicting diet adherence using an intelligent model</article-title><source>Sci Rep</source><year>2022</year><month>07</month><day>19</day><volume>12</volume><issue>1</issue><fpage>12340</fpage><pub-id pub-id-type="doi">10.1038/s41598-022-16680-8</pub-id><pub-id pub-id-type="medline">35853992</pub-id></nlm-citation></ref><ref id="ref67"><label>67</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Jin</surname><given-names>T</given-names> </name><name name-style="western"><surname>Halili</surname><given-names>A</given-names> </name></person-group><article-title>Predicting the risk of depression in older adults with disability using machine learning: an analysis based on CHARLS data</article-title><source>Front Artif Intell</source><year>2025</year><volume>8</volume><fpage>1624171</fpage><pub-id pub-id-type="doi">10.3389/frai.2025.1624171</pub-id><pub-id pub-id-type="medline">40673213</pub-id></nlm-citation></ref><ref id="ref68"><label>68</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Luo</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Guo</surname><given-names>M</given-names> </name><name name-style="western"><surname>Zhang</surname><given-names>Q</given-names> </name></person-group><article-title>Cross-national analysis of social determinants of frailty among middle-aged and older adults: a machine learning study in the USA, England, and China</article-title><source>Humanit Soc Sci Commun</source><year>2025</year><month>05</month><day>30</day><volume>12</volume><issue>1</issue><pub-id pub-id-type="doi">10.1057/s41599-025-05088-0</pub-id></nlm-citation></ref><ref id="ref69"><label>69</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Puterman</surname><given-names>E</given-names> </name><name name-style="western"><surname>Weiss</surname><given-names>J</given-names> </name><name name-style="western"><surname>Hives</surname><given-names>BA</given-names> </name><etal/></person-group><article-title>Predicting mortality from 57 economic, behavioral, social, and psychological factors</article-title><source>Proc Natl Acad Sci USA</source><year>2020</year><month>07</month><day>14</day><volume>117</volume><issue>28</issue><fpage>16273</fpage><lpage>16282</lpage><pub-id pub-id-type="doi">10.1073/pnas.1918455117</pub-id></nlm-citation></ref><ref id="ref70"><label>70</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Qasrawi</surname><given-names>R</given-names> </name><name name-style="western"><surname>Vicuna Polo</surname><given-names>S</given-names> </name><name name-style="western"><surname>Abu Khader</surname><given-names>R</given-names> </name><etal/></person-group><article-title>Machine learning techniques for identifying mental health risk factor associated with schoolchildren cognitive ability living in politically violent environments</article-title><source>Front PSYCHIATRY</source><year>2023</year><volume>14</volume><fpage>1071622</fpage><pub-id pub-id-type="doi">10.3389/fpsyt.2023.1071622</pub-id><pub-id pub-id-type="medline">37304448</pub-id></nlm-citation></ref><ref id="ref71"><label>71</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Zhou</surname><given-names>X</given-names> </name><name name-style="western"><surname>Wang</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Chang</surname><given-names>Q</given-names> </name><etal/></person-group><article-title>Lifestyle-associated serum metabolites profiling in relation to risk of late-onset psoriasis</article-title><source>J Eur Acad Dermatol Venereol</source><year>2025</year><month>09</month><pub-id pub-id-type="doi">10.2139/ssrn.5085567</pub-id><pub-id pub-id-type="medline">40956048</pub-id></nlm-citation></ref><ref id="ref72"><label>72</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Abdul Rahman</surname><given-names>H</given-names> </name><name name-style="western"><surname>Kwicklis</surname><given-names>M</given-names> </name><name name-style="western"><surname>Ottom</surname><given-names>M</given-names> </name><etal/></person-group><article-title>Machine learning-based prediction of mental well-being using health behavior data from university students</article-title><source>Bioengineering (Basel)</source><year>2023</year><month>05</month><day>10</day><volume>10</volume><issue>5</issue><fpage>575</fpage><pub-id pub-id-type="doi">10.3390/bioengineering10050575</pub-id><pub-id pub-id-type="medline">37237644</pub-id></nlm-citation></ref><ref id="ref73"><label>73</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Cort&#x00E9;s-Iba&#x00F1;ez</surname><given-names>FO</given-names> </name><name name-style="western"><surname>Nagaraj</surname><given-names>SB</given-names> </name><name name-style="western"><surname>Cornelissen</surname><given-names>L</given-names> </name><etal/></person-group><article-title>Prediction of incident cancers in the lifelines population-based cohort</article-title><source>Cancers (Basel)</source><year>2021</year><month>04</month><day>28</day><volume>13</volume><issue>9</issue><fpage>2133</fpage><pub-id pub-id-type="doi">10.3390/cancers13092133</pub-id><pub-id pub-id-type="medline">33925159</pub-id></nlm-citation></ref><ref id="ref74"><label>74</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Cort&#x00E9;s-Iba&#x00F1;ez</surname><given-names>FO</given-names> </name><name name-style="western"><surname>Belur Nagaraj</surname><given-names>S</given-names> </name><name name-style="western"><surname>Cornelissen</surname><given-names>L</given-names> </name><name name-style="western"><surname>Sidorenkov</surname><given-names>G</given-names> </name><name name-style="western"><surname>de Bock</surname><given-names>GH</given-names> </name></person-group><article-title>A classification approach for cancer survivors from those cancer-free, based on health behaviors: analysis of the lifelines cohort</article-title><source>CANCERS (Basel)</source><year>2021</year><month>05</month><day>12</day><volume>13</volume><issue>10</issue><fpage>2335</fpage><pub-id pub-id-type="doi">10.3390/cancers13102335</pub-id><pub-id pub-id-type="medline">34066093</pub-id></nlm-citation></ref><ref id="ref75"><label>75</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Faruqui</surname><given-names>SHA</given-names> </name><name name-style="western"><surname>Du</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Meka</surname><given-names>R</given-names> </name><etal/></person-group><article-title>Development of a deep learning model for dynamic forecasting of blood glucose level for type 2 diabetes mellitus: secondary analysis of a randomized controlled trial</article-title><source>JMIR Mhealth Uhealth</source><year>2019</year><month>11</month><day>1</day><volume>7</volume><issue>11</issue><fpage>e14452</fpage><pub-id pub-id-type="doi">10.2196/14452</pub-id><pub-id pub-id-type="medline">31682586</pub-id></nlm-citation></ref><ref id="ref76"><label>76</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Guthrie</surname><given-names>NL</given-names> </name><name name-style="western"><surname>Carpenter</surname><given-names>J</given-names> </name><name name-style="western"><surname>Edwards</surname><given-names>KL</given-names> </name><etal/></person-group><article-title>Emergence of digital biomarkers to predict and modify treatment efficacy: machine learning study</article-title><source>BMJ Open</source><year>2019</year><month>07</month><day>23</day><volume>9</volume><issue>7</issue><fpage>e030710</fpage><pub-id pub-id-type="doi">10.1136/bmjopen-2019-030710</pub-id><pub-id pub-id-type="medline">31337662</pub-id></nlm-citation></ref><ref id="ref77"><label>77</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Hu</surname><given-names>L</given-names> </name><name name-style="western"><surname>Liu</surname><given-names>B</given-names> </name><name name-style="western"><surname>Li</surname><given-names>Y</given-names> </name></person-group><article-title>Ranking sociodemographic, health behavior, prevention, and environmental factors in predicting neighborhood cardiovascular health: a Bayesian machine learning approach</article-title><source>Prev Med</source><year>2020</year><month>12</month><volume>141</volume><fpage>106240</fpage><pub-id pub-id-type="doi">10.1016/j.ypmed.2020.106240</pub-id><pub-id pub-id-type="medline">32860821</pub-id></nlm-citation></ref><ref id="ref78"><label>78</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Hu</surname><given-names>L</given-names> </name><name name-style="western"><surname>Liu</surname><given-names>B</given-names> </name><name name-style="western"><surname>Ji</surname><given-names>J</given-names> </name><name name-style="western"><surname>Li</surname><given-names>Y</given-names> </name></person-group><article-title>Tree-based machine learning to identify and understand major determinants for stroke at the neighborhood level</article-title><source>J Am Heart Assoc</source><year>2020</year><month>11</month><day>17</day><volume>9</volume><issue>22</issue><fpage>e016745</fpage><pub-id pub-id-type="doi">10.1161/JAHA.120.016745</pub-id><pub-id pub-id-type="medline">33140687</pub-id></nlm-citation></ref><ref id="ref79"><label>79</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Luo</surname><given-names>L</given-names> </name><name name-style="western"><surname>Yuan</surname><given-names>J</given-names> </name><name name-style="western"><surname>Xu</surname><given-names>C</given-names> </name><etal/></person-group><article-title>Mental health issues and 24-Hour movement guidelines&#x2013;based intervention strategies for university students with high-risk social network addiction: cross-sectional study using a machine learning approach</article-title><source>J Med Internet Res</source><year>2025</year><month>06</month><day>13</day><volume>27</volume><fpage>e72260</fpage><pub-id pub-id-type="doi">10.2196/72260</pub-id><pub-id pub-id-type="medline">40512996</pub-id></nlm-citation></ref><ref id="ref80"><label>80</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Majcherek</surname><given-names>D</given-names> </name><name name-style="western"><surname>Kowalski</surname><given-names>AM</given-names> </name><name name-style="western"><surname>Lewandowska</surname><given-names>MS</given-names> </name></person-group><article-title>Lifestyle, demographic and socio-economic determinants of mental health disorders of employees in the European countries</article-title><source>Int J Environ Res Public Health</source><year>2022</year><month>09</month><day>21</day><volume>19</volume><issue>19</issue><fpage>11913</fpage><pub-id pub-id-type="doi">10.3390/ijerph191911913</pub-id><pub-id pub-id-type="medline">36231214</pub-id></nlm-citation></ref><ref id="ref81"><label>81</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Mun</surname><given-names>EY</given-names> </name><name name-style="western"><surname>Geng</surname><given-names>F</given-names> </name></person-group><article-title>Predicting post-experiment fatigue among healthy young adults: random forest regression analysis</article-title><source>Psychol Test Assess Model</source><year>2019</year><month>11</month><day>8</day><volume>61</volume><issue>4</issue><fpage>471</fpage><lpage>493</lpage><pub-id pub-id-type="medline">32038903</pub-id></nlm-citation></ref><ref id="ref82"><label>82</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Park</surname><given-names>J</given-names> </name><name name-style="western"><surname>Edington</surname><given-names>DW</given-names> </name></person-group><article-title>Application of a prediction model for identification of individuals at diabetic risk</article-title><source>Methods Inf Med</source><year>2004</year><volume>43</volume><issue>3</issue><fpage>273</fpage><lpage>281</lpage><pub-id pub-id-type="medline">15227557</pub-id></nlm-citation></ref><ref id="ref83"><label>83</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Park</surname><given-names>S</given-names> </name></person-group><article-title>Association of a high healthy eating index diet with long-term visceral fat loss in a large longitudinal study</article-title><source>Nutrients</source><year>2024</year><month>02</month><volume>16</volume><issue>4</issue><fpage>534</fpage><pub-id pub-id-type="doi">10.3390/nu16040534</pub-id></nlm-citation></ref><ref id="ref84"><label>84</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Shi</surname><given-names>H</given-names> </name><name name-style="western"><surname>Fang</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Ma</surname><given-names>X</given-names> </name></person-group><article-title>Application of machine learning algorithms in osteoporosis analysis based on cardiovascular health assessed by life&#x2019;s essential 8: a cross-sectional study</article-title><source>J Health Popul Nutr</source><year>2025</year><month>05</month><day>29</day><volume>44</volume><issue>1</issue><pub-id pub-id-type="doi">10.1186/s41043-025-00941-z</pub-id></nlm-citation></ref><ref id="ref85"><label>85</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Xin</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Ren</surname><given-names>X</given-names> </name></person-group><article-title>Predicting depression among rural and urban disabled elderly in China using a random forest classifier</article-title><source>BMC Psychiatry</source><year>2022</year><month>02</month><day>15</day><volume>22</volume><issue>1</issue><fpage>118</fpage><pub-id pub-id-type="doi">10.1186/s12888-022-03742-4</pub-id><pub-id pub-id-type="medline">35168579</pub-id></nlm-citation></ref><ref id="ref86"><label>86</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Zhang</surname><given-names>L</given-names> </name><name name-style="western"><surname>Zhao</surname><given-names>S</given-names> </name><name name-style="western"><surname>Yang</surname><given-names>Z</given-names> </name><name name-style="western"><surname>Zheng</surname><given-names>H</given-names> </name><name name-style="western"><surname>Lei</surname><given-names>M</given-names> </name></person-group><article-title>An artificial intelligence platform to stratify the risk of experiencing sleep disturbance in university students after analyzing psychological health, lifestyle, and sports: a multicenter externally validated study</article-title><source>Psychol Res Behav Manag</source><year>2024</year><volume>17</volume><fpage>1057</fpage><lpage>1071</lpage><pub-id pub-id-type="doi">10.2147/PRBM.S448698</pub-id><pub-id pub-id-type="medline">38505352</pub-id></nlm-citation></ref><ref id="ref87"><label>87</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Allen</surname><given-names>B</given-names> </name></person-group><article-title>An interpretable machine learning model of cross-sectional U.S. county-level obesity prevalence using explainable artificial intelligence</article-title><source>PLOS ONE</source><year>2023</year><volume>18</volume><issue>10</issue><fpage>e0292341</fpage><pub-id pub-id-type="doi">10.1371/journal.pone.0292341</pub-id><pub-id pub-id-type="medline">37796874</pub-id></nlm-citation></ref><ref id="ref88"><label>88</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Morris</surname><given-names>MC</given-names> </name><name name-style="western"><surname>Moradi</surname><given-names>H</given-names> </name><name name-style="western"><surname>Aslani</surname><given-names>M</given-names> </name><etal/></person-group><article-title>Predicting incident cardiovascular disease among African-American adults: a deep learning approach to evaluate social determinants of health in the Jackson heart study</article-title><source>PLOS ONE</source><year>2023</year><volume>18</volume><issue>11</issue><fpage>e0294050</fpage><pub-id pub-id-type="doi">10.1371/journal.pone.0294050</pub-id><pub-id pub-id-type="medline">37948388</pub-id></nlm-citation></ref><ref id="ref89"><label>89</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Moon</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Woo</surname><given-names>H</given-names> </name></person-group><article-title>Key risk factors of generalized anxiety disorder in adolescents: machine learning study</article-title><source>Front Public Health</source><year>2024</year><volume>12</volume><fpage>1504739</fpage><pub-id pub-id-type="doi">10.3389/fpubh.2024.1504739</pub-id><pub-id pub-id-type="medline">39839408</pub-id></nlm-citation></ref><ref id="ref90"><label>90</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Cheung</surname><given-names>YK</given-names> </name><name name-style="western"><surname>Hsueh</surname><given-names>PYS</given-names> </name><name name-style="western"><surname>Qian</surname><given-names>M</given-names> </name><etal/></person-group><article-title>Are nomothetic or ideographic approaches superior in predicting daily exercise behaviors?</article-title><source>METHODS Inf Med</source><year>2017</year><volume>56</volume><issue>6</issue><fpage>452</fpage><lpage>460</lpage><pub-id pub-id-type="doi">10.3414/ME16-02-0051</pub-id><pub-id pub-id-type="medline">29582914</pub-id></nlm-citation></ref><ref id="ref91"><label>91</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kim</surname><given-names>J</given-names> </name><name name-style="western"><surname>Jeong</surname><given-names>K</given-names> </name><name name-style="western"><surname>Lee</surname><given-names>S</given-names> </name><name name-style="western"><surname>Baek</surname><given-names>Y</given-names> </name></person-group><article-title>Machine-learning model predicting quality of life using multifaceted lifestyles in middle-aged South Korean adults: a cross-sectional study</article-title><source>BMC Public Health</source><year>2024</year><month>01</month><day>11</day><volume>24</volume><issue>1</issue><fpage>159</fpage><pub-id pub-id-type="doi">10.1186/s12889-023-17457-y</pub-id><pub-id pub-id-type="medline">38212741</pub-id></nlm-citation></ref><ref id="ref92"><label>92</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Pereira</surname><given-names>MG</given-names> </name><name name-style="western"><surname>Santos</surname><given-names>M</given-names> </name><name name-style="western"><surname>Magalh&#x00E3;es</surname><given-names>R</given-names> </name><name name-style="western"><surname>Rodrigues</surname><given-names>C</given-names> </name><name name-style="western"><surname>Ara&#x00FA;jo</surname><given-names>O</given-names> </name><name name-style="western"><surname>Dur&#x00E3;es</surname><given-names>D</given-names> </name></person-group><article-title>Burnout risk profiles in psychology students: an exploratory study with machine learning</article-title><source>Behav Sci (Basel)</source><year>2025</year><month>04</month><day>9</day><volume>15</volume><issue>4</issue><fpage>505</fpage><pub-id pub-id-type="doi">10.3390/bs15040505</pub-id><pub-id pub-id-type="medline">40282126</pub-id></nlm-citation></ref><ref id="ref93"><label>93</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Ai</surname><given-names>M</given-names> </name><name name-style="western"><surname>Morris</surname><given-names>TP</given-names> </name><name name-style="western"><surname>Zhang</surname><given-names>J</given-names> </name><etal/></person-group><article-title>Resting-state MRI functional connectivity as a neural correlate of multidomain lifestyle adherence in older adults at risk for Alzheimer&#x2019;s disease</article-title><source>Sci Rep</source><year>2023</year><month>05</month><day>9</day><volume>13</volume><issue>1</issue><fpage>7487</fpage><pub-id pub-id-type="doi">10.1038/s41598-023-32714-1</pub-id><pub-id pub-id-type="medline">37160915</pub-id></nlm-citation></ref><ref id="ref94"><label>94</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Sandri</surname><given-names>E</given-names> </name><name name-style="western"><surname>Cerd&#x00E1; Olmedo</surname><given-names>G</given-names> </name><name name-style="western"><surname>Piredda</surname><given-names>M</given-names> </name><name name-style="western"><surname>Werner</surname><given-names>LU</given-names> </name><name name-style="western"><surname>Dentamaro</surname><given-names>V</given-names> </name></person-group><article-title>Explanatory AI predicts the diet adopted based on nutritional and lifestyle habits in the Spanish population</article-title><source>Eur J Investig Health Psychol Educ</source><year>2025</year><month>01</month><day>24</day><volume>15</volume><issue>2</issue><fpage>11</fpage><pub-id pub-id-type="doi">10.3390/ejihpe15020011</pub-id><pub-id pub-id-type="medline">39997075</pub-id></nlm-citation></ref><ref id="ref95"><label>95</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Birk</surname><given-names>N</given-names> </name><name name-style="western"><surname>Matsuzaki</surname><given-names>M</given-names> </name><name name-style="western"><surname>Fung</surname><given-names>TT</given-names> </name><etal/></person-group><article-title>Exploration of machine learning and statistical techniques in development of a low-cost screening method featuring the global diet quality score for detecting prediabetes in rural India</article-title><source>J Nutr</source><year>2021</year><month>10</month><day>23</day><volume>151</volume><issue>12 Suppl 2</issue><fpage>110S</fpage><lpage>118S</lpage><pub-id pub-id-type="doi">10.1093/jn/nxab281</pub-id><pub-id pub-id-type="medline">34689190</pub-id></nlm-citation></ref><ref id="ref96"><label>96</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Wallace</surname><given-names>ML</given-names> </name><name name-style="western"><surname>Buysse</surname><given-names>DJ</given-names> </name><name name-style="western"><surname>Redline</surname><given-names>S</given-names> </name><etal/></person-group><article-title>Multidimensional sleep and mortality in older adults: a machine-learning comparison with other risk factors</article-title><source>J Gerontol A Biol Sci Med Sci</source><year>2019</year><month>11</month><day>13</day><volume>74</volume><issue>12</issue><fpage>1903</fpage><lpage>1909</lpage><pub-id pub-id-type="doi">10.1093/gerona/glz044</pub-id><pub-id pub-id-type="medline">30778527</pub-id></nlm-citation></ref><ref id="ref97"><label>97</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Wang</surname><given-names>X</given-names> </name><name name-style="western"><surname>Zhang</surname><given-names>D</given-names> </name><name name-style="western"><surname>Lu</surname><given-names>L</given-names> </name><etal/></person-group><article-title>Development and validation of an explainable machine learning model for predicting the risk of sleep disorders in older adults with multimorbidity: a cross-sectional study</article-title><source>Front Public Health</source><year>2025</year><volume>13</volume><fpage>1619406</fpage><pub-id pub-id-type="doi">10.3389/fpubh.2025.1619406</pub-id><pub-id pub-id-type="medline">40860561</pub-id></nlm-citation></ref><ref id="ref98"><label>98</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Zhou</surname><given-names>RZ</given-names> </name><name name-style="western"><surname>Hu</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Tirabassi</surname><given-names>JN</given-names> </name><name name-style="western"><surname>Ma</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Xu</surname><given-names>Z</given-names> </name></person-group><article-title>Deriving neighborhood-level diet and physical activity measurements from anonymized mobile phone location data for enhancing obesity estimation</article-title><source>Int J Health Geogr</source><year>2022</year><month>12</month><day>30</day><volume>21</volume><issue>1</issue><fpage>22</fpage><pub-id pub-id-type="doi">10.1186/s12942-022-00321-4</pub-id><pub-id pub-id-type="medline">36585658</pub-id></nlm-citation></ref><ref id="ref99"><label>99</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Oladeji</surname><given-names>O</given-names> </name><name name-style="western"><surname>Zhang</surname><given-names>C</given-names> </name><name name-style="western"><surname>Moradi</surname><given-names>T</given-names> </name><etal/></person-group><article-title>Monitoring information-seeking patterns and obesity prevalence in Africa with internet search data: observational study</article-title><source>JMIR Public Health Surveill</source><year>2021</year><month>04</month><day>29</day><volume>7</volume><issue>4</issue><fpage>e24348</fpage><pub-id pub-id-type="doi">10.2196/24348</pub-id><pub-id pub-id-type="medline">33913815</pub-id></nlm-citation></ref><ref id="ref100"><label>100</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Stemmer</surname><given-names>M</given-names> </name><name name-style="western"><surname>Parmet</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Ravid</surname><given-names>G</given-names> </name></person-group><article-title>Identifying patients with inflammatory bowel disease on Twitter and learning from their personal experience: retrospective cohort study</article-title><source>J Med Internet Res</source><year>2022</year><month>08</month><day>2</day><volume>24</volume><issue>8</issue><fpage>e29186</fpage><pub-id pub-id-type="doi">10.2196/29186</pub-id><pub-id pub-id-type="medline">35917151</pub-id></nlm-citation></ref><ref id="ref101"><label>101</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Sathyanarayana</surname><given-names>A</given-names> </name><name name-style="western"><surname>Joty</surname><given-names>S</given-names> </name><name name-style="western"><surname>Fernandez-Luque</surname><given-names>L</given-names> </name><etal/></person-group><article-title>Sleep quality prediction from wearable data using deep learning</article-title><source>JMIR Mhealth Uhealth</source><year>2016</year><month>11</month><day>4</day><volume>4</volume><issue>4</issue><fpage>e125</fpage><pub-id pub-id-type="doi">10.2196/mhealth.6562</pub-id><pub-id pub-id-type="medline">27815231</pub-id></nlm-citation></ref><ref id="ref102"><label>102</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Chiang</surname><given-names>PH</given-names> </name><name name-style="western"><surname>Dey</surname><given-names>S</given-names> </name></person-group><article-title>Offline and online learning techniques for personalized blood pressure prediction and health behavior recommendations</article-title><source>IEEE Access</source><year>2019</year><volume>7</volume><fpage>130854</fpage><lpage>130864</lpage><pub-id pub-id-type="doi">10.1109/ACCESS.2019.2939218</pub-id></nlm-citation></ref><ref id="ref103"><label>103</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Zhong</surname><given-names>J</given-names> </name><name name-style="western"><surname>Liu</surname><given-names>W</given-names> </name><name name-style="western"><surname>Niu</surname><given-names>B</given-names> </name><name name-style="western"><surname>Lin</surname><given-names>X</given-names> </name><name name-style="western"><surname>Deng</surname><given-names>Y</given-names> </name></person-group><article-title>Role of built environments on physical activity and health promotion: a review and policy insights</article-title><source>Front Public Health</source><year>2022</year><volume>10</volume><fpage>950348</fpage><pub-id pub-id-type="doi">10.3389/fpubh.2022.950348</pub-id><pub-id pub-id-type="medline">35910910</pub-id></nlm-citation></ref><ref id="ref104"><label>104</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kimura</surname><given-names>N</given-names> </name><name name-style="western"><surname>Aota</surname><given-names>T</given-names> </name><name name-style="western"><surname>Aso</surname><given-names>Y</given-names> </name><etal/></person-group><article-title>Predicting positron emission tomography brain amyloid positivity using interpretable machine learning models with wearable sensor data and lifestyle factors</article-title><source>Alz Res THERAPY</source><year>2023</year><volume>15</volume><issue>1</issue><pub-id pub-id-type="doi">10.1186/s13195-023-01363-x</pub-id></nlm-citation></ref><ref id="ref105"><label>105</label><nlm-citation citation-type="web"><article-title>The R project for statistical computing</article-title><year>2022</year><access-date>2026-02-20</access-date><publisher-name>R Foundation for Statistical Computing</publisher-name><comment><ext-link ext-link-type="uri" xlink:href="https://www.R-project.org/">https://www.R-project.org/</ext-link></comment></nlm-citation></ref><ref id="ref106"><label>106</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Wickham</surname><given-names>H</given-names> </name><name name-style="western"><surname>Averick</surname><given-names>M</given-names> </name><name name-style="western"><surname>Bryan</surname><given-names>J</given-names> </name><etal/></person-group><article-title>Welcome to the Tidyverse</article-title><source>JOSS</source><year>2019</year><month>11</month><day>21</day><volume>4</volume><issue>43</issue><fpage>1686</fpage><pub-id pub-id-type="doi">10.21105/joss.01686</pub-id></nlm-citation></ref><ref id="ref107"><label>107</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Groothuis-Oudshoorn</surname><given-names>K</given-names> </name></person-group><article-title>mice: multivariate imputation by chained equations in R</article-title><source>J Stat Soft</source><year>2011</year><volume>45</volume><issue>3</issue><pub-id pub-id-type="doi">10.18637/jss.v045.i03</pub-id></nlm-citation></ref><ref id="ref108"><label>108</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kursa</surname><given-names>MB</given-names> </name><name name-style="western"><surname>Rudnicki</surname><given-names>WR</given-names> </name></person-group><article-title>Feature selection with the Boruta package</article-title><source>J Stat Soft</source><year>2010</year><volume>36</volume><issue>11</issue><pub-id pub-id-type="doi">10.18637/jss.v036.i11</pub-id></nlm-citation></ref><ref id="ref109"><label>109</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kuhn</surname><given-names>M</given-names> </name></person-group><article-title>Building predictive models in R using the caret package</article-title><source>J Stat Soft</source><year>2008</year><volume>28</volume><issue>5</issue><pub-id pub-id-type="doi">10.18637/jss.v028.i05</pub-id></nlm-citation></ref><ref id="ref110"><label>110</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>van der Laan</surname><given-names>MJ</given-names> </name><name name-style="western"><surname>Polley</surname><given-names>EC</given-names> </name><name name-style="western"><surname>Hubbard</surname><given-names>AE</given-names> </name></person-group><article-title>Super learner</article-title><source>Stat Appl Genet Mol Biol</source><year>2007</year><volume>6</volume><issue>1</issue><pub-id pub-id-type="doi">10.2202/1544-6115.1309</pub-id><pub-id pub-id-type="medline">17910531</pub-id></nlm-citation></ref><ref id="ref111"><label>111</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lin</surname><given-names>S (Lamson</given-names> </name></person-group><article-title>The &#x201C;loneliness epidemic&#x201D;, intersecting risk factors and relations to mental health help-seeking: a population-based study during COVID-19 lockdown in Canada</article-title><source>J Affect Disord</source><year>2023</year><month>01</month><volume>320</volume><fpage>7</fpage><lpage>17</lpage><pub-id pub-id-type="doi">10.1016/j.jad.2022.08.131</pub-id></nlm-citation></ref><ref id="ref112"><label>112</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Berthold</surname><given-names>MR</given-names> </name><name name-style="western"><surname>Cebron</surname><given-names>N</given-names> </name><name name-style="western"><surname>Dill</surname><given-names>F</given-names> </name><etal/></person-group><article-title>KNIME - the Konstanz information miner: version 2.0 and beyond</article-title><source>SIGKDD Explor Newsl</source><year>2009</year><month>11</month><day>16</day><volume>11</volume><issue>1</issue><fpage>26</fpage><lpage>31</lpage><pub-id pub-id-type="doi">10.1145/1656274.1656280</pub-id></nlm-citation></ref><ref id="ref113"><label>113</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Castro</surname><given-names>R</given-names> </name><name name-style="western"><surname>Ribeiro-Alves</surname><given-names>M</given-names> </name><name name-style="western"><surname>Oliveira</surname><given-names>C</given-names> </name><etal/></person-group><article-title>What are we measuring when we evaluate digital interventions for improving lifestyle? A scoping meta-review</article-title><source>Front Public Health</source><year>2021</year><volume>9</volume><fpage>735624</fpage><pub-id pub-id-type="doi">10.3389/fpubh.2021.735624</pub-id><pub-id pub-id-type="medline">35047469</pub-id></nlm-citation></ref><ref id="ref114"><label>114</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Pasquetto</surname><given-names>IV</given-names> </name><name name-style="western"><surname>Borgman</surname><given-names>CL</given-names> </name><name name-style="western"><surname>Wofford</surname><given-names>MF</given-names> </name></person-group><article-title>Uses and reuses of scientific data: the data creators&#x2019; advantage</article-title><source>HDSR</source><year>2019</year><access-date>2026-02-20</access-date><volume>1</volume><issue>2</issue><comment><ext-link ext-link-type="uri" xlink:href="https://hdsr.mitpress.mit.edu/collection/af83430a">https://hdsr.mitpress.mit.edu/collection/af83430a</ext-link></comment><pub-id pub-id-type="doi">10.1162/99608f92.fc14bf2d</pub-id></nlm-citation></ref><ref id="ref115"><label>115</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Aldoseri</surname><given-names>A</given-names> </name><name name-style="western"><surname>Al-Khalifa</surname><given-names>KN</given-names> </name><name name-style="western"><surname>Hamouda</surname><given-names>AM</given-names> </name></person-group><article-title>Re-thinking data strategy and integration for artificial intelligence: concepts, opportunities, and challenges</article-title><source>Appl Sci (Basel)</source><year>2023</year><month>06</month><day>13</day><volume>13</volume><issue>12</issue><fpage>7082</fpage><pub-id pub-id-type="doi">10.3390/app13127082</pub-id></nlm-citation></ref><ref id="ref116"><label>116</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kim</surname><given-names>KH</given-names> </name><name name-style="western"><surname>Oh</surname><given-names>SW</given-names> </name><name name-style="western"><surname>Ko</surname><given-names>SJ</given-names> </name><name name-style="western"><surname>Lee</surname><given-names>KH</given-names> </name><name name-style="western"><surname>Choi</surname><given-names>W</given-names> </name><name name-style="western"><surname>Choi</surname><given-names>IY</given-names> </name></person-group><person-group person-group-type="editor"><name name-style="western"><surname>Meri</surname><given-names>A</given-names> </name></person-group><article-title>Healthcare data quality assessment for improving the quality of the Korea Biobank Network</article-title><source>PLoS ONE</source><year>2023</year><volume>18</volume><issue>11</issue><fpage>e0294554</fpage><pub-id pub-id-type="doi">10.1371/journal.pone.0294554</pub-id><pub-id pub-id-type="medline">37983215</pub-id></nlm-citation></ref><ref id="ref117"><label>117</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Iqbal</surname><given-names>SMA</given-names> </name><name name-style="western"><surname>Mahgoub</surname><given-names>I</given-names> </name><name name-style="western"><surname>Du</surname><given-names>E</given-names> </name><name name-style="western"><surname>Leavitt</surname><given-names>MA</given-names> </name><name name-style="western"><surname>Asghar</surname><given-names>W</given-names> </name></person-group><article-title>Advances in healthcare wearable devices</article-title><source>npj Flex Electron</source><year>2021</year><volume>5</volume><issue>1</issue><fpage>9</fpage><pub-id pub-id-type="doi">10.1038/s41528-021-00107-x</pub-id></nlm-citation></ref><ref id="ref118"><label>118</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>Mohanta</surname><given-names>B</given-names> </name><name name-style="western"><surname>Das</surname><given-names>P</given-names> </name><name name-style="western"><surname>Patnaik</surname><given-names>S</given-names> </name></person-group><article-title>Healthcare 5.0: a paradigm shift in digital healthcare system using artificial intelligence, IOT and 5G communication</article-title><year>2019</year><conf-name>2019 International Conference on Applied Machine Learning (ICAML)</conf-name><conf-date>May 25-26, 2019</conf-date><conf-loc>Bhubaneswar, India</conf-loc><fpage>191</fpage><lpage>196</lpage><pub-id pub-id-type="doi">10.1109/ICAML48257.2019.00044</pub-id></nlm-citation></ref><ref id="ref119"><label>119</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kamel Boulos</surname><given-names>MN</given-names> </name><name name-style="western"><surname>Koh</surname><given-names>K</given-names> </name></person-group><article-title>Smart city lifestyle sensing, big data, geo-analytics and intelligence for smarter public health decision-making in overweight, obesity and type 2 diabetes prevention: the research we should be doing</article-title><source>Int J Health Geogr</source><year>2021</year><month>03</month><day>3</day><volume>20</volume><issue>1</issue><fpage>12</fpage><pub-id pub-id-type="doi">10.1186/s12942-021-00266-0</pub-id><pub-id pub-id-type="medline">33658039</pub-id></nlm-citation></ref><ref id="ref120"><label>120</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Perez-Pozuelo</surname><given-names>I</given-names> </name><name name-style="western"><surname>Zhai</surname><given-names>B</given-names> </name><name name-style="western"><surname>Palotti</surname><given-names>J</given-names> </name><etal/></person-group><article-title>The future of sleep health: a data-driven revolution in sleep science and medicine</article-title><source>NPJ Digit Med</source><year>2020</year><volume>3</volume><issue>1</issue><fpage>42</fpage><pub-id pub-id-type="doi">10.1038/s41746-020-0244-4</pub-id><pub-id pub-id-type="medline">32219183</pub-id></nlm-citation></ref><ref id="ref121"><label>121</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Reinertsen</surname><given-names>E</given-names> </name><name name-style="western"><surname>Clifford</surname><given-names>GD</given-names> </name></person-group><article-title>A review of physiological and behavioral monitoring with digital sensors for neuropsychiatric illnesses</article-title><source>Physiol Meas</source><year>2018</year><month>05</month><day>15</day><volume>39</volume><issue>5</issue><fpage>05TR01</fpage><pub-id pub-id-type="doi">10.1088/1361-6579/aabf64</pub-id><pub-id pub-id-type="medline">29671754</pub-id></nlm-citation></ref><ref id="ref122"><label>122</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Breiman</surname><given-names>L</given-names> </name></person-group><article-title>Random forests</article-title><source>Mach Learn</source><year>2001</year><month>10</month><volume>45</volume><issue>1</issue><fpage>5</fpage><lpage>32</lpage><pub-id pub-id-type="doi">10.1023/A:1010933404324</pub-id></nlm-citation></ref><ref id="ref123"><label>123</label><nlm-citation citation-type="book"><person-group person-group-type="author"><name name-style="western"><surname>Kuhn</surname><given-names>M</given-names> </name><name name-style="western"><surname>Johnson</surname><given-names>K</given-names> </name></person-group><source>Feature Engineering and Selection: A Practical Approach for Predictive Models</source><year>2020</year><publisher-name>CRC Press, Taylor &#x0026; Francis Group</publisher-name><pub-id pub-id-type="other">978-1-138-07922-9</pub-id></nlm-citation></ref><ref id="ref124"><label>124</label><nlm-citation citation-type="other"><person-group person-group-type="author"><name name-style="western"><surname>Thompson</surname><given-names>NC</given-names> </name><name name-style="western"><surname>Ge</surname><given-names>S</given-names> </name><name name-style="western"><surname>Manso</surname><given-names>GF</given-names> </name></person-group><article-title>The importance of (exponentially more) computing power</article-title><source>arXiv</source><comment>Preprint posted online on  Jun 28, 2022</comment><pub-id pub-id-type="doi">10.48550/ARXIV.2206.14007</pub-id></nlm-citation></ref><ref id="ref125"><label>125</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Arora</surname><given-names>A</given-names> </name><name name-style="western"><surname>Alderman</surname><given-names>JE</given-names> </name><name name-style="western"><surname>Palmer</surname><given-names>J</given-names> </name><etal/></person-group><article-title>The value of standards for health datasets in artificial intelligence-based applications</article-title><source>Nat Med</source><year>2023</year><month>11</month><volume>29</volume><issue>11</issue><fpage>2929</fpage><lpage>2938</lpage><pub-id pub-id-type="doi">10.1038/s41591-023-02608-w</pub-id></nlm-citation></ref><ref id="ref126"><label>126</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Chawla</surname><given-names>NV</given-names> </name><name name-style="western"><surname>Bowyer</surname><given-names>KW</given-names> </name><name name-style="western"><surname>Hall</surname><given-names>LO</given-names> </name><name name-style="western"><surname>Kegelmeyer</surname><given-names>WP</given-names> </name></person-group><article-title>SMOTE: Synthetic Minority Over-sampling Technique</article-title><source>jair</source><year>2002</year><month>06</month><day>1</day><volume>16</volume><fpage>321</fpage><lpage>357</lpage><pub-id pub-id-type="doi">10.1613/jair.953</pub-id></nlm-citation></ref><ref id="ref127"><label>127</label><nlm-citation citation-type="book"><person-group person-group-type="author"><name name-style="western"><surname>Aliferis</surname><given-names>C</given-names> </name><name name-style="western"><surname>Overfitting</surname><given-names>SG</given-names> </name></person-group><person-group person-group-type="editor"><name name-style="western"><surname>Simon</surname><given-names>GJ</given-names> </name><name name-style="western"><surname>Aliferis</surname><given-names>C</given-names> </name></person-group><article-title>Underfitting and general model overconfidence and under-performance pitfalls and best practices in machine learning and AI</article-title><source>Artificial Intelligence and Machine Learning in Health Care and Medical Sciences</source><year>2024</year><publisher-name>Springer International Publishing</publisher-name><fpage>477</fpage><lpage>524</lpage><pub-id pub-id-type="doi">10.1007/978-3-031-39355-6_10</pub-id><pub-id pub-id-type="other">978-3-031-39354-9</pub-id></nlm-citation></ref><ref id="ref128"><label>128</label><nlm-citation citation-type="book"><person-group person-group-type="author"><name name-style="western"><surname>James</surname><given-names>G</given-names> </name><name name-style="western"><surname>Witten</surname><given-names>D</given-names> </name><name name-style="western"><surname>Hastie</surname><given-names>T</given-names> </name><name name-style="western"><surname>Methods</surname><given-names>TRR</given-names> </name></person-group><source>Resampling Methods An Introduction to Statistical Learning</source><year>2021</year><publisher-name>Springer</publisher-name><fpage>197</fpage><lpage>223</lpage><pub-id pub-id-type="doi">10.1007/978-1-0716-1418-1_5</pub-id><pub-id pub-id-type="other">978-1-0716-1417-4</pub-id></nlm-citation></ref><ref id="ref129"><label>129</label><nlm-citation citation-type="book"><person-group person-group-type="author"><name name-style="western"><surname>Hyndman</surname><given-names>RJ</given-names> </name><name name-style="western"><surname>Athanasopoulos</surname><given-names>G</given-names> </name></person-group><source>Forecasting: Principles and Practice</source><year>2018</year><access-date>2026-02-20</access-date><edition>2</edition><publisher-name>OTexts</publisher-name><comment><ext-link ext-link-type="uri" xlink:href="https://otexts.org/fpp2/">https://otexts.org/fpp2/</ext-link></comment></nlm-citation></ref><ref id="ref130"><label>130</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Saarela</surname><given-names>M</given-names> </name><name name-style="western"><surname>Podgorelec</surname><given-names>V</given-names> </name></person-group><article-title>Recent applications of explainable AI (XAI): a systematic literature review</article-title><source>Appl Sci (Basel)</source><year>2024</year><month>10</month><day>2</day><volume>14</volume><issue>19</issue><fpage>8884</fpage><pub-id pub-id-type="doi">10.3390/app14198884</pub-id></nlm-citation></ref><ref id="ref131"><label>131</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Rodr&#x00ED;guez-P&#x00E9;rez</surname><given-names>R</given-names> </name><name name-style="western"><surname>Bajorath</surname><given-names>J</given-names> </name></person-group><article-title>Interpretation of compound activity predictions from complex machine learning models using local approximations and Shapley values</article-title><source>J Med Chem</source><year>2020</year><month>08</month><day>27</day><volume>63</volume><issue>16</issue><fpage>8761</fpage><lpage>8777</lpage><pub-id pub-id-type="doi">10.1021/acs.jmedchem.9b01101</pub-id><pub-id pub-id-type="medline">31512867</pub-id></nlm-citation></ref><ref id="ref132"><label>132</label><nlm-citation citation-type="web"><article-title>Overview</article-title><source>H2O.ai</source><year>2024</year><access-date>2026-02-20</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://docs.h2o.ai/h2o/latest-stable/h2o-docs/index.html">https://docs.h2o.ai/h2o/latest-stable/h2o-docs/index.html</ext-link></comment></nlm-citation></ref><ref id="ref133"><label>133</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Hosker</surname><given-names>DK</given-names> </name><name name-style="western"><surname>Elkins</surname><given-names>RM</given-names> </name><name name-style="western"><surname>Potter</surname><given-names>MP</given-names> </name></person-group><article-title>Promoting mental health and wellness in youth through physical activity, nutrition, and sleep</article-title><source>Child Adolesc Psychiatr Clin N Am</source><year>2019</year><month>04</month><volume>28</volume><issue>2</issue><fpage>171</fpage><lpage>193</lpage><pub-id pub-id-type="doi">10.1016/j.chc.2018.11.010</pub-id><pub-id pub-id-type="medline">30832951</pub-id></nlm-citation></ref><ref id="ref134"><label>134</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kris-Etherton</surname><given-names>PM</given-names> </name><name name-style="western"><surname>Sapp</surname><given-names>PA</given-names> </name><name name-style="western"><surname>Riley</surname><given-names>TM</given-names> </name><name name-style="western"><surname>Davis</surname><given-names>KM</given-names> </name><name name-style="western"><surname>Hart</surname><given-names>T</given-names> </name><name name-style="western"><surname>Lawler</surname><given-names>O</given-names> </name></person-group><article-title>The dynamic interplay of healthy lifestyle behaviors for cardiovascular health</article-title><source>Curr Atheroscler Rep</source><year>2022</year><month>12</month><volume>24</volume><issue>12</issue><fpage>969</fpage><lpage>980</lpage><pub-id pub-id-type="doi">10.1007/s11883-022-01068-w</pub-id><pub-id pub-id-type="medline">36422788</pub-id></nlm-citation></ref><ref id="ref135"><label>135</label><nlm-citation citation-type="book"><person-group person-group-type="author"><name name-style="western"><surname>Kuhn</surname><given-names>M</given-names> </name><name name-style="western"><surname>Silge</surname><given-names>J</given-names> </name></person-group><source>Tidy Modeling with R: A Framework for Modeling in the Tidyverse</source><year>2022</year><edition>1</edition><publisher-name>O&#x2019;Reilly</publisher-name><pub-id pub-id-type="other">978-1-4920-9648-1</pub-id></nlm-citation></ref><ref id="ref136"><label>136</label><nlm-citation citation-type="book"><person-group person-group-type="author"><name name-style="western"><surname>Colaboratory</surname><given-names>BEG</given-names> </name></person-group><source>Building Machine Learning and Deep Learning Models on Google Cloud Platform</source><year>2019</year><publisher-name>Apress</publisher-name><fpage>59</fpage><lpage>64</lpage><pub-id pub-id-type="doi">10.1007/978-1-4842-4470-8_7</pub-id><pub-id pub-id-type="other">978-1-4842-4469-2</pub-id></nlm-citation></ref><ref id="ref137"><label>137</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Han</surname><given-names>S</given-names> </name><name name-style="western"><surname>Olonisakin</surname><given-names>TF</given-names> </name><name name-style="western"><surname>Pribis</surname><given-names>JP</given-names> </name><etal/></person-group><person-group person-group-type="editor"><name name-style="western"><surname>Boltze</surname><given-names>J</given-names> </name></person-group><article-title>A checklist is associated with increased quality of reporting preclinical biomedical research: a systematic review</article-title><source>PLoS ONE</source><year>2017</year><volume>12</volume><issue>9</issue><fpage>e0183591</fpage><pub-id pub-id-type="doi">10.1371/journal.pone.0183591</pub-id></nlm-citation></ref><ref id="ref138"><label>138</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Luo</surname><given-names>W</given-names> </name><name name-style="western"><surname>Phung</surname><given-names>D</given-names> </name><name name-style="western"><surname>Tran</surname><given-names>T</given-names> </name><etal/></person-group><article-title>Guidelines for developing and reporting machine learning predictive models in biomedical research: a multidisciplinary view</article-title><source>J Med Internet Res</source><year>2016</year><month>12</month><day>16</day><volume>18</volume><issue>12</issue><fpage>e323</fpage><pub-id pub-id-type="doi">10.2196/jmir.5870</pub-id><pub-id pub-id-type="medline">27986644</pub-id></nlm-citation></ref><ref id="ref139"><label>139</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Al-Zaiti</surname><given-names>SS</given-names> </name><name name-style="western"><surname>Alghwiri</surname><given-names>AA</given-names> </name><name name-style="western"><surname>Hu</surname><given-names>X</given-names> </name><etal/></person-group><article-title>A clinician&#x2019;s guide to understanding and critically appraising machine learning studies: a checklist for Ruling Out Bias Using Standard Tools in Machine Learning (ROBUST-ML)</article-title><source>Eur Heart J Digit Health</source><year>2022</year><month>06</month><volume>3</volume><issue>2</issue><fpage>125</fpage><lpage>140</lpage><pub-id pub-id-type="doi">10.1093/ehjdh/ztac016</pub-id><pub-id pub-id-type="medline">36713011</pub-id></nlm-citation></ref><ref id="ref140"><label>140</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Stevens</surname><given-names>GA</given-names> </name><name name-style="western"><surname>Alkema</surname><given-names>L</given-names> </name><name name-style="western"><surname>Black</surname><given-names>RE</given-names> </name><etal/></person-group><article-title>Guidelines for accurate and transparent health estimates reporting: the GATHER statement</article-title><source>The Lancet</source><year>2016</year><month>12</month><volume>388</volume><issue>10062</issue><fpage>e19</fpage><lpage>e23</lpage><pub-id pub-id-type="doi">10.1016/S0140-6736(16)30388-9</pub-id></nlm-citation></ref><ref id="ref141"><label>141</label><nlm-citation citation-type="other"><person-group person-group-type="author"><name name-style="western"><surname>Moritz</surname><given-names>S</given-names> </name><name name-style="western"><surname>Sard&#x00E1;</surname><given-names>A</given-names> </name><name name-style="western"><surname>Bartz-Beielstein</surname><given-names>T</given-names> </name><name name-style="western"><surname>Zaefferer</surname><given-names>M</given-names> </name><name name-style="western"><surname>Stork</surname><given-names>J</given-names> </name></person-group><article-title>Comparison of different methods for univariate time series imputation in r</article-title><source>arXiv</source><comment>Preprint posted online on  Oct 13, 2015</comment><pub-id pub-id-type="doi">10.48550/ARXIV.1510.03924</pub-id></nlm-citation></ref><ref id="ref142"><label>142</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Mohsen</surname><given-names>F</given-names> </name><name name-style="western"><surname>Al-Absi</surname><given-names>HRH</given-names> </name><name name-style="western"><surname>Yousri</surname><given-names>NA</given-names> </name><name name-style="western"><surname>El Hajj</surname><given-names>N</given-names> </name><name name-style="western"><surname>Shah</surname><given-names>Z</given-names> </name></person-group><article-title>A scoping review of artificial intelligence-based methods for diabetes risk prediction</article-title><source>NPJ Digit Med</source><year>2023</year><month>10</month><day>25</day><volume>6</volume><issue>1</issue><fpage>197</fpage><pub-id pub-id-type="doi">10.1038/s41746-023-00933-5</pub-id><pub-id pub-id-type="medline">37880301</pub-id></nlm-citation></ref><ref id="ref143"><label>143</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Safi</surname><given-names>SK</given-names> </name><name name-style="western"><surname>Gul</surname><given-names>S</given-names> </name></person-group><article-title>An enhanced tree ensemble for classification in the presence of extreme class imbalance</article-title><source>Mathematics</source><year>2024</year><month>10</month><day>16</day><volume>12</volume><issue>20</issue><fpage>3243</fpage><pub-id pub-id-type="doi">10.3390/math12203243</pub-id></nlm-citation></ref><ref id="ref144"><label>144</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Velarde</surname><given-names>G</given-names> </name><name name-style="western"><surname>Weichert</surname><given-names>M</given-names> </name><name name-style="western"><surname>Deshmunkh</surname><given-names>A</given-names> </name><etal/></person-group><article-title>Tree boosting methods for balanced and imbalanced classification and their robustness over time in risk assessment</article-title><source>Intelligent Systems with Applications</source><year>2024</year><month>06</month><volume>22</volume><fpage>200354</fpage><pub-id pub-id-type="doi">10.1016/j.iswa.2024.200354</pub-id></nlm-citation></ref><ref id="ref145"><label>145</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>Caruana</surname><given-names>R</given-names> </name><name name-style="western"><surname>Niculescu-Mizil</surname><given-names>A</given-names> </name></person-group><article-title>An empirical comparison of supervised learning algorithms</article-title><year>2006</year><access-date>2026-02-20</access-date><conf-name>Proceedings of the 23rd international conference on Machine learning - ICML &#x2019;06</conf-name><conf-date>Jul 24-28, 2006</conf-date><conf-loc>Pittsburgh, PA</conf-loc><fpage>161</fpage><lpage>168</lpage><comment><ext-link ext-link-type="uri" xlink:href="http://portal.acm.org/citation.cfm?doid=1143844">http://portal.acm.org/citation.cfm?doid=1143844</ext-link></comment><pub-id pub-id-type="doi">10.1145/1143844.1143865</pub-id></nlm-citation></ref><ref id="ref146"><label>146</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Arnold</surname><given-names>C</given-names> </name><name name-style="western"><surname>Biedebach</surname><given-names>L</given-names> </name><name name-style="western"><surname>K&#x00FC;pfer</surname><given-names>A</given-names> </name><name name-style="western"><surname>Neunhoeffer</surname><given-names>M</given-names> </name></person-group><article-title>The role of hyperparameters in machine learning models and how to tune them</article-title><source>PSRM</source><year>2024</year><month>10</month><volume>12</volume><issue>4</issue><fpage>841</fpage><lpage>848</lpage><pub-id pub-id-type="doi">10.1017/psrm.2023.61</pub-id></nlm-citation></ref><ref id="ref147"><label>147</label><nlm-citation citation-type="other"><person-group person-group-type="author"><name name-style="western"><surname>Arlot</surname><given-names>S</given-names> </name><name name-style="western"><surname>Celisse</surname><given-names>A</given-names> </name></person-group><article-title>A survey of cross-validation procedures for model selection</article-title><source>Statist Surv</source><comment>Preprint posted online on 2009</comment><pub-id pub-id-type="doi">10.1214/09-SS054</pub-id></nlm-citation></ref><ref id="ref148"><label>148</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Tsamardinos</surname><given-names>I</given-names> </name><name name-style="western"><surname>Greasidou</surname><given-names>E</given-names> </name><name name-style="western"><surname>Borboudakis</surname><given-names>G</given-names> </name></person-group><article-title>Bootstrapping the out-of-sample predictions for efficient and accurate cross-validation</article-title><source>Mach Learn</source><year>2018</year><month>12</month><volume>107</volume><issue>12</issue><fpage>1895</fpage><lpage>1922</lpage><pub-id pub-id-type="doi">10.1007/s10994-018-5714-4</pub-id></nlm-citation></ref><ref id="ref149"><label>149</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Rainio</surname><given-names>O</given-names> </name><name name-style="western"><surname>Teuho</surname><given-names>J</given-names> </name><name name-style="western"><surname>Kl&#x00E9;n</surname><given-names>R</given-names> </name></person-group><article-title>Evaluation metrics and statistical tests for machine learning</article-title><source>Sci Rep</source><year>2024</year><month>03</month><day>13</day><volume>14</volume><issue>1</issue><fpage>6086</fpage><pub-id pub-id-type="doi">10.1038/s41598-024-56706-x</pub-id></nlm-citation></ref><ref id="ref150"><label>150</label><nlm-citation citation-type="other"><person-group person-group-type="author"><name name-style="western"><surname>Grandini</surname><given-names>M</given-names> </name><name name-style="western"><surname>Bagli</surname><given-names>E</given-names> </name><name name-style="western"><surname>Visani</surname><given-names>G</given-names> </name></person-group><article-title>Metrics for multi-class classification: an overview</article-title><source>arXiv</source><comment>Preprint posted online on  Aug 13, 2020</comment><pub-id pub-id-type="doi">10.48550/ARXIV.2008.05756</pub-id></nlm-citation></ref><ref id="ref151"><label>151</label><nlm-citation citation-type="other"><person-group person-group-type="author"><name name-style="western"><surname>Lundberg</surname><given-names>S</given-names> </name><name name-style="western"><surname>Lee</surname><given-names>SI</given-names> </name></person-group><article-title>A unified approach to interpreting model predictions</article-title><source>arXiv</source><access-date>2024-04-22</access-date><comment>Preprint posted online on  May 22, 2017</comment><comment><ext-link ext-link-type="uri" xlink:href="http://arxiv.org/abs/1705.07874">http://arxiv.org/abs/1705.07874</ext-link></comment></nlm-citation></ref><ref id="ref152"><label>152</label><nlm-citation citation-type="other"><person-group person-group-type="author"><name name-style="western"><surname>Ribeiro</surname><given-names>MT</given-names> </name><name name-style="western"><surname>Singh</surname><given-names>S</given-names> </name><name name-style="western"><surname>Guestrin</surname><given-names>C</given-names> </name></person-group><article-title>Model-agnostic interpretability of machine learning</article-title><source>arXiv</source><comment>Preprint posted online on  Jun 16, 2016</comment><pub-id pub-id-type="doi">10.48550/ARXIV.1606.05386</pub-id></nlm-citation></ref><ref id="ref153"><label>153</label><nlm-citation citation-type="other"><person-group person-group-type="author"><name name-style="western"><surname>Maksymiuk</surname><given-names>S</given-names> </name><name name-style="western"><surname>Gosiewska</surname><given-names>A</given-names> </name><name name-style="western"><surname>Biecek</surname><given-names>P</given-names> </name></person-group><article-title>Landscape of R packages for explainable artificial intelligence</article-title><source>arXiv</source><comment>Preprint posted online on  Sep 24, 2020</comment><pub-id pub-id-type="doi">10.48550/ARXIV.2009.13248</pub-id></nlm-citation></ref><ref id="ref154"><label>154</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Ponce&#x2010;Bobadilla</surname><given-names>AV</given-names> </name><name name-style="western"><surname>Schmitt</surname><given-names>V</given-names> </name><name name-style="western"><surname>Maier</surname><given-names>CS</given-names> </name><name name-style="western"><surname>Mensing</surname><given-names>S</given-names> </name><name name-style="western"><surname>Stodtmann</surname><given-names>S</given-names> </name></person-group><article-title>Practical guide to SHAP analysis: explaining supervised machine learning model predictions in drug development</article-title><source>Clinical Translational Sci</source><year>2024</year><month>11</month><access-date>2026-02-20</access-date><volume>17</volume><issue>11</issue><comment><ext-link ext-link-type="uri" xlink:href="https://ascpt.onlinelibrary.wiley.com/toc/17528062/17/11">https://ascpt.onlinelibrary.wiley.com/toc/17528062/17/11</ext-link></comment><pub-id pub-id-type="doi">10.1111/cts.70056</pub-id></nlm-citation></ref><ref id="ref155"><label>155</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lim</surname><given-names>H</given-names> </name><name name-style="western"><surname>Lee</surname><given-names>H</given-names> </name></person-group><article-title>Eating habits and lifestyle factors related to childhood obesity among children aged 5-6 years: cluster analysis of panel survey data in Korea</article-title><source>JMIR Public Health Surveill</source><year>2024</year><month>04</month><day>5</day><volume>10</volume><fpage>e51581</fpage><pub-id pub-id-type="doi">10.2196/51581</pub-id><pub-id pub-id-type="medline">38578687</pub-id></nlm-citation></ref></ref-list><app-group><supplementary-material id="app1"><label>Multimedia Appendix 1</label><p>Extended data and detailed analyses of the included studies.</p><media xlink:href="humanfactors_v13i1e78648_app1.docx" xlink:title="DOCX File, 5266 KB"/></supplementary-material><supplementary-material id="app2"><label>Checklist 1</label><p>PRISMA checklist.</p><media xlink:href="humanfactors_v13i1e78648_app2.pdf" xlink:title="PDF File, 178 KB"/></supplementary-material><supplementary-material id="app3"><label>Checklist 2</label><p>Reporting checklist for machine learning analysis in healthy lifestyle data.</p><media xlink:href="humanfactors_v13i1e78648_app3.docx" xlink:title="DOCX File, 17 KB"/></supplementary-material></app-group></back></article>