<?xml version="1.0" encoding="UTF-8"?><!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "journalpublishing.dtd"><article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" dtd-version="2.0" xml:lang="en" article-type="review-article"><front><journal-meta><journal-id journal-id-type="nlm-ta">JMIR AI</journal-id><journal-id journal-id-type="publisher-id">ai</journal-id><journal-id journal-id-type="index">41</journal-id><journal-title>JMIR AI</journal-title><abbrev-journal-title>JMIR AI</abbrev-journal-title><issn pub-type="epub">2817-1705</issn><publisher><publisher-name>JMIR Publications</publisher-name><publisher-loc>Toronto, Canada</publisher-loc></publisher></journal-meta><article-meta><article-id pub-id-type="publisher-id">v5i1e87819</article-id><article-id pub-id-type="doi">10.2196/87819</article-id><article-categories><subj-group subj-group-type="heading"><subject>Review</subject></subj-group></article-categories><title-group><article-title>Methodological Approaches to and Reported Performance of Applications of Automated Machine Learning in Diabetes Risk Prediction: Rapid Review</article-title></title-group><contrib-group><contrib contrib-type="author"><name name-style="western"><surname>Castonguay</surname><given-names>Alexandre</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author" corresp="yes"><name name-style="western"><surname>Hegg-Deloye</surname><given-names>Sandrine</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff1">1</xref><xref ref-type="aff" rid="aff2">2</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Chatton</surname><given-names>Arthur</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff2">2</xref><xref ref-type="aff" rid="aff3">3</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Goyette</surname><given-names>Am&#x00E9;lie</given-names></name><degrees>MSc</degrees><xref ref-type="aff" rid="aff3">3</xref></contrib></contrib-group><aff id="aff1"><institution>Facult&#x00E9; des sciences infirmi&#x00E8;res, Universit&#x00E9; de Montr&#x00E9;al</institution><addr-line>Pavillon Marguerite d'Youville, 2375, Chemin de la C&#x00F4;te-Sainte-Catherine</addr-line><addr-line>Montr&#x00E9;al</addr-line><addr-line>QC</addr-line><country>Canada</country></aff><aff id="aff2"><institution>D&#x00E9;partement de m&#x00E9;decine sociale et pr&#x00E9;ventive, Universit&#x00E9; de Montr&#x00E9;al</institution><addr-line>Montr&#x00E9;al</addr-line><addr-line>QC</addr-line><country>Canada</country></aff><aff id="aff3"><institution>Centre de recherche Azrieli, CHU Sainte-Justine</institution><addr-line>Montr&#x00E9;al</addr-line><addr-line>QC</addr-line><country>Canada</country></aff><contrib-group><contrib contrib-type="editor"><name name-style="western"><surname>Luo</surname><given-names>Gang</given-names></name></contrib></contrib-group><contrib-group><contrib contrib-type="reviewer"><name name-style="western"><surname>Lim</surname><given-names>Gilbert</given-names></name></contrib><contrib contrib-type="reviewer"><name name-style="western"><surname>Dai</surname><given-names>Jingang</given-names></name></contrib></contrib-group><author-notes><corresp>Correspondence to Sandrine Hegg-Deloye, PhD, Facult&#x00E9; des sciences infirmi&#x00E8;res, Universit&#x00E9; de Montr&#x00E9;al, Pavillon Marguerite d'Youville, 2375, Chemin de la C&#x00F4;te-Sainte-Catherine, Montr&#x00E9;al, QC, H3T 1A8, Canada, 1 4182626594; <email>Sandrine.hegg@umontreal.ca</email></corresp></author-notes><pub-date pub-type="collection"><year>2026</year></pub-date><pub-date pub-type="epub"><day>12</day><month>5</month><year>2026</year></pub-date><volume>5</volume><elocation-id>e87819</elocation-id><history><date date-type="received"><day>19</day><month>11</month><year>2025</year></date><date date-type="rev-recd"><day>04</day><month>03</month><year>2026</year></date><date date-type="accepted"><day>04</day><month>03</month><year>2026</year></date></history><copyright-statement>&#x00A9; Alexandre Castonguay, Sandrine Hegg-Deloye, Arthur Chatton, Am&#x00E9;lie Goyette. Originally published in JMIR AI (<ext-link ext-link-type="uri" xlink:href="https://ai.jmir.org">https://ai.jmir.org</ext-link>), 12.5.2026. </copyright-statement><copyright-year>2026</copyright-year><license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (<ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">https://creativecommons.org/licenses/by/4.0/</ext-link>), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR AI, is properly cited. The complete bibliographic information, a link to the original publication on <ext-link ext-link-type="uri" xlink:href="https://www.ai.jmir.org/">https://www.ai.jmir.org/</ext-link>, as well as this copyright and license information must be included.</p></license><self-uri xlink:type="simple" xlink:href="https://ai.jmir.org/2026/1/e87819"/><abstract><sec><title>Background</title><p>Type 2 diabetes (T2D) is a complex, chronic condition that imposes a substantial burden on health care systems. Prevention and early detection are critical to mitigating its impact. Automated machine learning (AutoML) models have the potential to predict individual risk and guide personalized interventions. However, their clinical deployment remains limited due to the retrospective nature of most datasets, a lack of external validation, and heterogeneity in variable selection.</p></sec><sec><title>Objective</title><p>This study aimed to map AutoML approaches applied to T2D risk prediction, with a specific focus on their ability to integrate clinical, behavioral, environmental, and genomic data.</p></sec><sec sec-type="methods"><title>Methods</title><p>A PRISMA (Preferred Reporting Items for Systematic Reviews and Meta-Analyses)-guided rapid review was conducted across 6 databases (PubMed, Scopus, Web of Science, IEEE Xplore, Google Scholar, and Embase) to identify empirical studies (published between 2015 and 2025) that used AutoML tools for T2D prediction based on at least 2 data types (eg, clinical, behavioral, environmental, and genomic). Screening, data extraction, and synthesis were performed systematically by 2 independent reviewers, with arbitration by ChatGPT acting as an artificial intelligence&#x2013;based third reviewer.</p></sec><sec sec-type="results"><title>Results</title><p>In total, 13 studies met the inclusion criteria. Methodological diversity ranged from conventional machine learning with manual feature selection to partially or fully automated pipelines using tools such as the Tree-Based Pipeline Optimization Tool, H2O AutoML, or Azure Machine Learning. Reported performance varied (area under the curve=0.74&#x2010;0.99); however, external validation was uncommon. Behavioral and environmental data were only partially integrated, and no study incorporated genomic data despite its recognized potential. Most studies lacked transparency and reproducibility, with no public code or pipeline sharing.</p></sec><sec sec-type="conclusions"><title>Conclusions</title><p>AutoML holds significant promise for improving T2D risk prediction through automation and model explainability. However, to support clinical adoption and generalizability, future AutoML pipelines must be developed using prospective, multicenter datasets; integrate diverse, harmonized data types, including genomics; and adhere to open science principles of transparency, reproducibility, and interpretability.</p></sec></abstract><kwd-group><kwd>automated machine learning</kwd><kwd>AutoML</kwd><kwd>type 2 diabetes risk prediction</kwd><kwd>multimodal data integration</kwd><kwd>machine learning validation</kwd><kwd>explainable artificial intelligence</kwd><kwd>artificial intelligence</kwd><kwd>AI</kwd></kwd-group></article-meta></front><body><sec id="s1" sec-type="intro"><title>Introduction</title><p>Type 2 diabetes (T2D) is a growing global public health challenge, affecting an estimated 589 million adults in 2024 (11%) and projected to reach 853 million (13%) by 2050. It is a leading cause of serious complications, such as cardiovascular disease, kidney failure, and vision loss, and is responsible for about 12% of global health expenditure [<xref ref-type="bibr" rid="ref1">1</xref>]. Early detection through risk-based screening and targeted prevention strategies, including lifestyle interventions, is recommended by the American Diabetes Association to reduce morbidity, mortality, and the health care burden associated with T2D and its comorbidities [<xref ref-type="bibr" rid="ref2">2</xref>]. Recent meta-analytic evidence shows that machine learning (ML) models can identify people at high risk of developing T2D with high accuracy, correctly flagging about 8 out of 10 future cases while avoiding false alarms for about 8 of 10 people who will remain diabetes-free, outperforming traditional risk scores in long-term follow-up studies [<xref ref-type="bibr" rid="ref3">3</xref>].</p><p>Over the past decade, many studies have applied ML to predict diabetes risk using data from clinical cohorts, electronic health records, and large population studies. Comparative evaluations show that while these models can improve discrimination over traditional risk scores, such gains are often modest and vary across datasets [<xref ref-type="bibr" rid="ref4">4</xref>]. Moreover, as seen across the broader prognostic modeling literature, calibration, defined as how closely predicted risks match actual outcomes, is rarely assessed; when evaluated, models with good discrimination have sometimes been poorly calibrated [<xref ref-type="bibr" rid="ref5">5</xref>].</p><p>A landmark meta-analysis across diverse prognostic models found that any apparent superiority of ML over logistic regression was largely confined to studies at high risk of bias, with no advantage in those at low risk [<xref ref-type="bibr" rid="ref6">6</xref>]. Many diabetes-related ML studies also rely on retrospective data without validation in new, independent populations, limiting confidence in their generalizability [<xref ref-type="bibr" rid="ref7">7</xref>]. Differences in data quality, variable definitions, and study design further complicate translation into practice. To move the field forward, future work should routinely report both discrimination and calibration, assess potential clinical benefit (eg, through decision-curve analysis), and plan for robust external validation from the outset.</p><p>Automated machine learning (AutoML) frameworks aim to make the development of artificial intelligence (AI) prediction models easier and more consistent by automating key steps such as data preprocessing, feature selection, model selection, and hyperparameter tuning. Many now also include tools to help explain how the model makes predictions, such as identifying which factors are most important [<xref ref-type="bibr" rid="ref8">8</xref>,<xref ref-type="bibr" rid="ref9">9</xref>]. Some platforms, such as Auto-PyTorch, go a step further by automatically testing both traditional and deep learning approaches to find the best combination for the data at hand [<xref ref-type="bibr" rid="ref10">10</xref>].</p><p>This type of standardization could improve the reproducibility and comparability of diabetes prediction studies, but real-world use still depends on strong study designs, such as testing in new patient groups and involving both data scientists and clinicians. Recent reviews point to the untapped potential of AutoML for T2D, especially for combining information from different sources, such as medical records, lifestyle factors, and genetic profiles, into more personalized risk scores [<xref ref-type="bibr" rid="ref11">11</xref>,<xref ref-type="bibr" rid="ref12">12</xref>]. Such capabilities are particularly relevant for T2D, where risk prediction often requires integrating heterogeneous, multimodal data spanning clinical, behavioral, and genetic domains.</p><p>At the same time, challenges remain, such as the difficulty of applying genetic risk scores across different populations and the need to make these complex models understandable to clinicians. These opportunities and barriers motivate a closer look at how AutoML is currently being used in diabetes research and whether it can truly deliver models that are both accurate and ready for clinical use.</p><p>To explore the current state of this emerging field and its practical implications, we conducted a rapid review of AutoML applications in T2D risk prediction (2015&#x2010;2025). Our aim was to summarize how these approaches have been applied, the types of data and methods used, and what has been reported about their performance and clinical readiness, thereby informing their future development and providing insights directly relevant to implementation in real-world settings.</p></sec><sec id="s2" sec-type="methods"><title>Methods</title><sec id="s2-1"><title>Study Design</title><p>We conducted a structured rapid review following the PRISMA (Preferred Reporting Items for Systematic Reviews and Meta-Analyses) guidelines. Consistent with a rapid review approach, the study adhered to PRISMA principles but did not aim for exhaustive coverage, duplicate data extraction at all stages, or meta-analytic synthesis characteristic of a full systematic review. Methodological streamlining, including a restricted time frame and narrative synthesis, was implemented to provide a timely overview of emerging AutoML applications in a fast-evolving field. Accordingly, the findings should be interpreted as a structured mapping of methodological approaches rather than a comprehensive appraisal of the evidence. Although some features overlap with exploratory or scoping reviews, the use of predefined eligibility criteria, a focused research question, and a formal risk-of-bias assessment support the classification of this study as a rapid review. The research question was structured using the population, intervention, comparator, and outcome (PICO) framework to guide eligibility criteria, search strategy, and data extraction.</p></sec><sec id="s2-2"><title>Eligibility Criteria</title><p>Eligibility criteria were defined based on the PICO framework (<xref ref-type="other" rid="box1">Textbox 1</xref>).</p><boxed-text id="box1"><title> Eligibility criteria, defined based on the population, intervention, comparator, and outcome (PICO) framework.</title><p><bold>Population</bold></p><p>Studies included individuals at risk of type 2 diabetes (T2D), regardless of age, sex, or geography. Eligible datasets had to include at least one data type relevant to risk prediction&#x2014;genomic, behavioral, environmental, or clinical.</p><p><bold>Intervention</bold></p><p>Eligible studies applied an AutoML framework (eg, Tree-Based Pipeline Optimization Tool, H2O AutoML, auto-sklearn, and Auto-PyTorch) to predict T2D onset or future risk. These tools had to automate key steps such as data preprocessing, variable selection, algorithm choice, hyperparameter tuning, or model ensembling. For the purpose of this review, AutoML was defined pragmatically as the use of computational pipelines that automate one or more key stages of the modeling workflow. Individual techniques, such as least absolute shrinkage and selection operator regression or gradient-boosted trees (eg, extreme gradient boosting), were considered part of an AutoML approach only when embedded within a partially or fully automated pipeline, rather than applied as standalone, manually specified models.</p><p><bold>Comparator</bold></p><p>When present, comparators included conventional machine learning workflows (manual feature selection and tuning) or alternative AutoML pipelines. Studies without comparators were also eligible.</p><p><bold>Outcomes</bold></p><p>Studies had to report how AutoML was implemented (tools, data types, and modeling strategies) and its predictive performance, including interpretability, the integration of multiple data sources, and methodological innovations for real-world use.</p></boxed-text><p>Eligible studies were empirical investigations using AutoML to predict T2D onset or risk from observational or experimental datasets (eg, cohorts, case-control studies, clinical datasets, or open-access data).</p></sec><sec id="s2-3"><title>Search Strategy</title><p>A structured search strategy was developed, combining four thematic blocks: (1) diabetes (&#x201C;diabet*,&#x201D; &#x201C;type 1,&#x201D; &#x201C;type 2,&#x201D; &#x201C;T1D,&#x201D; &#x201C;T2D,&#x201D; &#x201C;pre-diabet*,&#x201D; &#x201C;insulin resistance,&#x201D; &#x201C;impaired glucose tolerance,&#x201D; &#x201C;HbA1c,&#x201D; &#x201C;hyperglycemia,&#x201D; and &#x201C;glycemic control&#x201D;), (2) AutoML and ML (&#x201C;automated machine learning,&#x201D; &#x201C;machine learning,&#x201D; &#x201C;artificial intelligence,&#x201D; &#x201C;deep learning,&#x201D; &#x201C;neural network,&#x201D; &#x201C;random forest,&#x201D; &#x201C;support vector machine,&#x201D; &#x201C;decision tree,&#x201D; &#x201C;XGBoost,&#x201D; &#x201C;TPOT,&#x201D; &#x201C;H2O.ai,&#x201D; &#x201C;DataRobot,&#x201D; &#x201C;feature selection,&#x201D; and &#x201C;pipeline automation&#x201D;), (3) data types of interest (&#x201C;genom*,&#x201D; &#x201C;DNA,&#x201D; &#x201C;SNP,&#x201D; &#x201C;gene expression,&#x201D; &#x201C;epigenetic,&#x201D; and &#x201C;GWAS&#x201D;; &#x201C;diet,&#x201D; &#x201C;physical activity,&#x201D; &#x201C;sleep,&#x201D; and &#x201C;lifestyle&#x201D;; &#x201C;pollution,&#x201D; &#x201C;air quality,&#x201D; &#x201C;urban,&#x201D; &#x201C;deprivation,&#x201D; and &#x201C;exposure&#x201D;; and &#x201C;combined model,&#x201D; &#x201C;multi-input,&#x201D; and &#x201C;fusion model&#x201D;), and (4) prediction (&#x201C;predict*,&#x201D; &#x201C;forecast*,&#x201D; &#x201C;risk model*,&#x201D; &#x201C;classification model*,&#x201D; and &#x201C;risk prediction&#x201D;). This strategy was adapted and applied across 6 databases: PubMed, Scopus, Web of Science, IEEE Xplore, Google Scholar, and Embase. Filters were used to limit the search to original scientific articles published between January 2015 and May 2025 in English or French.</p></sec><sec id="s2-4"><title>Study Selection and Reference Management</title><p>All 851 retrieved studies were imported into Covidence (Veritas Health Innovation), and duplicates were removed. Title and abstract screening were performed independently by 2 reviewers, with ChatGPT (OpenAI) acting as an AI-based third reviewer for adjudication. Articles deemed potentially relevant (59/743, 7.9%) underwent full-text assessment against the predefined eligibility criteria using the same dual-reviewer process and AI-assisted adjudication.</p></sec><sec id="s2-5"><title>Data Extraction and Synthesis</title><p>Data extraction for the final 22.0% (13/59) of the studies was conducted in Covidence using a standardized form pretested on 3 to 5 studies. Extracted fields covered bibliographic details, study context, design, population, data types, predictors, AutoML implementation, performance metrics, interpretability, reproducibility, limitations, and clinical relevance. All data were cross-checked for completeness and consistency. ChatGPT served as an AI-assisted third reviewer solely to support adjudication in cases of disagreement by summarizing relevant methodological elements; final decisions were reached by consensus between human reviewers and were not determined by AI-generated outputs. All final inclusion decisions were verified and confirmed by human assessors, strengthening methodological rigor. The extracted study-level data are provided in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>.</p></sec><sec id="s2-6"><title>Data Analysis</title><p>Extracted data were narratively synthesized and summarized in tables, detailing study methods, data types, AutoML approaches, and key performance metrics, including calibration. The analysis emphasized validation strategies, interpretability, and clinical applicability. All synthesis steps were cross-checked by ChatGPT as an AI-based third reviewer to ensure coherence. Risk of bias was assessed using the PROBAST (Prediction Model Risk of Bias Assessment Tool)+AI tool [<xref ref-type="bibr" rid="ref7">7</xref>], evaluating participants, predictors, outcomes, and analysis domains.</p></sec></sec><sec id="s3" sec-type="results"><title>Results</title><sec id="s3-1"><title>Study Selection</title><p>The database search yielded 851 records, of which 743 (87.3%) were screened. Following title and abstract screening and full-text review, 13 studies published between 2017 and 2025 met the eligibility criteria (<xref ref-type="fig" rid="figure1">Figure 1</xref>; <xref ref-type="supplementary-material" rid="app2">Checklist 1</xref>).</p><p>The studies spanned Brazil, Greece, India, Australia, South Korea, Pakistan, China, Spain, the United States, Japan, and Iraq and used a variety of designs. Most were observational (prospective or retrospective), although 1 study conducted in 2022 by Mora-Ortiz et al [<xref ref-type="bibr" rid="ref13">13</xref>] used a randomized controlled trial dataset. Among the 13 included studies, 2 (15.4%) used fully automated pipelines, 1 (7.7%) used semiautomated workflows, and 10 (76.9%) relied predominantly on manual ML approaches. Sample sizes ranged from 183 participants in a targeted clinical trial to 25,406 participants in a large community-based cohort.</p><fig position="float" id="figure1"><label>Figure 1.</label><caption><p>PRISMA (Preferred Reporting Items for Systematic Reviews and Meta-Analyses) flow diagram of study selection.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="ai_v5i1e87819_fig01.png"/></fig></sec><sec id="s3-2"><title>Scope of Outcomes</title><p>Not all studies predicted incident T2D. Several addressed related but distinct outcomes, including diagnosis, disease subtyping, or engagement in prevention programs. These outcomes differ fundamentally in clinical meaning, prediction horizon, and class balance. Consequently, performance metrics such as the area under the receiver operating characteristic curve (AUROC) or accuracy are not directly comparable across studies, and apparent differences in performance should be interpreted with caution. Therefore, AUROC values derived from these different prediction tasks should not be interpreted as directly comparable.</p></sec><sec id="s3-3"><title>Data Sources and Feature Types</title><p>Clinical variables, such as anthropometry, biochemical measures, and demographics, were the most common predictors. Behavioral variables appeared in several studies; genomic and environmental features were rare or absent. Data sources included large public cohorts (eg, Brazilian Longitudinal Study of Adult Health, English Longitudinal Study of Ageing&#x2013;UK, Korean Genome and Epidemiology Study, and University of California, Irvine repositories); commercial platforms (eg, Noom); and local hospital records. The number of predictors ranged from fewer than 10 to more than 200.</p></sec><sec id="s3-4"><title>AutoML Tools and Modeling Approaches</title><p>A few studies used general-purpose AutoML frameworks (eg, Tree-Based Pipeline Optimization Tool [TPOT], H2O AutoML, and Azure Machine Learning), while many relied on partially automated or traditional workflows. Common algorithms included random forests, gradient-boosted methods, artificial neural networks, and logistic regression. Most studies combined limited automation (eg, feature selection or tuning) with manual preprocessing, corresponding to semiautomated pipelines under the operational definition used in this review.</p></sec><sec id="s3-5"><title>Validation Strategies</title><p>Internal validation was common, particularly 10-fold cross-validation and holdout splits (eg, 70/30 or 80/20), often with stratified or repeated sampling. External or prospective validation was reported in a small subset, and performance sometimes declined compared with internal results. A few studies incorporated external or prospective validation [<xref ref-type="bibr" rid="ref14">14</xref>,<xref ref-type="bibr" rid="ref15">15</xref>]; however, these were the exception.</p></sec><sec id="s3-6"><title>Model Performance</title><p>Reported performance varied by dataset, outcome definition, and modeling approach. AUROC values ranged from approximately 0.74 to 0.99 across studies, and accuracy ranged from approximately 75% to 97.7%. In some cases, AutoML-derived models outperformed established clinical risk scores; for instance, Fazakis et al [<xref ref-type="bibr" rid="ref4">4</xref>] achieved an AUROC of 0.884 compared with 0.821 for the Finnish Diabetes Risk Score (FINDRISC). AUROC values near 0.99 were observed primarily in training or test splits or for nonincidence tasks (eg, engagement prediction in digital prevention programs), and these often lacked external validation [<xref ref-type="bibr" rid="ref4">4</xref>]. However, calibration measures and decision-analytic metrics were rarely reported, limiting the clinical interpretability of high AUROC values.</p></sec><sec id="s3-7"><title>Interpretability and Reproducibility</title><p>Most studies included some form of interpretability, such as feature importance rankings, Shapley additive explanations (SHAP) values, or Boruta-based feature selection. Reproducibility was rarely addressed: few studies provided open-source code, complete model parameters, or complete datasets.</p></sec><sec id="s3-8"><title>Clinical Readiness</title><p>Although several studies discussed potential clinical applications, only a minority incorporated elements aligned with real-world implementation, such as prospective validation, workflow integration, or usability testing for clinicians. Overall, methodological performance was often high, but concrete steps toward clinical adoption remained limited.</p></sec><sec id="s3-9"><title>Risk of Bias: PROBAST Assessment</title><p>A risk-of-bias assessment using the PROBAST framework examined 4 domains: participants, predictors, outcomes, and analysis.</p><p>In the participants domain, most studies showed a high risk of bias, although populations were generally well defined and clinically relevant [<xref ref-type="bibr" rid="ref16">16</xref>,<xref ref-type="bibr" rid="ref17">17</xref>].</p><p>The predictors domain was more heterogeneous: some studies used automated feature selection methods such as least absolute shrinkage and selection operator (LASSO) or SHAP, while others relied on manual or poorly documented approaches, leading to moderate to high risk of bias. In the outcome domain, risk was low, as predictive targets were consistently well defined [<xref ref-type="bibr" rid="ref4">4</xref>,<xref ref-type="bibr" rid="ref14">14</xref>,<xref ref-type="bibr" rid="ref16">16</xref>,<xref ref-type="bibr" rid="ref18">18</xref>].</p><p>Regarding analysis, most studies applied appropriate validation techniques (cross-validation, training or test splits, or external validation), although a few lacked sufficient methodological detail [<xref ref-type="bibr" rid="ref12">12</xref>,<xref ref-type="bibr" rid="ref18">18</xref>-<xref ref-type="bibr" rid="ref20">20</xref>].</p><p>Overall, approximately one-third of studies were at high risk of bias, one-third at moderate risk, and only a few at low risk across all PROBAST domains.</p><p>Across studies, the PROBAST domains most frequently associated with high risk of bias were predictor selection and analysis, often due to manual feature selection, limited reporting of preprocessing steps, or the lack of external validation. Studies using more automated and standardized pipelines tended to show lower risk in the predictors domain but not necessarily in the analysis domain. Notably, very high AUROC values were more frequently observed in studies with a higher overall risk of bias.</p></sec></sec><sec id="s4" sec-type="discussion"><title>Discussion</title><sec id="s4-1"><title>Principal Findings</title><p>In this review, clinical readiness was defined as the presence of key elements required for real-world deployment, including external validation, calibration reporting, assessment of clinical utility, workflow integration, and interpretability for end users. The included studies spanned multiple regions and addressed heterogeneous objectives, such as early screening, cardiovascular risk stratification, T2D subtyping, and support for digital prevention programs [<xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref16">16</xref>-<xref ref-type="bibr" rid="ref18">18</xref>]. This diversity reflects the breadth of current AutoML applications in diabetes research but also underscores the need for caution when comparing performance across fundamentally different prediction tasks.</p><p>From a methodological standpoint, supervised algorithms such as random forest, extreme gradient boosting (XGBoost), and light gradient boosting machine were predominant, balancing performance and interpretability. Several studies used SHAP or decision trees to identify key predictors and improve clinical usability [<xref ref-type="bibr" rid="ref4">4</xref>,<xref ref-type="bibr" rid="ref14">14</xref>]. However, most relied on retrospective, single-center data, with limited external validation and potential selection bias [<xref ref-type="bibr" rid="ref12">12</xref>,<xref ref-type="bibr" rid="ref14">14</xref>,<xref ref-type="bibr" rid="ref16">16</xref>]. This gap between methodological rigor and generalizability remains a major barrier to clinical translation.</p><p>Bias also arose from manual predictor selection [<xref ref-type="bibr" rid="ref16">16</xref>,<xref ref-type="bibr" rid="ref18">18</xref>]. In contrast, studies embedding techniques such as LASSO or Boruta within automated or semiautomated pipelines demonstrated improved standardization [<xref ref-type="bibr" rid="ref4">4</xref>,<xref ref-type="bibr" rid="ref14">14</xref>,<xref ref-type="bibr" rid="ref17">17</xref>]. In this review, such techniques were considered part of AutoML only when integrated into an automated workflow rather than applied as standalone methods. Fully automated AutoML pipelines&#x2014;encompassing preprocessing, feature selection, and hyperparameter tuning&#x2014;remained rare; only 1 study implemented Azure Machine Learning without complete pipeline automation [<xref ref-type="bibr" rid="ref19">19</xref>]. Nevertheless, a gradual shift toward semiautomated and externally validated approaches was observed over time [<xref ref-type="bibr" rid="ref12">12</xref>,<xref ref-type="bibr" rid="ref14">14</xref>].</p><p>Reported performance was high (area under the curve=0.74-0.99), but comparability suffered from heterogeneous outcomes and metrics [<xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref18">18</xref>]. Few studies reported calibration or predictive value measures, despite their importance for clinical risk prediction. Reproducibility also remained a major weakness, with no study sharing full code or modeling pipelines, contrary to open science recommendations [<xref ref-type="bibr" rid="ref4">4</xref>,<xref ref-type="bibr" rid="ref14">14</xref>]. Overall, AutoML approaches did not consistently outperform non-AutoML models under rigorous validation conditions, underscoring the primacy of external validation and calibration over nominal performance gains, particularly across heterogeneous prediction tasks.</p><p>Finally, interpretability remains a key challenge, as AutoML systems are often perceived as &#x201C;black boxes&#x201D; [<xref ref-type="bibr" rid="ref11">11</xref>]. Integrating explainable AI tools such as SHAP, local interpretable model-agnostic explanations, and integrated gradients directly into AutoML frameworks (eg, AutoGluon) could enhance transparency and usability, thereby supporting clinical adoption [<xref ref-type="bibr" rid="ref11">11</xref>]. Future research should prioritize data diversity; prospective multicenter validation; and the development of standardized, shareable AutoML pipelines to facilitate reproducibility and real-world implementation [<xref ref-type="bibr" rid="ref4">4</xref>,<xref ref-type="bibr" rid="ref12">12</xref>,<xref ref-type="bibr" rid="ref14">14</xref>].</p><p>Notably, none of the reviewed studies included genomic data, despite its potential to improve prediction accuracy. Beyond technical considerations, practical barriers such as cost, limited availability of genomic data in routine care, population-specific transferability of polygenic risk scores, and data governance constraints likely contribute to the absence of genomic predictors in current AutoML-based T2D models. Nevertheless, existing evidence suggests that integrating polygenic risk information could enhance future AutoML-based prediction models [<xref ref-type="bibr" rid="ref17">17</xref>].</p></sec><sec id="s4-2"><title>Reported Limitations and Author Suggestions</title><p>The included studies reported several recurring limitations, notably the reliance on regional or hospital-based datasets, limited external or prospective validation, and incomplete integration of behavioral or genomic predictors. Authors consistently emphasized the need for broader and more diverse predictor sets, multicenter study designs, and prospective validation. Taken together, these limitations mirror the methodological and clinical gaps identified in this review and underscore the need for standardized, explainable, and reproducible AutoML pipelines oriented toward real-world clinical use.</p></sec><sec id="s4-3"><title>Conclusions</title><p>This rapid review underscores the promising yet underrealized potential of AutoML for predicting T2D risk. Across 13 studies (2017&#x2010;2025), models showed strong discrimination and a growing use of interpretable methods (eg, SHAP and decision trees). However, clinical translation remains constrained by local or retrospective data; limited external validation; and the absence of fully automated, reproducible pipelines.</p><p>To overcome these gaps, future research should adopt prospective, multicenter designs and integrate diverse data sources&#x2014;clinical, behavioral, environmental, and omics data. Developing standardized, transparent, and shareable AutoML frameworks is essential for building trust and enabling real-world applications.</p><p>Some actionable recommendations are as follows:</p><list list-type="bullet"><list-item><p>Ensure open access to code, trained models, and reproducible pipelines</p></list-item><list-item><p>Promote multicenter, demographically diverse cohorts, explicitly including genomic and other omic features</p></list-item><list-item><p>Benchmark explainable AutoML frameworks (eg, SHAP integrated with AutoGluon) under prospective, externally validated conditions, with calibration and clinical utility metrics reported alongside AUROC</p></list-item></list><p>Collectively, these actions can transform AutoML from a high-performing research tool into a transparent, reliable decision support system with tangible public health benefits.</p></sec></sec></body><back><ack><p>During the preparation of this manuscript, GPT-4o (OpenAI), a generative language model, was used via the ChatGPT interface to assist with translation, linguistic revision, structural refinement, and clarity enhancement. The authors also used ChatGPT to support narrative development and thematic clarification throughout the writing process, in accordance with emerging evidence on the constructive role of generative artificial intelligence (AI) in meaning-making and reflective synthesis in academic contexts. All AI-generated outputs were carefully reviewed, edited, and approved by the authors and by relevant professionals to ensure accuracy, relevance, and adherence to principles of responsible use of generative AI in scholarly writing. The final version of the manuscript was subsequently reviewed by a professional proofreader to ensure clarity and consistency.</p></ack><notes><sec><title>Funding</title><p>The authors declare that no financial support was received for this work.</p></sec><sec><title>Data Availability</title><p>The data analyzed in this rapid review were extracted from the published articles included in the review. The extracted study-level data are available in Multimedia Appendix 1.</p><p/></sec></notes><fn-group><fn fn-type="con"><p>Conceptualization: A Castonguay, SH-D</p><p>Data curation: A Castonguay, SH-D</p><p>Formal analysis: SH-D, AG</p><p>Methodology: A Castonguay, SH-D, AG</p><p>Project administration: A Castonguay, SH-D</p><p>Supervision: A Castonguay, SH-D</p><p>Validation: A Chatton</p><p>Writing&#x2014;original draft: A Castonguay, SH-D</p><p>Writing&#x2014;review and editing: A Castonguay, SH-D, A Chatton, AG</p></fn></fn-group><glossary><title>Abbreviations</title><def-list><def-item><term id="abb1">AI</term><def><p>artificial intelligence</p></def></def-item><def-item><term id="abb2">AUROC</term><def><p>area under the receiver operating characteristic curve</p></def></def-item><def-item><term id="abb3">AutoML</term><def><p>automated machine learning</p></def></def-item><def-item><term id="abb4">FINDRISC</term><def><p>Finnish Diabetes Risk Score</p></def></def-item><def-item><term id="abb5">LASSO</term><def><p>least absolute shrinkage and selection operator</p></def></def-item><def-item><term id="abb6">ML</term><def><p>machine learning</p></def></def-item><def-item><term id="abb7">PICO</term><def><p>population, intervention, comparator, and outcome</p></def></def-item><def-item><term id="abb8">PRISMA</term><def><p>Preferred Reporting Items for Systematic Reviews and Meta-Analyses</p></def></def-item><def-item><term id="abb9">PRISMA-ScR</term><def><p>Preferred Reporting Items for Systematic Reviews and Meta-Analyses extension for Scoping Reviews</p></def></def-item><def-item><term id="abb10">PROBAST</term><def><p>Prediction Model Risk of Bias Assessment Tool</p></def></def-item><def-item><term id="abb11">SHAP</term><def><p>Shapley additive explanations</p></def></def-item><def-item><term id="abb12">T2D</term><def><p>type 2 diabetes</p></def></def-item><def-item><term id="abb13">TPOT</term><def><p>Tree-Based Pipeline Optimization Tool</p></def></def-item><def-item><term id="abb14">XGBoost</term><def><p>extreme gradient boosting</p></def></def-item></def-list></glossary><ref-list><title>References</title><ref id="ref1"><label>1</label><nlm-citation citation-type="report"><article-title>IDF Diabetes Atlas 2025</article-title><access-date>2026-04-08</access-date><publisher-name>International Diabetes Federation</publisher-name><comment><ext-link ext-link-type="uri" xlink:href="https://diabetesatlas.org/resources/idf-diabetes-atlas-2025/">https://diabetesatlas.org/resources/idf-diabetes-atlas-2025/</ext-link></comment></nlm-citation></ref><ref id="ref2"><label>2</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><collab>American Diabetes Association Professional Practice Committee</collab></person-group><article-title>3. Prevention or delay of diabetes and associated comorbidities: Standards of Care in Diabetes-2025</article-title><source>Diabetes Care</source><year>2025</year><month>01</month><day>1</day><volume>48</volume><issue>1 Suppl 1</issue><fpage>S50</fpage><lpage>S58</lpage><pub-id pub-id-type="doi">10.2337/dc25-S003</pub-id><pub-id pub-id-type="medline">39651971</pub-id></nlm-citation></ref><ref id="ref3"><label>3</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kodama</surname><given-names>S</given-names> </name><name name-style="western"><surname>Fujihara</surname><given-names>K</given-names> </name><name name-style="western"><surname>Horikawa</surname><given-names>C</given-names> </name><etal/></person-group><article-title>Predictive ability of current machine learning algorithms for type&#x2009;2 diabetes mellitus: a meta-analysis</article-title><source>J Diabetes Investig</source><year>2022</year><month>05</month><volume>13</volume><issue>5</issue><fpage>900</fpage><lpage>908</lpage><pub-id pub-id-type="doi">10.1111/jdi.13736</pub-id><pub-id pub-id-type="medline">34942059</pub-id></nlm-citation></ref><ref id="ref4"><label>4</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Fazakis</surname><given-names>N</given-names> </name><name name-style="western"><surname>Kocsis</surname><given-names>O</given-names> </name><name name-style="western"><surname>Dritsas</surname><given-names>E</given-names> </name><name name-style="western"><surname>Alexiou</surname><given-names>S</given-names> </name><name name-style="western"><surname>Fakotakis</surname><given-names>N</given-names> </name><name name-style="western"><surname>Moustakas</surname><given-names>K</given-names> </name></person-group><article-title>Machine learning tools for long-term type 2 diabetes risk prediction</article-title><source>IEEE Access</source><year>2021</year><volume>9</volume><fpage>103737</fpage><lpage>103757</lpage><pub-id pub-id-type="doi">10.1109/ACCESS.2021.3098691</pub-id></nlm-citation></ref><ref id="ref5"><label>5</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Wynants</surname><given-names>L</given-names> </name><name name-style="western"><surname>Van Calster</surname><given-names>B</given-names> </name><name name-style="western"><surname>Collins</surname><given-names>GS</given-names> </name><etal/></person-group><article-title>Prediction models for diagnosis and prognosis of Covid-19: systematic review and critical appraisal</article-title><source>BMJ</source><year>2020</year><month>04</month><day>7</day><volume>369</volume><fpage>m1328</fpage><pub-id pub-id-type="doi">10.1136/bmj.m1328</pub-id><pub-id pub-id-type="medline">32265220</pub-id></nlm-citation></ref><ref id="ref6"><label>6</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Christodoulou</surname><given-names>E</given-names> </name><name name-style="western"><surname>Ma</surname><given-names>J</given-names> </name><name name-style="western"><surname>Collins</surname><given-names>GS</given-names> </name><name name-style="western"><surname>Steyerberg</surname><given-names>EW</given-names> </name><name name-style="western"><surname>Verbakel</surname><given-names>JY</given-names> </name><name name-style="western"><surname>Van Calster</surname><given-names>B</given-names> </name></person-group><article-title>A systematic review shows no performance benefit of machine learning over logistic regression for clinical prediction models</article-title><source>J Clin Epidemiol</source><year>2019</year><month>06</month><volume>110</volume><fpage>12</fpage><lpage>22</lpage><pub-id pub-id-type="doi">10.1016/j.jclinepi.2019.02.004</pub-id><pub-id pub-id-type="medline">30763612</pub-id></nlm-citation></ref><ref id="ref7"><label>7</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Moons</surname><given-names>KGM</given-names> </name><name name-style="western"><surname>Damen</surname><given-names>JAA</given-names> </name><name name-style="western"><surname>Kaul</surname><given-names>T</given-names> </name><etal/></person-group><article-title>PROBAST+AI: an updated quality, risk of bias, and applicability assessment tool for prediction models using regression or artificial intelligence methods</article-title><source>BMJ</source><year>2025</year><month>03</month><day>24</day><volume>388</volume><fpage>e082505</fpage><pub-id pub-id-type="doi">10.1136/bmj-2024-082505</pub-id><pub-id pub-id-type="medline">40127903</pub-id></nlm-citation></ref><ref id="ref8"><label>8</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>He</surname><given-names>X</given-names> </name><name name-style="western"><surname>Zhao</surname><given-names>K</given-names> </name><name name-style="western"><surname>Chu</surname><given-names>X</given-names> </name></person-group><article-title>AutoML: a survey of the state-of-the-art</article-title><source>Knowl Based Syst</source><year>2021</year><month>01</month><volume>212</volume><fpage>106622</fpage><pub-id pub-id-type="doi">10.1016/j.knosys.2020.106622</pub-id></nlm-citation></ref><ref id="ref9"><label>9</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>Lundberg</surname><given-names>SM</given-names> </name><name name-style="western"><surname>Lee</surname><given-names>SI</given-names> </name></person-group><article-title>A unified approach to interpreting model predictions</article-title><access-date>2026-04-08</access-date><conf-name>NIPS&#x2019;17: Proceedings of the 31st International Conference on Neural Information Processing Systems</conf-name><conf-date>Dec 4-9, 2017</conf-date><comment><ext-link ext-link-type="uri" xlink:href="https://papers.nips.cc/paper_files/paper/2017/hash/8a20a8621978632d76c43dfd28b67767-Abstract.html">https://papers.nips.cc/paper_files/paper/2017/hash/8a20a8621978632d76c43dfd28b67767-Abstract.html</ext-link></comment></nlm-citation></ref><ref id="ref10"><label>10</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Zimmer</surname><given-names>L</given-names> </name><name name-style="western"><surname>Lindauer</surname><given-names>M</given-names> </name><name name-style="western"><surname>Hutter</surname><given-names>F</given-names> </name></person-group><article-title>Auto-PyTorch: multi-fidelity metalearning for efficient and robust AutoDL</article-title><source>IEEE Trans Pattern Anal Mach Intell</source><year>2021</year><month>09</month><volume>43</volume><issue>9</issue><fpage>3079</fpage><lpage>3090</lpage><pub-id pub-id-type="doi">10.1109/TPAMI.2021.3067763</pub-id><pub-id pub-id-type="medline">33750687</pub-id></nlm-citation></ref><ref id="ref11"><label>11</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Hasan</surname><given-names>R</given-names> </name><name name-style="western"><surname>Dattana</surname><given-names>V</given-names> </name><name name-style="western"><surname>Mahmood</surname><given-names>S</given-names> </name><name name-style="western"><surname>Hussain</surname><given-names>S</given-names> </name></person-group><article-title>Towards transparent diabetes prediction: combining AutoML and explainable AI for improved clinical insights</article-title><source>Information</source><year>2025</year><volume>16</volume><issue>1</issue><fpage>7</fpage><pub-id pub-id-type="doi">10.3390/info16010007</pub-id></nlm-citation></ref><ref id="ref12"><label>12</label><nlm-citation citation-type="book"><person-group person-group-type="author"><name name-style="western"><surname>Huang</surname><given-names>HY</given-names> </name><name name-style="western"><surname>Khan</surname><given-names>A</given-names> </name><name name-style="western"><surname>Parikh</surname><given-names>C</given-names> </name><etal/></person-group><person-group person-group-type="editor"><name name-style="western"><surname>Dash</surname><given-names>S</given-names> </name><name name-style="western"><surname>Pani</surname><given-names>SK</given-names> </name><name name-style="western"><surname>Susilo</surname><given-names>W</given-names> </name><name name-style="western"><surname>Bernard,</surname><given-names>CM</given-names> </name><name name-style="western"><surname>Tse</surname><given-names>G</given-names> </name></person-group><article-title>Machine learning-based predictive model for type 2 diabetes mellitus using genetic and clinical data</article-title><source>Internet of Things and Machine Learning for Type I and Type II Diabetes</source><year>2024</year><publisher-name>Elsevier Science</publisher-name><fpage>177</fpage><lpage>185</lpage><pub-id pub-id-type="doi">10.1016/B978-0-323-95686-4.00013-7</pub-id></nlm-citation></ref><ref id="ref13"><label>13</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Mora-Ortiz</surname><given-names>M</given-names> </name><name name-style="western"><surname>Alcala-Diaz</surname><given-names>JF</given-names> </name><name name-style="western"><surname>Rangel-Zu&#x00F1;iga</surname><given-names>OA</given-names> </name><etal/></person-group><article-title>Metabolomics analysis of type 2 diabetes remission identifies 12 metabolites with predictive capacity: a CORDIOPREV clinical trial study</article-title><source>BMC Med</source><year>2022</year><month>10</month><day>27</day><volume>20</volume><issue>1</issue><fpage>373</fpage><pub-id pub-id-type="doi">10.1186/s12916-022-02566-z</pub-id><pub-id pub-id-type="medline">36289459</pub-id></nlm-citation></ref><ref id="ref14"><label>14</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Ji</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Shang</surname><given-names>H</given-names> </name><name name-style="western"><surname>Yi</surname><given-names>J</given-names> </name><name name-style="western"><surname>Zang</surname><given-names>W</given-names> </name><name name-style="western"><surname>Cao</surname><given-names>W</given-names> </name></person-group><article-title>Machine learning-based models to predict type 2 diabetes combined with coronary heart disease and feature analysis-based on interpretable SHAP</article-title><source>Acta Diabetol</source><year>2025</year><month>10</month><volume>62</volume><issue>10</issue><fpage>1631</fpage><lpage>1646</lpage><pub-id pub-id-type="doi">10.1007/s00592-025-02496-1</pub-id><pub-id pub-id-type="medline">40167635</pub-id></nlm-citation></ref><ref id="ref15"><label>15</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Rodriguez</surname><given-names>DV</given-names> </name><name name-style="western"><surname>Chen</surname><given-names>J</given-names> </name><name name-style="western"><surname>Viswanadham</surname><given-names>RVN</given-names> </name><name name-style="western"><surname>Lawrence</surname><given-names>K</given-names> </name><name name-style="western"><surname>Mann</surname><given-names>D</given-names> </name></person-group><article-title>Leveraging machine learning to develop digital engagement phenotypes of users in a digital diabetes prevention program: evaluation study</article-title><source>JMIR AI</source><year>2024</year><month>03</month><day>1</day><volume>3</volume><fpage>e47122</fpage><pub-id pub-id-type="doi">10.2196/47122</pub-id><pub-id pub-id-type="medline">38875579</pub-id></nlm-citation></ref><ref id="ref16"><label>16</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Abdalrada</surname><given-names>AS</given-names> </name><name name-style="western"><surname>Abawajy</surname><given-names>J</given-names> </name><name name-style="western"><surname>Al-Quraishi</surname><given-names>T</given-names> </name><name name-style="western"><surname>Islam</surname><given-names>SMS</given-names> </name></person-group><article-title>Machine learning models for prediction of co-occurrence of diabetes and cardiovascular diseases: a retrospective cohort study</article-title><source>J Diabetes Metab Disord</source><year>2022</year><month>06</month><volume>21</volume><issue>1</issue><fpage>251</fpage><lpage>261</lpage><pub-id pub-id-type="doi">10.1007/s40200-021-00968-z</pub-id><pub-id pub-id-type="medline">35673486</pub-id></nlm-citation></ref><ref id="ref17"><label>17</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Liu</surname><given-names>Q</given-names> </name><name name-style="western"><surname>Zhang</surname><given-names>M</given-names> </name><name name-style="western"><surname>He</surname><given-names>Y</given-names> </name><etal/></person-group><article-title>Predicting the risk of incident type 2 diabetes mellitus in Chinese elderly using machine learning techniques</article-title><source>J Pers Med</source><year>2022</year><month>05</month><day>31</day><volume>12</volume><issue>6</issue><fpage>905</fpage><pub-id pub-id-type="doi">10.3390/jpm12060905</pub-id><pub-id pub-id-type="medline">35743691</pub-id></nlm-citation></ref><ref id="ref18"><label>18</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Choi</surname><given-names>HY</given-names> </name><name name-style="western"><surname>Kim</surname><given-names>EY</given-names> </name><name name-style="western"><surname>Kim</surname><given-names>J</given-names> </name></person-group><article-title>Prognostic factors in diabetes: Comparison of chi-square automatic interaction detector (CHAID) decision tree technology and logistic regression</article-title><source>Medicine (Baltimore)</source><year>2022</year><month>10</month><day>21</day><volume>101</volume><issue>42</issue><fpage>e31343</fpage><pub-id pub-id-type="doi">10.1097/MD.0000000000031343</pub-id><pub-id pub-id-type="medline">36281142</pub-id></nlm-citation></ref><ref id="ref19"><label>19</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Daliya</surname><given-names>VK</given-names> </name><name name-style="western"><surname>Ramesh</surname><given-names>TK</given-names> </name></person-group><article-title>A cloud-based optimized ensemble model for risk prediction of diabetic progression&#x2014;an Azure machine learning perspective</article-title><source>IEEE Access</source><year>2025</year><volume>13</volume><fpage>11560</fpage><lpage>11575</lpage><pub-id pub-id-type="doi">10.1109/ACCESS.2025.3528033</pub-id></nlm-citation></ref><ref id="ref20"><label>20</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Laila</surname><given-names>UE</given-names> </name><name name-style="western"><surname>Mahboob</surname><given-names>K</given-names> </name><name name-style="western"><surname>Khan</surname><given-names>AW</given-names> </name><name name-style="western"><surname>Khan</surname><given-names>F</given-names> </name><name name-style="western"><surname>Taekeun</surname><given-names>W</given-names> </name></person-group><article-title>An ensemble approach to predict early-stage diabetes risk using machine learning: an empirical study</article-title><source>Sensors (Basel)</source><year>2022</year><month>07</month><day>13</day><volume>22</volume><issue>14</issue><fpage>5247</fpage><pub-id pub-id-type="doi">10.3390/s22145247</pub-id><pub-id pub-id-type="medline">35890927</pub-id></nlm-citation></ref></ref-list><app-group><supplementary-material id="app1"><label>Multimedia Appendix 1</label><p>Extraction study-level data.</p><media xlink:href="ai_v5i1e87819_app1.xlsx" xlink:title="XLSX File, 68 KB"/></supplementary-material><supplementary-material id="app2"><label>Checklist 1</label><p>PRISMA-ScR checklist.</p><media xlink:href="ai_v5i1e87819_app2.docx" xlink:title="DOCX File, 87 KB"/></supplementary-material></app-group></back></article>