<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article article-type="research-article" dtd-version="2.0" xmlns:xlink="http://www.w3.org/1999/xlink">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMIR</journal-id>
      <journal-id journal-id-type="nlm-ta">JMIR AI</journal-id>
      <journal-title>JMIR AI</journal-title>
      <issn pub-type="epub">2817-1705</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v3i1e56700</article-id>
      <article-id pub-id-type="pmid">39024008</article-id>
      <article-id pub-id-type="doi">10.2196/56700</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Enhancing Type 2 Diabetes Treatment Decisions With Interpretable Machine Learning Models for Predicting Hemoglobin A1c Changes: Machine Learning Model Development</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>El Emam</surname>
            <given-names>Khaled</given-names>
          </name>
        </contrib>
        <contrib contrib-type="editor">
          <name>
            <surname>Malin</surname>
            <given-names>Bradley</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Lim</surname>
            <given-names>Gilbert</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Jafarizadeh</surname>
            <given-names>Ali</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Kurasawa</surname>
            <given-names>Hisashi</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-7599-6277</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author" corresp="yes" equal-contrib="yes">
          <name name-style="western">
            <surname>Waki</surname>
            <given-names>Kayo</given-names>
          </name>
          <degrees>MPH, MD, PhD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <address>
            <institution>The University of Tokyo Hospital</institution>
            <addr-line>7-3-1 Hongo, Bunkyo-ku</addr-line>
            <addr-line>Tokyo, 113-8655</addr-line>
            <country>Japan</country>
            <phone>81 358006427</phone>
            <email>kwaki-tky@m.u-tokyo.ac.jp</email>
          </address>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-0046-2523</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author">
          <name name-style="western">
            <surname>Seki</surname>
            <given-names>Tomohisa</given-names>
          </name>
          <degrees>MD, PhD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-4281-135X</ext-link>
        </contrib>
        <contrib id="contrib4" contrib-type="author">
          <name name-style="western">
            <surname>Chiba</surname>
            <given-names>Akihiro</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-3110-2048</ext-link>
        </contrib>
        <contrib id="contrib5" contrib-type="author">
          <name name-style="western">
            <surname>Fujino</surname>
            <given-names>Akinori</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-3377-3539</ext-link>
        </contrib>
        <contrib id="contrib6" contrib-type="author">
          <name name-style="western">
            <surname>Hayashi</surname>
            <given-names>Katsuyoshi</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-5332-9729</ext-link>
        </contrib>
        <contrib id="contrib7" contrib-type="author">
          <name name-style="western">
            <surname>Nakahara</surname>
            <given-names>Eri</given-names>
          </name>
          <degrees>ME</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-0199-3249</ext-link>
        </contrib>
        <contrib id="contrib8" contrib-type="author">
          <name name-style="western">
            <surname>Haga</surname>
            <given-names>Tsuneyuki</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff4" ref-type="aff">4</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-1137-0547</ext-link>
        </contrib>
        <contrib id="contrib9" contrib-type="author">
          <name name-style="western">
            <surname>Noguchi</surname>
            <given-names>Takashi</given-names>
          </name>
          <degrees>MD, PhD</degrees>
          <xref rid="aff5" ref-type="aff">5</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-8895-5327</ext-link>
        </contrib>
        <contrib id="contrib10" contrib-type="author">
          <name name-style="western">
            <surname>Ohe</surname>
            <given-names>Kazuhiko</given-names>
          </name>
          <degrees>MD, PhD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-4296-9536</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>Nippon Telegraph and Telephone Corporation</institution>
        <addr-line>Tokyo</addr-line>
        <country>Japan</country>
      </aff>
      <aff id="aff2">
        <label>2</label>
        <institution>The University of Tokyo Hospital</institution>
        <addr-line>Tokyo</addr-line>
        <country>Japan</country>
      </aff>
      <aff id="aff3">
        <label>3</label>
        <institution>NTT DOCOMO, Inc</institution>
        <addr-line>Tokyo</addr-line>
        <country>Japan</country>
      </aff>
      <aff id="aff4">
        <label>4</label>
        <institution>NTT-AT IPS Corporation</institution>
        <addr-line>Kanagawa</addr-line>
        <country>Japan</country>
      </aff>
      <aff id="aff5">
        <label>5</label>
        <institution>National Center for Child Health and Development</institution>
        <addr-line>Tokyo</addr-line>
        <country>Japan</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Kayo Waki <email>kwaki-tky@m.u-tokyo.ac.jp</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <year>2024</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>18</day>
        <month>7</month>
        <year>2024</year>
      </pub-date>
      <volume>3</volume>
      <elocation-id>e56700</elocation-id>
      <history>
        <date date-type="received">
          <day>24</day>
          <month>1</month>
          <year>2024</year>
        </date>
        <date date-type="rev-request">
          <day>21</day>
          <month>3</month>
          <year>2024</year>
        </date>
        <date date-type="rev-recd">
          <day>21</day>
          <month>4</month>
          <year>2024</year>
        </date>
        <date date-type="accepted">
          <day>31</day>
          <month>5</month>
          <year>2024</year>
        </date>
      </history>
      <copyright-statement>©Hisashi Kurasawa, Kayo Waki, Tomohisa Seki, Akihiro Chiba, Akinori Fujino, Katsuyoshi Hayashi, Eri Nakahara, Tsuneyuki Haga, Takashi Noguchi, Kazuhiko Ohe. Originally published in JMIR AI (https://ai.jmir.org), 18.07.2024.</copyright-statement>
      <copyright-year>2024</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR AI, is properly cited. The complete bibliographic information, a link to the original publication on https://www.ai.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://ai.jmir.org/2024/1/e56700" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>Type 2 diabetes (T2D) is a significant global health challenge. Physicians need to assess whether future glycemic control will be poor on the current trajectory of usual care and usual-care treatment intensifications so that they can consider taking extra treatment measures to prevent poor outcomes. Predicting poor glycemic control from trends in hemoglobin A<sub>1c</sub> (HbA<sub>1c</sub>) levels is difficult due to the influence of seasonal fluctuations and other factors.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>We sought to develop a model that accurately predicts poor glycemic control among patients with T2D receiving usual care.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>Our machine learning model predicts poor glycemic control (HbA<sub>1c</sub>≥8%) using the transformer architecture, incorporating an attention mechanism to process irregularly spaced HbA<sub>1c</sub> time series and quantify temporal relationships of past HbA<sub>1c</sub> levels at each time point. We assessed the model using HbA<sub>1c</sub> levels from 7787 patients with T2D seeing specialist physicians at the University of Tokyo Hospital. The training data include instances of poor glycemic control occurring during usual care with usual-care treatment intensifications. We compared prediction accuracy, assessed with the area under the receiver operating characteristic curve, the area under the precision-recall curve, and the accuracy rate, to that of LightGBM.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>The area under the receiver operating characteristic curve, the area under the precision-recall curve, and the accuracy rate (95% confidence limits) of the proposed model were 0.925 (95% CI 0.923-0.928), 0.864 (95% CI 0.852-0.875), and 0.864 (95% CI 0.86-0.869), respectively. The proposed model achieved high prediction accuracy comparable to or surpassing LightGBM’s performance. The model prioritized the most recent HbA<sub>1c</sub> levels for predictions. Older HbA<sub>1c</sub> levels in patients with poor glycemic control were slightly more influential in predictions compared to patients with good glycemic control.</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>The proposed model accurately predicts poor glycemic control for patients with T2D receiving usual care, including patients receiving usual-care treatment intensifications, allowing physicians to identify cases warranting extraordinary treatment intensifications. If used by a nonspecialist, the model’s indication of likely future poor glycemic control may warrant a referral to a specialist. Future efforts could incorporate diverse and large-scale clinical data for improved accuracy.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>AI</kwd>
        <kwd>artificial intelligence</kwd>
        <kwd>attention weight</kwd>
        <kwd>type 2 diabetes</kwd>
        <kwd>blood glucose control</kwd>
        <kwd>machine learning</kwd>
        <kwd>transformer</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <p>Type 2 diabetes (T2D) affects an estimated 529 million people globally [<xref ref-type="bibr" rid="ref1">1</xref>]. Hemoglobin A<sub>1c</sub> (HbA<sub>1c</sub>) serves as an indicator of poor glycemic control, reflecting the average blood glucose levels over 1 to 2 months. An increase in HbA<sub>1c</sub> of 1 percentage point worsens cardiovascular disease risk by 1.2 times and mortality risk by 1.14 times [<xref ref-type="bibr" rid="ref2">2</xref>]. According to the American Diabetes Association <italic>Standards of Care in Diabetes</italic> [<xref ref-type="bibr" rid="ref3">3</xref>], target HbA<sub>1c</sub> levels are set at 7% for many adults who are nonpregnant and 8% for patients with limited life expectancy or where the harms of treatment are greater than the benefits.</p>
      <p>Physicians need to identify early signs of impending poor glycemic control in patients with T2D and act early to intensify treatment, via a combination of pharmacological and lifestyle interventions, to avoid poor outcomes. There are costs to intensified treatment, including side effects, so it is prudent to delay intensification until it is warranted by disease progression. Factors associated with poor glycemic control include age, duration of T2D treatment, treatment, race or ethnicity, and family history [<xref ref-type="bibr" rid="ref4">4</xref>-<xref ref-type="bibr" rid="ref7">7</xref>]. External factors such as seasonal variations affecting HbA<sub>1c</sub> levels [<xref ref-type="bibr" rid="ref8">8</xref>] complicate accurate glycemic control prediction.</p>
      <p>People with T2D receive care from primary care physicians, not T2D specialists, in many areas including the United States, Europe [<xref ref-type="bibr" rid="ref9">9</xref>], and Japan [<xref ref-type="bibr" rid="ref10">10</xref>]. For example, two-thirds of people with T2D in Japan receive care from primary care physicians [<xref ref-type="bibr" rid="ref10">10</xref>]. These nonspecialists may struggle to predict a patient’s glycemic control. In Japan, approximately 60% of surveyed patients with T2D treated by nonspecialists experienced poor glycemic control (HbA<sub>1c</sub>≥8%), with around 30% seeing worsened levels the following year, according to a survey on T2D treatment practices by primary care physicians [<xref ref-type="bibr" rid="ref10">10</xref>].</p>
      <p>Physicians regularly adjust a T2D patient’s treatment, intensifying treatment when the clinical indications lead them to predict poor glycemic control. Despite this usual care, including treatment intensification, some patients still experience poor glycemic control. From 2015 to 2018, a total of 49.5% of US community-dwelling adults with diabetes had HbA<sub>1c</sub>≥7% and 24.6% had HbA<sub>1c</sub>≥8% [<xref ref-type="bibr" rid="ref11">11</xref>]. A tool predicting poor glycemic control while under usual care, including usual-care treatment intensifications, could enhance treatment outcomes. It could alert physicians early enough to enable intensified modification of treatment, improving treatment outcomes for patients and increasing referrals to specialists when warranted by disease progression.</p>
      <p>Machine learning (ML) has demonstrated success in predicting patient symptoms, including forecasting the onset of T2D [<xref ref-type="bibr" rid="ref12">12</xref>] and predicting complications [<xref ref-type="bibr" rid="ref13">13</xref>], and it is a promising approach to predicting poor glycemic control, although to our knowledge it has not previously been applied to this task. Glycemic control data are in general irregularly spaced, reflecting the variability in patient care appointment dates, with updates to outpatient electronic health records (EHRs) occurring before and after clinical visits. Irregularly spaced data require preprocessing techniques such as interpolation, denoising autoencoders, and self-supervised learning [<xref ref-type="bibr" rid="ref14">14</xref>-<xref ref-type="bibr" rid="ref17">17</xref>]. Processing data with irregular intervals may hurt predictive performance [<xref ref-type="bibr" rid="ref18">18</xref>], requiring careful consideration in developing artificial intelligence models.</p>
      <p>Although ML models may provide good prediction performance, they often operate as “black boxes,” with opaque reasoning and associated poor interpretability that makes it difficult for both physicians and patients to understand the logical process guiding decision-making [<xref ref-type="bibr" rid="ref19">19</xref>]. To allow the interpretation of ML models, so that they are more acceptable to physicians [<xref ref-type="bibr" rid="ref20">20</xref>,<xref ref-type="bibr" rid="ref21">21</xref>] and patients [<xref ref-type="bibr" rid="ref22">22</xref>], explainable artificial intelligence (XAI) has been studied [<xref ref-type="bibr" rid="ref23">23</xref>]. It attempts to clarify temporal relationships of symptoms at each time point toward temporal interpretability based on patient trajectories [<xref ref-type="bibr" rid="ref24">24</xref>,<xref ref-type="bibr" rid="ref25">25</xref>], and this has been actively researched in the computer science field [<xref ref-type="bibr" rid="ref26">26</xref>].</p>
      <p>Since its introduction in 2017, the transformer model has excelled in various time-series predictive tasks, solidifying its position as a core technology across multiple fields [<xref ref-type="bibr" rid="ref27">27</xref>-<xref ref-type="bibr" rid="ref32">32</xref>]. The transformer model incorporates an attention mechanism simplifying the extraction of temporal relationships and setting it apart from other models [<xref ref-type="bibr" rid="ref33">33</xref>-<xref ref-type="bibr" rid="ref35">35</xref>]. The attention mechanism allows a model to selectively focus on different data points in the input sequence, assigning varying degrees of importance to each data point. Applied to the problem of predicting poor glycemic control, the attention mechanism can process irregularly spaced HbA<sub>1c</sub> time series and quantify temporal relationships of past HbA<sub>1c</sub> levels at each time point, following a model-specific approach in XAI [<xref ref-type="bibr" rid="ref36">36</xref>].</p>
      <p>This study aims to develop an ML tool that accurately and interpretably predicts poor glycemic control (HbA<sub>1c</sub>≥8%) using irregularly spaced HbA<sub>1c</sub> levels over the past year, in support of preventing T2D complications by enabling timely intensification of treatment. Although the treatment guidelines generally target an HbA<sub>1c</sub> level of 7% or lower [<xref ref-type="bibr" rid="ref3">3</xref>], higher levels are common in diabetes patients. In our clinical experience, levels of 8% and higher are a cause of great concern and trigger more intensive intervention. Accordingly, we have set 8% HbA<sub>1c</sub> as the threshold for defining poor glycemic control.</p>
      <p>Given the absence of prior studies in this specific area, we set target accuracy to be the receiver operating characteristic (ROC) area under the curve (AUC)&gt;0.9 and precision-recall (PR)–AUC&gt;0.8 based on our clinical endocrinology experience with diabetes treatment. These values are commonly used as a benchmark for good prediction accuracy in the ML field [<xref ref-type="bibr" rid="ref37">37</xref>] and are consistent with the ROC-AUCs of past diabetes-related ML tasks ranging from 0.819 to 0.934 [<xref ref-type="bibr" rid="ref38">38</xref>-<xref ref-type="bibr" rid="ref42">42</xref>].</p>
      <p>Drawing on our team’s prior work in self-management support for T2D treatment [<xref ref-type="bibr" rid="ref43">43</xref>] and predicting treatment discontinuations [<xref ref-type="bibr" rid="ref44">44</xref>,<xref ref-type="bibr" rid="ref45">45</xref>], we designed this task with the hope of overcoming barriers to implementing ML in clinical practice, believing it could significantly advance T2D diagnosis and treatment.</p>
      <p>We hypothesize that an ML model can predict poor glycemic control in patients with T2D under usual care. Our specific research question is whether a transformer-based model, incorporating temporal relationships of HbA<sub>1c</sub> levels, can accurately and interpretably predict instances of poor glycemic control (HbA<sub>1c</sub>≥8%). Our approach is novel in how it overcomes challenges posed by irregularly spaced HbA<sub>1c</sub> time series.</p>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Data Sets and Preprocessing</title>
        <p>All data were collected from EHRs at the University of Tokyo Hospital, which included 7787 patients who visited the hospital and had diagnostic codes indicative of T2D. The data were recorded in the EHRs between January 1, 2006, and December 31, 2015. The data, including treatment decisions and outcomes, were reflective of care by T2D specialists. Only HbA<sub>1c</sub> levels were used in the ML model.</p>
      </sec>
      <sec>
        <title>ML Models</title>
        <p>Given the irregularly spaced data, we organized the data into Monday-to-Sunday weeks and quantized the data to a single value per week, using the average in the case of multiple measurements and treating weeks with no values as having missing values [<xref ref-type="bibr" rid="ref46">46</xref>]. This approach allowed the ML model to treat irregularly spaced data spanning N years as regularly spaced data consisting of N×365/7 (rounded up to the nearest integer) values, that is, we treat all data as weekly data. We did not perform preprocessing, including interpolation, on missing values in the regularly spaced data. No normalization, outlier removal, or dimensionality reduction were performed on the HbA<sub>1c</sub> levels. Typical ML models such as LightGBM address missing values via interpolation or replacement before learning. In contrast, we adopted an approach that ignores and skips missing values.</p>
        <p>We designed a transformer model (<xref ref-type="table" rid="table1">Table 1</xref>) that takes as input an irregularly spaced time series of HbA<sub>1c</sub> levels spanning over the past year or more and outputs a binary assessment of poor glycemic control (HbA<sub>1c</sub>≥8%) within the subsequent year. The model incorporates 2 types of attention layers: self-attention, designed to extract temporal relationships from past irregularly spaced HbA<sub>1c</sub> levels, and cross-attention, used to predict poor glycemic control based on these temporal relationships. The self-attention weights are optimized through self-supervised learning. This involves the task of predicting the next HbA<sub>1c</sub> level using a time series of weekly spaced past HbA<sub>1c</sub> levels with missing values, where the past levels are used as both input and output. We use an attention mask mechanism that completely ignores missing values by setting their self-attention weight to 0, allowing us to learn using values with irregular spacing due to missing values as is. This is similar to the process of padding in language models. The cross-attention weights are optimized through supervised learning. This involves the task of predicting the class representing the likelihood of future poor glycemic control using the latent variables transformed by self-attention from the past HbA<sub>1c</sub> time series. We used causal masking in both learning tasks to prevent the model from referencing future data, ensuring that the model makes predictions considering the causal relationship between past symptoms and future symptoms. Conceptually, given that we constrained the model to improve interpretability, we expect a slightly lower prediction accuracy than that of an unconstrained model (<xref rid="figure1" ref-type="fig">Figure 1</xref>), and 1 goal is to minimize this interpretability penalty.</p>
        <table-wrap position="float" id="table1">
          <label>Table 1</label>
          <caption>
            <p>Model details (transformer architecture).</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="670"/>
            <col width="330"/>
            <thead>
              <tr valign="top">
                <td>Configure</td>
                <td>Value</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Encoder layers including self-attention blocks, n</td>
                <td>4</td>
              </tr>
              <tr valign="top">
                <td>Decoder layers including cross-attention blocks, n</td>
                <td>4</td>
              </tr>
              <tr valign="top">
                <td>Heads in the attention, n</td>
                <td>4</td>
              </tr>
              <tr valign="top">
                <td>Transformer hidden size, n</td>
                <td>128</td>
              </tr>
              <tr valign="top">
                <td>Transformer feedforward neural network hidden size, n</td>
                <td>512</td>
              </tr>
              <tr valign="top">
                <td>Optimizer method</td>
                <td>Adam</td>
              </tr>
              <tr valign="top">
                <td>Loss function</td>
                <td>Focal Loss</td>
              </tr>
              <tr valign="top">
                <td>Learning rate</td>
                <td>1×10<sup>–4</sup></td>
              </tr>
              <tr valign="top">
                <td>Batch size, n</td>
                <td>512</td>
              </tr>
              <tr valign="top">
                <td>Iterations, n</td>
                <td>20,000 (no early stopping)</td>
              </tr>
              <tr valign="top">
                <td>Library</td>
                <td>Python (version 3.11) and PyTorch (version 2.2.0)</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
        <fig id="figure1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>Conceptual trade-off between prediction accuracy and interpretability, for a given level of computational complexity.</p>
          </caption>
          <graphic xlink:href="ai_v3i1e56700_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <p>This model makes a yes or no decision on future poor glycemic control, with a threshold as a free variable allowing a tradeoff among true or false negatives or positives. We set the threshold to maximize the <italic>F</italic><sub>1</sub>-score (the harmonic mean of the ROC and PR values) using training data, resulting in a tool that made a binary prediction as to whether or not, in the next year, glycemic control will be poor. The training data include treatment intensification by specialists making their own assessments of likely future glycemic control. As such, the predicted poor glycemic control occurs despite any usual-care intensification of treatment prescribed by the attending specialist physicians. In other words, a prediction of poor glycemic control indicates a case likely warrants special attention and intervention, as usual-care intensification of treatment is predicted to be insufficient.</p>
      </sec>
      <sec>
        <title>Temporal Data Usage</title>
        <p>Our analysis sought to determine the length of the HbA<sub>1c</sub> time series needed to achieve the target accuracy. Training and testing were separated by period using the well-established time series prediction accuracy evaluation method [<xref ref-type="bibr" rid="ref47">47</xref>]. We used as a reference the date on which a patient took an HbA<sub>1c</sub> test in 2013. We used the HbA<sub>1c</sub> time series for the N years before the reference date as training input and the occurrence or absence of poor glycemic control (HbA<sub>1c</sub>≥8%) within 1 year from the reference date as the training output. Then, we tested the resulting model using the same procedure, but for the following year, 2014, selecting an appropriate choice for N, the length of training data. We evaluated the predictive performance of the resulting model using 7 years of test data, sliding the reference dates from 2007 to 2013, using the rolling-origin procedure [<xref ref-type="bibr" rid="ref47">47</xref>].</p>
        <p>The training input or output period and the testing output period do not overlap, and therefore there was no leakage into predictive evaluation. Data for a given patient will in general have some time samples in the training data and some in the test data, but since patient identification is not an input to the model, the model does not identify specific patients.</p>
      </sec>
      <sec>
        <title>Statistical Methods</title>
        <p>We analyzed the characteristics of patients in the data set using means, SDs, and frequency counts. We performed all statistical analyses using custom Python code. We used the <italic>Python</italic> (version 3.11) and <italic>PyTorch</italic> (version 2.2) libraries for developing the transformer model, the <italic>Numpy</italic> (version 1.26) and <italic>Pandas</italic> (version 2.2) libraries for managing data sets, and the <italic>scikit-learn</italic> (version 1.4) library for evaluating predictive accuracy.</p>
        <p>We compared our model with an established ML method recognized for high accuracy. There were no studies directly addressing our task, but validations on similar T2D prediction tasks favored LightGBM [<xref ref-type="bibr" rid="ref48">48</xref>,<xref ref-type="bibr" rid="ref49">49</xref>], making it our chosen reference for comparisons. While LightGBM is acknowledged for its superior predictive performance, it is not inherently interpretable. The model’s complexity and intricate decision tree paths make it difficult to provide a straightforward interpretation of its predictions. Our reference LightGBM model takes as input equally spaced HbA<sub>1c</sub> data and outputs a binary assessment of poor glycemic control (HbA<sub>1c</sub>≥8%).</p>
        <p>We compared the transformer model and LightGBM using the evaluation metrics of ROC-AUC, PR-AUC, accuracy rate, and <italic>F</italic><sub>1</sub>-score, with 95% CI using the bootstrap method.</p>
      </sec>
      <sec>
        <title>Ethical Considerations</title>
        <p>This study was approved by the Institutional Review Board of the University of Tokyo School of Medicine (10705-(3)) and was conducted per the Declaration of Helsinki. This was a retrospective, noninterventional database study without patient involvement. Confidentiality was safeguarded by the University of Tokyo Hospital. According to the Guidelines for Epidemiological Studies of the Ministry of Health, Labour and Welfare of Japan, written informed consent was not required. Information about this study was available to patients on a website, and patients have the right to cease registration of their data at any time [<xref ref-type="bibr" rid="ref50">50</xref>].</p>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>Patient Data</title>
        <p>We analyzed 7787 patients (<xref ref-type="table" rid="table2">Table 2</xref>). Although specialist physicians were providing usual care and prescribing treatment intensifications based on their clinical judgment, 57.83% (n=4504) of patients had an HbA<sub>1c</sub> over 8% at least once. The number of HbA<sub>1c</sub> tests per year was 7.7 (SD 2.8). In other words, the missingness level of weekly spaced past HbA<sub>1c</sub> levels for a year was 1 – 7.7 / ROUNDUP(365/7) = 85.5%. The age group with the highest number of individuals is the aged 70-80 years category, comprising 2347 people, accounting for 30.14% of the patients. In addition to diabetes, more than 45% of patients had diseases such as essential (primary) hypertension, hypertensive heart disease, pure hypercholesterolemia, and astigmatism. Each patient had multiple records, leading to 323,825 records used in our analysis.</p>
        <table-wrap position="float" id="table2">
          <label>Table 2</label>
          <caption>
            <p>Characteristics of patients.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="30"/>
            <col width="530"/>
            <col width="0"/>
            <col width="220"/>
            <col width="0"/>
            <col width="190"/>
            <thead>
              <tr valign="top">
                <td colspan="4">Characteristics</td>
                <td colspan="2">Records (n=323,825)</td>
                <td>Patients (n=7787)</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="7">
                  <bold>Feature used in the model</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="6">
                  <bold>HbA<sub>1c</sub><sup>a</sup></bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Mean (SD)</td>
                <td colspan="2">7.1 (1.1)</td>
                <td colspan="2">—<sup>b</sup></td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>&lt;6%, n (%)</td>
                <td colspan="2">42,495 (13.12)</td>
                <td colspan="2">4103 (52.69)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>6%-7%, n (%)</td>
                <td colspan="2">137,968 (42.61)</td>
                <td colspan="2">6666 (85.6)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>7%-8%, n (%)</td>
                <td colspan="2">89,875 (27.75)</td>
                <td colspan="2">5770 (74.1)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>≥8%, n (%)</td>
                <td colspan="2">53,487 (16.52)</td>
                <td colspan="2">4504 (57.84)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="2">Tests per year, mean (SD)</td>
                <td colspan="2">7.7 (2.8)</td>
                <td colspan="2">—</td>
              </tr>
              <tr valign="top">
                <td colspan="7">
                  <bold>Features not used in the model</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="6">
                  <bold>Gender</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Male, n (%)</td>
                <td colspan="2">193,976 (59.9)</td>
                <td colspan="2">4726 (60.7)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Female, n (%)</td>
                <td colspan="2">129,849 (40.1)</td>
                <td colspan="2">3061 (39.3)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="6">
                  <bold>Age (years)</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Mean (SD)</td>
                <td colspan="2">—</td>
                <td colspan="2">67.5 (13.6)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>10-20, n (%)</td>
                <td colspan="2">—</td>
                <td colspan="2">1 (0.01)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>20-30, n (%)</td>
                <td colspan="2">—</td>
                <td colspan="2">58 (0.74)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>30-40, n (%)</td>
                <td colspan="2">—</td>
                <td colspan="2">255 (3.27)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>40-50, n (%)</td>
                <td colspan="2">—</td>
                <td colspan="2">585 (7.51)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>50-60, n (%)</td>
                <td colspan="2">—</td>
                <td colspan="2">1006 (12.92)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>60-70, n (%)</td>
                <td colspan="2">—</td>
                <td colspan="2">2058 (26.43)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>70-80, n (%)</td>
                <td colspan="2">—</td>
                <td colspan="2">2347 (30.14)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>80-90, n (%)</td>
                <td colspan="2">—</td>
                <td colspan="2">1322 (16.98)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>90-100, n (%)</td>
                <td colspan="2">—</td>
                <td colspan="2">149 (1.91)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>100-110, n (%)</td>
                <td colspan="2">—</td>
                <td colspan="2">6 (0.08)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="6">
                  <bold>Top 10 most common diseases</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>E14: unspecified diabetes mellitus, n (%)</td>
                <td colspan="2">—</td>
                <td colspan="2">5495 (70.57)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>I10: essential (primary) hypertension, n (%)</td>
                <td colspan="2">—</td>
                <td colspan="2">5023 (64.5)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>E11: hypertensive heart disease, n (%)</td>
                <td colspan="2">—</td>
                <td colspan="2">3715 (47.71)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>E780: pure hypercholesterolemia, n (%)</td>
                <td colspan="2">—</td>
                <td colspan="2">3661 (47.01)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>H522: astigmatism, n (%)</td>
                <td colspan="2">—</td>
                <td colspan="2">3636 (46.69)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>E785: hyperlipidemia, unspecified, n (%)</td>
                <td colspan="2">—</td>
                <td colspan="2">3490 (44.82)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>K590: constipation, n (%)</td>
                <td colspan="2">—</td>
                <td colspan="2">3353 (43.06)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>K210: gastro-esophageal reflux disease with esophagitis, n (%)</td>
                <td colspan="2">—</td>
                <td colspan="2">2937 (37.72)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>K295: chronic gastritis, unspecified, n (%)</td>
                <td colspan="2">—</td>
                <td colspan="2">2756 (35.39)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="6">
                  <bold>Top 10 most common medicines</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Metformin hydrochloride, n (%)</td>
                <td colspan="2">—</td>
                <td colspan="2">2541 (32.63)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Sitagliptin phosphate hydrate, n (%)</td>
                <td colspan="2">—</td>
                <td colspan="2">2177 (27.96)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Glimepiride, n (%)</td>
                <td colspan="2">—</td>
                <td colspan="2">2036 (26.15)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Pioglitazone hydrochloride, n (%)</td>
                <td colspan="2">—</td>
                <td colspan="2">1641 (21.07)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Insulin glargine (genetical recombination), n (%)</td>
                <td colspan="2">—</td>
                <td colspan="2">1597 (20.51)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Rosuvastatin calcium, n (%)</td>
                <td colspan="2">—</td>
                <td colspan="2">1458 (18.72)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Voglibose, n (%)</td>
                <td colspan="2">—</td>
                <td colspan="2">1430 (18.36)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Atorvastatin calcium hydrate, n (%)</td>
                <td colspan="2">—</td>
                <td colspan="2">1323 (16.99)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Insulin aspart (genetical recombination), n (%)</td>
                <td colspan="2">—</td>
                <td colspan="2">1277 (16.4)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Vildagliptin, n (%)</td>
                <td colspan="2">—</td>
                <td colspan="2">1187 (15.24)</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table2fn1">
              <p><sup>a</sup>HbA<sub>1c</sub>: hemoglobin A<sub>1c</sub>.</p>
            </fn>
            <fn id="table2fn2">
              <p><sup>b</sup>Not applicable.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
      <sec>
        <title>Prediction Performance for HbA1c Time Series Lengths</title>
        <p>We assessed using different lengths of past HbA<sub>1c</sub> time series (<xref ref-type="table" rid="table3">Table 3</xref>) as both training and test inputs to the model to determine the most effective period for predicting poor glycemic control. Extending the input period beyond 1 year did not yield a statistically significant difference within a 95% CI (<xref rid="figure2" ref-type="fig">Figures 2</xref> and <xref rid="figure3" ref-type="fig">3</xref>). This study’s objectives of achieving ROC-AUC&gt;0.9 and PR-AUC&gt;0.8 were attainable with just 1 year of past HbA<sub>1c</sub> time series. Comparing prediction accuracy with LightGBM revealed no significant differences within the 95% CI, indicating nearly equivalent performance between the transformer and LightGBM. As a result, we settled on a final model that is based on using 1 year of prior data for training.</p>
        <table-wrap position="float" id="table3">
          <label>Table 3</label>
          <caption>
            <p>Test data set size for the evaluation of various hemoglobin A<sub>1c</sub> (HbA<sub>1c</sub>) time series lengths.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="140"/>
            <col width="130"/>
            <col width="170"/>
            <col width="90"/>
            <col width="110"/>
            <col width="140"/>
            <col width="220"/>
            <thead>
              <tr valign="top">
                <td>Length of past HbA<sub>1c</sub> time series</td>
                <td>Records (R), n</td>
                <td>Records with poor glycemic control (T), n</td>
                <td>T/R, %</td>
                <td>Patients, n</td>
                <td>Records per patient, mean (SD)</td>
                <td>Weekly spaced data with values in input data, mean (SD)</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>1</td>
                <td>25,564</td>
                <td>6818</td>
                <td>26.7</td>
                <td>4661</td>
                <td>5.5 (2.7)</td>
                <td>7.3 (2.7)</td>
              </tr>
              <tr valign="top">
                <td>2</td>
                <td>25,594</td>
                <td>6827</td>
                <td>26.7</td>
                <td>4672</td>
                <td>5.5 (2.7)</td>
                <td>13.2 (5.6)</td>
              </tr>
              <tr valign="top">
                <td>3</td>
                <td>25,611</td>
                <td>6831</td>
                <td>26.7</td>
                <td>4676</td>
                <td>5.5 (2.7)</td>
                <td>18.8 (8.6)</td>
              </tr>
              <tr valign="top">
                <td>4</td>
                <td>25,618</td>
                <td>6831</td>
                <td>26.7</td>
                <td>4678</td>
                <td>5.5 (2.7)</td>
                <td>24.1 (11.8)</td>
              </tr>
              <tr valign="top">
                <td>5</td>
                <td>25,621</td>
                <td>6832</td>
                <td>26.7</td>
                <td>4678</td>
                <td>5.5 (2.7)</td>
                <td>28.9 (15.1)</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
        <fig id="figure2" position="float">
          <label>Figure 2</label>
          <caption>
            <p>Predictive performance using ROC-AUC as a measure for various HbA<sub>1c</sub> time series lengths using test data reference dates in 2014. HbA<sub>1c</sub>: hemoglobin A<sub>1c</sub>; ROC-AUC: area under the receiver operating characteristic curve.</p>
          </caption>
          <graphic xlink:href="ai_v3i1e56700_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <fig id="figure3" position="float">
          <label>Figure 3</label>
          <caption>
            <p>Predictive performance using PR-AUC as a measure for various HbA1c time series lengths using test data reference dates in 2014. HbA<sub>1c</sub>: hemoglobin A<sub>1c</sub>; PR-AUC: area under the precision-recall curve.</p>
          </caption>
          <graphic xlink:href="ai_v3i1e56700_fig3.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Prediction Performance Over the Full Data Set</title>
        <p>We assessed whether the resulting model, using 1 year of prior data for training, could consistently achieve the target accuracy over the available 7 years of test data (<xref ref-type="table" rid="table4">Table 4</xref>). Despite some fluctuation in prediction accuracy, the target was achieved over the entire 7-year period (<xref rid="figure4" ref-type="fig">Figures 4</xref> and <xref rid="figure5" ref-type="fig">5</xref>). The ROC-AUC (95% confidence limits) for transformer was 0.925 (95% CI 0.923-0.928; <xref rid="figure6" ref-type="fig">Figure 6</xref>), compared to LightGBM’s 0.920 (95% CI 0.918-0.923), and the PR-AUC (95% confidence limits) for transformer was 0.864 (95% CI 0.852-0.875; <xref rid="figure7" ref-type="fig">Figure 7</xref>), compared to LightGBM’s 0.857 (95% CI 0.846-0.868). The average accuracy rate (95% confidence limits) for the transformer was 0.864 (95% CI 0.860-0.869), comparable to LightGBM’s 0.861 (95% CI 0.857-0.865).</p>
        <table-wrap position="float" id="table4">
          <label>Table 4</label>
          <caption>
            <p>Test data set size for the evaluation of various hemoglobin A<sub>1c</sub> (HbA<sub>1c</sub>) time series lengths.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="140"/>
            <col width="130"/>
            <col width="170"/>
            <col width="90"/>
            <col width="110"/>
            <col width="140"/>
            <col width="220"/>
            <thead>
              <tr valign="top">
                <td>Year of the test data</td>
                <td>Records (R), n</td>
                <td>Records with poor glycemic control (T), n</td>
                <td>T/R, %</td>
                <td>Patients, n</td>
                <td>Records per patient, mean (SD)</td>
                <td>Weekly spaced data with values in input data, mean (SD)</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>2007</td>
                <td>22,520</td>
                <td>7176</td>
                <td>31.9</td>
                <td>3221</td>
                <td>7 (3.1)</td>
                <td>8 (2.9)</td>
              </tr>
              <tr valign="top">
                <td>2008</td>
                <td>24,775</td>
                <td>7517</td>
                <td>30.3</td>
                <td>3626</td>
                <td>6.8 (3.1)</td>
                <td>8.1 (2.9)</td>
              </tr>
              <tr valign="top">
                <td>2009</td>
                <td>26,144</td>
                <td>8444</td>
                <td>32.3</td>
                <td>2973</td>
                <td>6.6 (3)</td>
                <td>8 (2.9)</td>
              </tr>
              <tr valign="top">
                <td>2010</td>
                <td>27,124</td>
                <td>8521</td>
                <td>31.4</td>
                <td>4260</td>
                <td>6.4 (3)</td>
                <td>7.8 (2.9)</td>
              </tr>
              <tr valign="top">
                <td>2011</td>
                <td>26,661</td>
                <td>7687</td>
                <td>28.8</td>
                <td>4377</td>
                <td>6.1 (3)</td>
                <td>7.7 (2.8)</td>
              </tr>
              <tr valign="top">
                <td>2012</td>
                <td>26,259</td>
                <td>6944</td>
                <td>26.4</td>
                <td>4412</td>
                <td>6 (2.9)</td>
                <td>7.5 (2.7)</td>
              </tr>
              <tr valign="top">
                <td>2013</td>
                <td>25,945</td>
                <td>7281</td>
                <td>28.1</td>
                <td>4533</td>
                <td>5.7 (2.8)</td>
                <td>7.4 (2.7)</td>
              </tr>
              <tr valign="top">
                <td>2014</td>
                <td>25,564</td>
                <td>6818</td>
                <td>26.7</td>
                <td>4661</td>
                <td>5.5 (2.7)</td>
                <td>7.3 (2.7)</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
        <fig id="figure4" position="float">
          <label>Figure 4</label>
          <caption>
            <p>Predictive performance over time using ROC-AUC as a measure using test data reference dates ranging from 2008 to 2014. ROC-AUC: area under the receiver operating characteristic curve.</p>
          </caption>
          <graphic xlink:href="ai_v3i1e56700_fig4.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <fig id="figure5" position="float">
          <label>Figure 5</label>
          <caption>
            <p>Predictive performance over time using PR-AUC as a measure using test data reference dates ranging from 2008 to 2014. PR-AUC: area under the precision-recall curve.</p>
          </caption>
          <graphic xlink:href="ai_v3i1e56700_fig5.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <fig id="figure6" position="float">
          <label>Figure 6</label>
          <caption>
            <p>Predictive performance over time using ROC curve as a measure using test data reference dates ranging from 2008 to 2014. AUC: area under the curve; FPR: false positive rate; HbA<sub>1c</sub>: hemoglobin A<sub>1c</sub>; ROC: receiver operating characteristic; TPR: true positive rate.</p>
          </caption>
          <graphic xlink:href="ai_v3i1e56700_fig6.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <fig id="figure7" position="float">
          <label>Figure 7</label>
          <caption>
            <p>Predictive performance over time using PR curve as a measure using test data reference dates ranging from 2008 to 2014. AUC: area under the curve; HbA<sub>1c</sub>: hemoglobin A<sub>1c</sub>; PR: precision-recall.</p>
          </caption>
          <graphic xlink:href="ai_v3i1e56700_fig7.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Interpretability</title>
        <p>The proposed model extracts temporal relationships from past irregularly spaced HbA<sub>1c</sub> levels using self-attention and determines the contribution of each HbA<sub>1c</sub> level to the prediction of glycemic control using cross-attention. An example of the extracted results is shown in <xref rid="figure8" ref-type="fig">Figure 8</xref>.</p>
        <p><xref rid="figure9" ref-type="fig">Figures 9</xref>-<xref rid="figure11" ref-type="fig">11</xref> plot the average values of HbA<sub>1c</sub> levels, self-attention weights, and cross-attention weights for 4 groups: true positives with transformer and true positives with LightGBM, true negatives with transformer and true negatives with LightGBM, true positives with transformer and false negatives with LightGBM, and false negatives with transformer and true positives with LightGBM. The group with true positive results in both models had an average HbA<sub>1c</sub> level of 8% or higher, whereas the group with true negative results in both models had an average HbA<sub>1c</sub> level of less than 7%. The weight of older self-attention was larger in the former group, and the weight of recent cross-attention was smaller in the latter group. The group containing true positives by transformer and false negatives with LightGBM had an average HbA<sub>1c</sub> level of around 7.5%, had a smaller recent self-attention weight than the other groups, and had a similar trend of cross-attention weights as the group of true negatives with both models. The group that was false negative with transformer and true positive with LightGBM tended for HbA<sub>1c</sub> to fall from the 8% range to the 7% range, and both recent self-attention and cross-attention were greater than other groups.</p>
        <fig id="figure8" position="float">
          <label>Figure 8</label>
          <caption>
            <p>Example of HbA<sub>1c</sub> levels, self-attention weights, and cross-attention weights. HbA<sub>1c</sub>: hemoglobin A<sub>1c</sub>.</p>
          </caption>
          <graphic xlink:href="ai_v3i1e56700_fig8.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <fig id="figure9" position="float">
          <label>Figure 9</label>
          <caption>
            <p>Average levels of HbA<sub>1c</sub> time series. HbA<sub>1c</sub>: hemoglobin A<sub>1c</sub>.</p>
          </caption>
          <graphic xlink:href="ai_v3i1e56700_fig9.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <fig id="figure10" position="float">
          <label>Figure 10</label>
          <caption>
            <p>Average weight of self-attention.</p>
          </caption>
          <graphic xlink:href="ai_v3i1e56700_fig10.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <fig id="figure11" position="float">
          <label>Figure 11</label>
          <caption>
            <p>Average weight of cross-attention.</p>
          </caption>
          <graphic xlink:href="ai_v3i1e56700_fig11.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Evaluation of the Predictive Accuracy</title>
        <p>Our results show that, despite usual care by specialist physicians, poor glycemic control was common, affecting 57.83% (4504/7787) of patients. By highlighting cases with a high likelihood of poor glycemic control despite normal treatment intensifications, the proposed model provides new information to physicians, identifying patients who may benefit from extraordinary treatment intensification.</p>
        <p>Balancing high predictive accuracy with interpretability is vital for acceptance by patients and physicians. The proposed model achieved impressive predictive accuracy, with ROC-AUC above 0.9, PR-AUC above 0.8, and an overall accuracy of 0.864. For physicians, ROC-AUC above 0.9 suggests excellent performance in distinguishing between patients who will have poor glycemic control and patients who will have good glycemic control. Similarly, PR-AUC above 0.8 indicates excellent performance in providing accurate prediction while minimizing false positives. LightGBM, a widely respected model in ML, serves as a benchmark. The proposed model slightly surpassed the performance of LightGBM, implying that the proposed model can offer physicians a reliable tool for predicting poor glycemic control.</p>
        <p>Accuracy did not increase with longer training data lengths. The model achieved accurate predictions with just 1 year of training data, suggesting that recent glycemic control plays a dominant role in prediction outcomes. However, the actual future glycemic control is influenced by factors not accounted for in the current model, such as medications, exercise, diet, and other lifestyle factors.</p>
        <p>While the proposed model demonstrated comparable predictive accuracy to LightGBM within this experiment’s scope, further improvement may be possible with extensive training data. Transformer models, known for power-law characteristics, benefit from scale-ups [<xref ref-type="bibr" rid="ref51">51</xref>], and expanding this study to multiple hospitals could explore potential performance enhancements and test the applicability of the power-law in the medical field.</p>
      </sec>
      <sec>
        <title>Interpretability</title>
        <p>The cross-attention weights were very similar for the group that was true positive in both models and the group that was true positive in transformer and false negative in LightGBM. This suggests that the proposed model consistently made predictions by capturing sufficient features, while the benchmark LightGBM might have captured extraneous features. On the other hand, when the proposed model performed worse than LightGBM, as observed in the group of false negatives with the transformer and true positives with LightGBM, it appears that the cross-attention strongly responded to the decreasing trend in HbA<sub>1c</sub>, leading to a prediction failure. These prediction failures accounted for only 0.30% (77/25,564) of cases.</p>
      </sec>
      <sec>
        <title>Limitations</title>
        <p>Our study has notable limitations. First, the data were sourced from past records at a single hospital, limiting generalizability. We have not confirmed prediction accuracy for new patients, as we used a rolling origin procedure. While we separated the data into training and testing sets based on time duration, some patients still overlap between these sets. While this approach is useful for assessing the model’s performance within the hospital where it is trained, it poses challenges when applying a model trained in one hospital to another. The intensification of treatment may depend on factors specific to individual patients, the treatment strategies of individual physicians and hospitals, guidelines, and varying treatment trends across countries. Further work is needed to verify the extent to which the model needs to be customized for different environments.</p>
        <p>Second, ML reflects majority characteristics, potentially limiting applicability to diverse patient populations. In the data set used in the experiment, as shown in <xref ref-type="table" rid="table2">Table 2</xref>, 40% of patients have 7 diseases, and patient characteristics are biased. Prediction failure analysis needs to be further scrutinized, including versus patient characteristics. We should examine this issue by comparing prediction accuracy for each patient cluster.</p>
        <p>Third, the model uses only HbA<sub>1c</sub> levels as inputs. We incorporated prescription and other laboratory tests as explanatory variables during preliminary validation, but both our proposed model and LightGBM did not show improved predictive accuracy. Future work should further explore incorporating clinical data beyond HbA<sub>1c</sub>. EHRs contain patient history represented in categorical, numeric, text, and images that are still underused. We should devise model designs based on cutting-edge multimodal modeling using the transformer [<xref ref-type="bibr" rid="ref52">52</xref>-<xref ref-type="bibr" rid="ref54">54</xref>].</p>
        <p>Fourth, the interpretability of the model expresses temporal relationships numerically, lacking readability. To enhance clarity and visualization of the information that physicians require, it is essential to solidify the user interface or user experience concepts. There is a need for further consultation with physicians to determine an interface that would effectively communicate interpretability. Additionally, to increase the interpretability of this method, an approach that combines it with traditional XAI technologies [<xref ref-type="bibr" rid="ref36">36</xref>] such as SHAP and LIME should be investigated.</p>
        <p>Fifth, this was a backward-looking study, using past data, and the essential next phase is to assess the model’s predictive capabilities in clinical practice. There is a need for a careful exploration of the model’s effectiveness in real clinical scenarios.</p>
      </sec>
      <sec>
        <title>Future Research Direction</title>
        <p>Our ultimate goal is to improve the treatment outcomes of diabetes. Merely predicting poor glycemic control alone cannot achieve this goal. By providing predictive results to physicians and reinforcing treatment, we can demonstrate the value of the predictions. Future research could focus on improving predictions by incorporating additional clinical data beyond HbA<sub>1c</sub> levels. Exploring the applicability of the model in diverse populations will help assess its generalizability and institution-specific variations. Implementing the model in clinical practice for real-time predictions, possibly through randomized controlled trials, would elucidate its impact on clinical decision-making and patient outcomes. Moreover, expanding the scope to predict the impact of treatment changes as well [<xref ref-type="bibr" rid="ref55">55</xref>] could further enhance the model’s utility in diabetes management.</p>
      </sec>
      <sec>
        <title>Conclusions</title>
        <p>The proposed model addresses the challenge of identifying patients with T2D who will have poor glycemic control, increasing the risk of complications, despite usual care by specialist physicians. The model achieves highly accurate predictions, with an accuracy of 0.864, and provides good interpretability from the irregularly spaced HbA<sub>1c</sub> values commonly observed in clinical settings. The model balances desirable predictive accuracy and interpretability in clinical practice, enhancing the acceptability of ML. Future efforts should focus on further improving accuracy and interpretability by incorporating additional features beyond HbA<sub>1c</sub> and validating large clinical data sets.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group/>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">AUC</term>
          <def>
            <p>area under the curve</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">EHR</term>
          <def>
            <p>electronic health record</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">HbA<sub>1c</sub></term>
          <def>
            <p>hemoglobin A<sub>1c</sub></p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">ML</term>
          <def>
            <p>machine learning</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">PR</term>
          <def>
            <p>precision-recall</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb6">ROC</term>
          <def>
            <p>receiver operating characteristic</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb7">T2D</term>
          <def>
            <p>type 2 diabetes</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb8">XAI</term>
          <def>
            <p>explainable artificial intelligence</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>We thank Daniel Lane, ME, MBA, for his support in paper editing and scientific discussions. We made no use of generative artificial intelligence in the development of this paper. This work was funded by The University of Tokyo and Nippon Telegraph and Telephone Corporation (NTT) in a joint research program at the University of Tokyo Center of Innovation, Sustainable Life Care, and the Ageless Society dedicated to Self-Managing Healthcare in the Aging Society of Japan. The funding source had no role in the design and conduct of this study; collection, management, analysis, and interpretation of the data; preparation, review, or approval of this paper; and decision to submit this paper for publication. The content is solely the responsibility of the authors and does not necessarily represent the official views of the University of Tokyo Center of Innovation.</p>
    </ack>
    <notes>
      <sec>
        <title>Data Availability</title>
        <p>The data in this study are not openly available because of the restrictions imposed by the research ethics committees that approved this study.</p>
      </sec>
    </notes>
    <fn-group>
      <fn fn-type="conflict">
        <p>HK, KH, AF, and EN are employees of Nippon Telegraph and Telephone Corporation (NTT), Tokyo, Japan. AC was an employee of NTT, and he is now an employee of NTT DOCOMO, Inc, Tokyo, Japan. TH was an employee of NTT, and he is now the chief executive officer of NTT-AT IPS Corporation, Kanagawa, Japan. KW received research funding from NTT and the University of Tokyo Center of Innovation, Sustainable Life Care, and the Ageless Society dedicated to Self-Managing Healthcare in the Aging Society of Japan.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <collab>GBD 2021 Diabetes Collaborators</collab>
          </person-group>
          <article-title>Global, regional, and national burden of diabetes from 1990 to 2021, with projections of prevalence to 2050: a systematic analysis for the Global Burden of Disease study 2021</article-title>
          <source>Lancet</source>
          <year>2023</year>
          <volume>402</volume>
          <issue>10397</issue>
          <fpage>203</fpage>
          <lpage>234</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://air.unimi.it/handle/2434/980231"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/S0140-6736(23)01301-6</pub-id>
          <pub-id pub-id-type="medline">37356446</pub-id>
          <pub-id pub-id-type="pii">S0140-6736(23)01301-6</pub-id>
          <pub-id pub-id-type="pmcid">PMC10364581</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>YY</given-names>
            </name>
            <name name-style="western">
              <surname>Lin</surname>
              <given-names>YJ</given-names>
            </name>
            <name name-style="western">
              <surname>Chong</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>PC</given-names>
            </name>
            <name name-style="western">
              <surname>Chao</surname>
              <given-names>TF</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>SA</given-names>
            </name>
            <name name-style="western">
              <surname>Chien</surname>
              <given-names>KL</given-names>
            </name>
          </person-group>
          <article-title>The impact of diabetes mellitus and corresponding HbA1c levels on the future risks of cardiovascular disease and mortality: a representative cohort study in Taiwan</article-title>
          <source>PLoS One</source>
          <year>2015</year>
          <volume>10</volume>
          <issue>4</issue>
          <fpage>e0123116</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dx.plos.org/10.1371/journal.pone.0123116"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pone.0123116</pub-id>
          <pub-id pub-id-type="medline">25874454</pub-id>
          <pub-id pub-id-type="pii">PONE-D-14-43104</pub-id>
          <pub-id pub-id-type="pmcid">PMC4395238</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>ElSayed</surname>
              <given-names>NA</given-names>
            </name>
            <name name-style="western">
              <surname>Aleppo</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Aroda</surname>
              <given-names>VR</given-names>
            </name>
            <name name-style="western">
              <surname>Bannuru</surname>
              <given-names>RR</given-names>
            </name>
            <name name-style="western">
              <surname>Brown</surname>
              <given-names>FM</given-names>
            </name>
            <name name-style="western">
              <surname>Bruemmer</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Collins</surname>
              <given-names>BS</given-names>
            </name>
            <name name-style="western">
              <surname>Hilliard</surname>
              <given-names>ME</given-names>
            </name>
            <name name-style="western">
              <surname>Isaacs</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Johnson</surname>
              <given-names>EL</given-names>
            </name>
            <name name-style="western">
              <surname>Kahan</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Khunti</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Leon</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Lyons</surname>
              <given-names>SK</given-names>
            </name>
            <name name-style="western">
              <surname>Perry</surname>
              <given-names>ML</given-names>
            </name>
            <name name-style="western">
              <surname>Prahalad</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Pratley</surname>
              <given-names>RE</given-names>
            </name>
            <name name-style="western">
              <surname>Seley</surname>
              <given-names>JJ</given-names>
            </name>
            <name name-style="western">
              <surname>Stanton</surname>
              <given-names>RC</given-names>
            </name>
            <name name-style="western">
              <surname>Gabbay</surname>
              <given-names>RA</given-names>
            </name>
          </person-group>
          <article-title>6. Glycemic targets: standards of care in diabetes-2023</article-title>
          <source>Diabetes Care</source>
          <year>2023</year>
          <volume>46</volume>
          <issue>Suppl 1</issue>
          <fpage>S97</fpage>
          <lpage>S110</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/36507646"/>
          </comment>
          <pub-id pub-id-type="doi">10.2337/dc23-S006</pub-id>
          <pub-id pub-id-type="medline">36507646</pub-id>
          <pub-id pub-id-type="pii">148053</pub-id>
          <pub-id pub-id-type="pmcid">PMC9810469</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Harris</surname>
              <given-names>MI</given-names>
            </name>
            <name name-style="western">
              <surname>Eastman</surname>
              <given-names>RC</given-names>
            </name>
            <name name-style="western">
              <surname>Cowie</surname>
              <given-names>CC</given-names>
            </name>
            <name name-style="western">
              <surname>Flegal</surname>
              <given-names>KM</given-names>
            </name>
            <name name-style="western">
              <surname>Eberhardt</surname>
              <given-names>MS</given-names>
            </name>
          </person-group>
          <article-title>Racial and ethnic differences in glycemic control of adults with type 2 diabetes</article-title>
          <source>Diabetes Care</source>
          <year>1999</year>
          <volume>22</volume>
          <issue>3</issue>
          <fpage>403</fpage>
          <lpage>408</lpage>
          <pub-id pub-id-type="doi">10.2337/diacare.22.3.403</pub-id>
          <pub-id pub-id-type="medline">10097918</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Goudswaard</surname>
              <given-names>AN</given-names>
            </name>
            <name name-style="western">
              <surname>Stolk</surname>
              <given-names>RP</given-names>
            </name>
            <name name-style="western">
              <surname>Zuithoff</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Rutten</surname>
              <given-names>GEHM</given-names>
            </name>
          </person-group>
          <article-title>Patient characteristics do not predict poor glycaemic control in type 2 diabetes patients treated in primary care</article-title>
          <source>Eur J Epidemiol</source>
          <year>2004</year>
          <volume>19</volume>
          <issue>6</issue>
          <fpage>541</fpage>
          <lpage>545</lpage>
          <pub-id pub-id-type="doi">10.1023/b:ejep.0000032351.42772.e7</pub-id>
          <pub-id pub-id-type="medline">15330126</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Haghighatpanah</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Nejad</surname>
              <given-names>ASM</given-names>
            </name>
            <name name-style="western">
              <surname>Haghighatpanah</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Thunga</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Mallayasamy</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Factors that correlate with poor glycemic control in type 2 diabetes mellitus patients with complications</article-title>
          <source>Osong Public Health Res Perspect</source>
          <year>2018</year>
          <volume>9</volume>
          <issue>4</issue>
          <fpage>167</fpage>
          <lpage>174</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/30159222"/>
          </comment>
          <pub-id pub-id-type="doi">10.24171/j.phrp.2018.9.4.05</pub-id>
          <pub-id pub-id-type="medline">30159222</pub-id>
          <pub-id pub-id-type="pii">ophrp-09-0167</pub-id>
          <pub-id pub-id-type="pmcid">PMC6110332</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Juarez</surname>
              <given-names>DT</given-names>
            </name>
            <name name-style="western">
              <surname>Sentell</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Tokumaru</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Goo</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Davis</surname>
              <given-names>JW</given-names>
            </name>
            <name name-style="western">
              <surname>Mau</surname>
              <given-names>MM</given-names>
            </name>
          </person-group>
          <article-title>Factors associated with poor glycemic control or wide glycemic variability among diabetes patients in Hawaii, 2006-2009</article-title>
          <source>Prev Chronic Dis</source>
          <year>2012</year>
          <volume>9</volume>
          <fpage>120065</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/23017247"/>
          </comment>
          <pub-id pub-id-type="doi">10.5888/pcd9.120065</pub-id>
          <pub-id pub-id-type="medline">23017247</pub-id>
          <pub-id pub-id-type="pii">E151</pub-id>
          <pub-id pub-id-type="pmcid">PMC3475506</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gikas</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Sotiropoulos</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Pastromas</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Papazafiropoulou</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Apostolou</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Pappas</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Seasonal variation in fasting glucose and HbA1c in patients with type 2 diabetes</article-title>
          <source>Prim Care Diabetes</source>
          <year>2009</year>
          <volume>3</volume>
          <issue>2</issue>
          <fpage>111</fpage>
          <lpage>114</lpage>
          <pub-id pub-id-type="doi">10.1016/j.pcd.2009.05.004</pub-id>
          <pub-id pub-id-type="medline">19535310</pub-id>
          <pub-id pub-id-type="pii">S1751-9918(09)00042-4</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Davies</surname>
              <given-names>MJ</given-names>
            </name>
            <name name-style="western">
              <surname>Aroda</surname>
              <given-names>VR</given-names>
            </name>
            <name name-style="western">
              <surname>Collins</surname>
              <given-names>BS</given-names>
            </name>
            <name name-style="western">
              <surname>Gabbay</surname>
              <given-names>RA</given-names>
            </name>
            <name name-style="western">
              <surname>Green</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Maruthur</surname>
              <given-names>NM</given-names>
            </name>
            <name name-style="western">
              <surname>Rosas</surname>
              <given-names>SE</given-names>
            </name>
            <name name-style="western">
              <surname>Del Prato</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Mathieu</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Mingrone</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Rossing</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Tankova</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Tsapas</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Buse</surname>
              <given-names>JB</given-names>
            </name>
          </person-group>
          <article-title>Management of hyperglycaemia in type 2 diabetes, 2022. a consensus report by the American Diabetes Association (ADA) and the European Association for the Study of Diabetes (EASD)</article-title>
          <source>Diabetologia</source>
          <year>2022</year>
          <volume>65</volume>
          <issue>12</issue>
          <fpage>1925</fpage>
          <lpage>1966</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/36151309"/>
          </comment>
          <pub-id pub-id-type="doi">10.1007/s00125-022-05787-2</pub-id>
          <pub-id pub-id-type="medline">36151309</pub-id>
          <pub-id pub-id-type="pii">10.1007/s00125-022-05787-2</pub-id>
          <pub-id pub-id-type="pmcid">PMC9510507</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="web">
          <source>Primary care physicians' practices in diabetes treatment</source>
          <access-date>2024-06-22</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jdome.jp/doc/jdome-2021-64jds.pdf">https://www.jdome.jp/doc/jdome-2021-64jds.pdf</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <collab>American Diabetes Association Professional Practice Committee</collab>
          </person-group>
          <article-title>1. Improving care and promoting health in populations: standards of care in diabetes-2024</article-title>
          <source>Diabetes Care</source>
          <year>2024</year>
          <volume>47</volume>
          <issue>Suppl 1</issue>
          <fpage>S11</fpage>
          <lpage>S19</lpage>
          <pub-id pub-id-type="doi">10.2337/dc24-S001</pub-id>
          <pub-id pub-id-type="medline">38078573</pub-id>
          <pub-id pub-id-type="pii">153937</pub-id>
          <pub-id pub-id-type="pmcid">PMC10725798</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zou</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Qu</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Luo</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Yin</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Ju</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Tang</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Predicting diabetes mellitus with machine learning techniques</article-title>
          <source>Front Genet</source>
          <year>2018</year>
          <volume>9</volume>
          <fpage>515</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/30459809"/>
          </comment>
          <pub-id pub-id-type="doi">10.3389/fgene.2018.00515</pub-id>
          <pub-id pub-id-type="medline">30459809</pub-id>
          <pub-id pub-id-type="pmcid">PMC6232260</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Dagliati</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Marini</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Sacchi</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Cogni</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Teliti</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Tibollo</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>de Cata</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Chiovato</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Bellazzi</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Machine learning methods to predict diabetes complications</article-title>
          <source>J Diabetes Sci Technol</source>
          <year>2018</year>
          <volume>12</volume>
          <issue>2</issue>
          <fpage>295</fpage>
          <lpage>302</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/28494618"/>
          </comment>
          <pub-id pub-id-type="doi">10.1177/1932296817706375</pub-id>
          <pub-id pub-id-type="medline">28494618</pub-id>
          <pub-id pub-id-type="pmcid">PMC5851210</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Islam</surname>
              <given-names>MS</given-names>
            </name>
            <name name-style="western">
              <surname>Qaraqe</surname>
              <given-names>MK</given-names>
            </name>
            <name name-style="western">
              <surname>Belhaouari</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Petrovski</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Long term HbA1c prediction using multi-stage CGM data analysis</article-title>
          <source>IEEE Sens J</source>
          <year>2021</year>
          <volume>21</volume>
          <issue>13</issue>
          <fpage>15237</fpage>
          <lpage>15247</lpage>
          <pub-id pub-id-type="doi">10.1109/JSEN.2021.3073974</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Vincent</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Larochelle</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Bengio</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Manzagol</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Extracting and composing robust features with denoising autoencoders</article-title>
          <year>2008</year>
          <conf-name>Proceedings of the 25th international conference on Machine learning (ICML '08)</conf-name>
          <conf-date>2008</conf-date>
          <conf-loc>Canada</conf-loc>
          <publisher-name>Association for Computing Machinery</publisher-name>
          <fpage>1096</fpage>
          <lpage>1103</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Jawed</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Grabocka</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Schmidt-Thieme</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Self-supervised learning for semi-supervised time series classification</article-title>
          <year>2020</year>
          <conf-name>Advances in Knowledge Discovery and Data Mining (PAKDD 2020)</conf-name>
          <conf-date>May 11, 2020</conf-date>
          <conf-loc>Asia</conf-loc>
          <publisher-name>Springer</publisher-name>
          <fpage>12084</fpage>
          <pub-id pub-id-type="doi">10.1007/978-3-030-47426-3_39</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tipirneni</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Reddy</surname>
              <given-names>CK</given-names>
            </name>
          </person-group>
          <article-title>Self-supervised transformer for sparse and irregularly sampled multivariate clinical time-series</article-title>
          <source>ACM Trans Knowl Discov Data</source>
          <year>2022</year>
          <volume>16</volume>
          <issue>6</issue>
          <fpage>1</fpage>
          <lpage>17</lpage>
          <pub-id pub-id-type="doi">10.1145/3516367</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chang</surname>
              <given-names>BY</given-names>
            </name>
            <name name-style="western">
              <surname>Naiel</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>Wardell</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Kleinikkink</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Zelek</surname>
              <given-names>JS</given-names>
            </name>
          </person-group>
          <article-title>Time-series causality with missing data</article-title>
          <source>J Comp Vis Imag Sys</source>
          <year>2021</year>
          <volume>6</volume>
          <issue>1</issue>
          <fpage>1</fpage>
          <lpage>4</lpage>
          <pub-id pub-id-type="doi">10.15353/jcvis.v6i1.3552</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Theissler</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Spinnato</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Schlegel</surname>
              <given-names>U</given-names>
            </name>
            <name name-style="western">
              <surname>Guidotti</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Explainable AI for time series classification: a review, taxonomy and research directions</article-title>
          <year>2022</year>
          <conf-name>IEEE Access</conf-name>
          <conf-date>September 19, 2022</conf-date>
          <conf-loc>Australia</conf-loc>
          <publisher-name>IEEE</publisher-name>
          <fpage>100700</fpage>
          <lpage>100724</lpage>
          <pub-id pub-id-type="doi">10.1109/access.2022.3207765</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Maassen</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Fritsch</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Palm</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Deffge</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Kunze</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Marx</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Riedel</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Schuppert</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Bickenbach</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Future medical artificial intelligence application requirements and expectations of physicians in German university hospitals: web-based survey</article-title>
          <source>J Med Internet Res</source>
          <year>2021</year>
          <volume>23</volume>
          <issue>3</issue>
          <fpage>e26646</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2021/3/e26646/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/26646</pub-id>
          <pub-id pub-id-type="medline">33666563</pub-id>
          <pub-id pub-id-type="pii">v23i3e26646</pub-id>
          <pub-id pub-id-type="pmcid">PMC7980122</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Diprose</surname>
              <given-names>WK</given-names>
            </name>
            <name name-style="western">
              <surname>Buist</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Hua</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Thurier</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Shand</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Robinson</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Physician understanding, explainability, and trust in a hypothetical machine learning risk calculator</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2020</year>
          <volume>27</volume>
          <issue>4</issue>
          <fpage>592</fpage>
          <lpage>600</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/32106285"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/jamia/ocz229</pub-id>
          <pub-id pub-id-type="medline">32106285</pub-id>
          <pub-id pub-id-type="pii">5762808</pub-id>
          <pub-id pub-id-type="pmcid">PMC7647292</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kodera</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Ninomiya</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Sawano</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Katsushika</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Shinohara</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Akazawa</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Komuro</surname>
              <given-names>I</given-names>
            </name>
          </person-group>
          <article-title>Patient awareness survey on medical AI</article-title>
          <year>2022</year>
          <conf-name>The 36th Annual Conference of the Japanese Society for Artificial Intelligence</conf-name>
          <conf-date>June 14, 2022</conf-date>
          <conf-loc>Kyoto, Japan</conf-loc>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ossa</surname>
              <given-names>LA</given-names>
            </name>
            <name name-style="western">
              <surname>Starke</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Lorenzini</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Vogt</surname>
              <given-names>JE</given-names>
            </name>
            <name name-style="western">
              <surname>Shaw</surname>
              <given-names>DM</given-names>
            </name>
            <name name-style="western">
              <surname>Elger</surname>
              <given-names>BS</given-names>
            </name>
          </person-group>
          <article-title>Re-focusing explainability in medicine</article-title>
          <source>Digit Health</source>
          <year>2022</year>
          <volume>8</volume>
          <fpage>20552076221074488</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://journals.sagepub.com/doi/10.1177/20552076221074488?url_ver=Z39.88-2003&amp;rfr_id=ori:rid:crossref.org&amp;rfr_dat=cr_pub  0pubmed"/>
          </comment>
          <pub-id pub-id-type="doi">10.1177/20552076221074488</pub-id>
          <pub-id pub-id-type="medline">35173981</pub-id>
          <pub-id pub-id-type="pii">10.1177_20552076221074488</pub-id>
          <pub-id pub-id-type="pmcid">PMC8841907</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Allam</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Feuerriegel</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Rebhan</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Krauthammer</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Analyzing patient trajectories with artificial intelligence</article-title>
          <source>J Med Internet Res</source>
          <year>2021</year>
          <volume>23</volume>
          <issue>12</issue>
          <fpage>e29812</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2021/12/e29812/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/29812</pub-id>
          <pub-id pub-id-type="medline">34870606</pub-id>
          <pub-id pub-id-type="pii">v23i12e29812</pub-id>
          <pub-id pub-id-type="pmcid">PMC8686456</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Richens</surname>
              <given-names>JG</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>CM</given-names>
            </name>
            <name name-style="western">
              <surname>Johri</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Improving the accuracy of medical diagnosis with causal machine learning</article-title>
          <source>Nat Commun</source>
          <year>2020</year>
          <volume>11</volume>
          <issue>1</issue>
          <fpage>3923</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/s41467-020-17419-7"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41467-020-17419-7</pub-id>
          <pub-id pub-id-type="medline">32782264</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41467-020-17419-7</pub-id>
          <pub-id pub-id-type="pmcid">PMC7419549</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rojat</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Puget</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Filliat</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Del</surname>
              <given-names>SJ</given-names>
            </name>
            <name name-style="western">
              <surname>Gelin</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Díaz-Rodríguez</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>Explainable artificial intelligence (XAI) on TimeSeries data: a survey</article-title>
          <source>arXiv</source>
          <comment>Preprint posted online on April 2, 2021</comment>
          <pub-id pub-id-type="doi">10.48550/arXiv.2104.00950</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bommasani</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Hudson</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Adeli</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>On the opportunities and risks of foundation models</article-title>
          <source>arXiv</source>
          <comment>Preprint posted online on August 16, 2021</comment>
          <pub-id pub-id-type="doi">10.48550/arXiv.2108.07258</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lin</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Qiu</surname>
              <given-names>X</given-names>
            </name>
          </person-group>
          <article-title>A survey of transformers</article-title>
          <source>AI Open</source>
          <year>2022</year>
          <volume>3</volume>
          <fpage>111</fpage>
          <lpage>132</lpage>
          <pub-id pub-id-type="doi">10.1016/j.aiopen.2022.10.001</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lakew</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Cettolo</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Federico</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>A comparison of transformer and recurrent neural networks on multilingual neural machine translation</article-title>
          <year>2018</year>
          <conf-name>Proceedings of the 27th International Conference on Computational Linguistics</conf-name>
          <conf-date>2018</conf-date>
          <conf-loc>Barcelona, Spain (Online)</conf-loc>
          <fpage>641</fpage>
          <lpage>652</lpage>
          <pub-id pub-id-type="doi">10.18653/v1/2020.coling-tutorials.3</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lu</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Comparison of the potential between transformer and CNN in image classification</article-title>
          <year>2021</year>
          <conf-name>ICMLCA 2021; 2nd International Conference on Machine Learning and Computer Application</conf-name>
          <conf-date>December 17, 2021</conf-date>
          <conf-loc>Shenyang, China</conf-loc>
          <fpage>1</fpage>
          <lpage>6</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zerveas</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Jayaraman</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Patel</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Bhamidipaty</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Eickhoff</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>A transformer-based framework for multivariate time series representation learning</article-title>
          <year>2021</year>
          <conf-name>Proceedings of the 27th ACM SIGKDD Conference on Knowledge Discovery &amp; Data Mining (KDD '21)</conf-name>
          <conf-date>August 14, 2021</conf-date>
          <conf-loc>New York</conf-loc>
          <fpage>2114</fpage>
          <lpage>2124</lpage>
          <pub-id pub-id-type="doi">10.1145/3447548.3467401</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Peng</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Xiong</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>W</given-names>
            </name>
          </person-group>
          <article-title>Informer: beyond efficient transformer for long sequence time-series forecasting</article-title>
          <year>2021</year>
          <conf-name>Proceedings of the AAAI Conference on Artificial Intelligence</conf-name>
          <conf-date>February 20, 2024</conf-date>
          <conf-loc>USA</conf-loc>
          <fpage>11106</fpage>
          <lpage>11115</lpage>
          <pub-id pub-id-type="doi">10.1609/aaai.v35i12.17325</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Vaswani</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Shazeer</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Parmar</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Uszkoreit</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Jones</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Gomez</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Kaiser</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Polosukhin</surname>
              <given-names>I</given-names>
            </name>
          </person-group>
          <article-title>Attention is all you need</article-title>
          <source>Adv Neural Inf Process Syst</source>
          <year>2017</year>
          <volume>30</volume>
          <pub-id pub-id-type="doi">10.48550/arXiv.1706.03762</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref34">
        <label>34</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Vig</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Belinkov</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Analyzing the structure of attention in a transformer language model</article-title>
          <year>2019</year>
          <conf-name>Proceedings of the 2019 ACL Workshop BlackboxNLP: Analyzing and Interpreting Neural Networks for NLP</conf-name>
          <conf-date>2019</conf-date>
          <conf-loc>Florence, Italy</conf-loc>
          <fpage>63</fpage>
          <lpage>76</lpage>
          <pub-id pub-id-type="doi">10.18653/v1/w19-4808</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref35">
        <label>35</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Voita</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Talbot</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Moiseev</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Sennrich</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Titov</surname>
              <given-names>I</given-names>
            </name>
          </person-group>
          <article-title>Analyzing multi-head self-attention: specialized heads do the heavy lifting, the rest can be pruned</article-title>
          <year>2019</year>
          <conf-name>Proceedings of the 57th Annual Meeting of the Association for Computational Linguistics</conf-name>
          <conf-date>2019</conf-date>
          <conf-loc>Florence, Italy</conf-loc>
          <fpage>5797</fpage>
          <lpage>5808</lpage>
          <pub-id pub-id-type="doi">10.18653/v1/p19-1580</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref36">
        <label>36</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chaddad</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Peng</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Bouridane</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Survey of explainable AI techniques in healthcare</article-title>
          <source>Sensors (Basel)</source>
          <year>2023</year>
          <volume>23</volume>
          <issue>2</issue>
          <fpage>634</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.mdpi.com/resolver?pii=s23020634"/>
          </comment>
          <pub-id pub-id-type="doi">10.3390/s23020634</pub-id>
          <pub-id pub-id-type="medline">36679430</pub-id>
          <pub-id pub-id-type="pii">s23020634</pub-id>
          <pub-id pub-id-type="pmcid">PMC9862413</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref37">
        <label>37</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hosmer</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Lemeshow</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <source>Applied Logistic Regression</source>
          <year>2000</year>
          <publisher-loc>New York</publisher-loc>
          <publisher-name>John Wiley and Sons</publisher-name>
          <fpage>160</fpage>
          <lpage>164</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref38">
        <label>38</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lv</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Luo</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Guo</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Bai</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Yan</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Jiang</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Jing</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Identifying diagnostic indicators for type 2 diabetes mellitus from physical examination using interpretable machine learning approach</article-title>
          <source>Front Endocrinol (Lausanne)</source>
          <year>2024</year>
          <volume>15</volume>
          <fpage>1376220</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.3389/fendo.2024.1376220"/>
          </comment>
          <pub-id pub-id-type="doi">10.3389/fendo.2024.1376220</pub-id>
          <pub-id pub-id-type="medline">38562414</pub-id>
          <pub-id pub-id-type="pmcid">PMC10982324</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref39">
        <label>39</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Uchitachimoto</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Sukegawa</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Kojima</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Kagawa</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Oyama</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Okada</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Imakura</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Sakurai</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>Data collaboration analysis in predicting diabetes from a small amount of health checkup data</article-title>
          <source>Sci Rep</source>
          <year>2023</year>
          <volume>13</volume>
          <issue>1</issue>
          <fpage>11820</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/s41598-023-38932-x"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41598-023-38932-x</pub-id>
          <pub-id pub-id-type="medline">37479701</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41598-023-38932-x</pub-id>
          <pub-id pub-id-type="pmcid">PMC10361975</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref40">
        <label>40</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Choi</surname>
              <given-names>SG</given-names>
            </name>
            <name name-style="western">
              <surname>Oh</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Park</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Jee</surname>
              <given-names>SH</given-names>
            </name>
            <name name-style="western">
              <surname>Jeon</surname>
              <given-names>JY</given-names>
            </name>
          </person-group>
          <article-title>Comparisons of the prediction models for undiagnosed diabetes between machine learning versus traditional statistical methods</article-title>
          <source>Sci Rep</source>
          <year>2023</year>
          <volume>13</volume>
          <issue>1</issue>
          <fpage>13101</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/s41598-023-40170-0"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41598-023-40170-0</pub-id>
          <pub-id pub-id-type="medline">37567907</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41598-023-40170-0</pub-id>
          <pub-id pub-id-type="pmcid">PMC10421881</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref41">
        <label>41</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Agliata</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Giordano</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Bardozzo</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Bottiglieri</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Facchiano</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Tagliaferri</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Machine learning as a support for the diagnosis of type 2 diabetes</article-title>
          <source>Int J Mol Sci</source>
          <year>2023</year>
          <volume>24</volume>
          <issue>7</issue>
          <fpage>6775</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.mdpi.com/resolver?pii=ijms24076775"/>
          </comment>
          <pub-id pub-id-type="doi">10.3390/ijms24076775</pub-id>
          <pub-id pub-id-type="medline">37047748</pub-id>
          <pub-id pub-id-type="pii">ijms24076775</pub-id>
          <pub-id pub-id-type="pmcid">PMC10095542</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref42">
        <label>42</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Dutta</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Hasan</surname>
              <given-names>MK</given-names>
            </name>
            <name name-style="western">
              <surname>Ahmad</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Awal</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>Islam</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>Masud</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Meshref</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Early prediction of diabetes using an ensemble of machine learning models</article-title>
          <source>Int J Environ Res Public Health</source>
          <year>2022</year>
          <volume>19</volume>
          <issue>19</issue>
          <fpage>12378</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.mdpi.com/resolver?pii=ijerph191912378"/>
          </comment>
          <pub-id pub-id-type="doi">10.3390/ijerph191912378</pub-id>
          <pub-id pub-id-type="medline">36231678</pub-id>
          <pub-id pub-id-type="pii">ijerph191912378</pub-id>
          <pub-id pub-id-type="pmcid">PMC9566114</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref43">
        <label>43</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Waki</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Fujita</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Uchimura</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Omae</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Aramaki</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Kato</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Kobayashi</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Kadowaki</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Ohe</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>DialBetics: a novel smartphone-based self-management support system for type 2 diabetes patients</article-title>
          <source>J Diabetes Sci Technol</source>
          <year>2014</year>
          <volume>8</volume>
          <issue>2</issue>
          <fpage>209</fpage>
          <lpage>215</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/24876569"/>
          </comment>
          <pub-id pub-id-type="doi">10.1177/1932296814526495</pub-id>
          <pub-id pub-id-type="medline">24876569</pub-id>
          <pub-id pub-id-type="pii">1932296814526495</pub-id>
          <pub-id pub-id-type="pmcid">PMC4455411</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref44">
        <label>44</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kurasawa</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Hayashi</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Fujino</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Takasugi</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Haga</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Waki</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Noguchi</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Ohe</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Machine-learning-based prediction of a missed scheduled clinical appointment by patients with diabetes</article-title>
          <source>J Diabetes Sci Technol</source>
          <year>2016</year>
          <volume>10</volume>
          <issue>3</issue>
          <fpage>730</fpage>
          <lpage>736</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/26555782"/>
          </comment>
          <pub-id pub-id-type="doi">10.1177/1932296815614866</pub-id>
          <pub-id pub-id-type="medline">26555782</pub-id>
          <pub-id pub-id-type="pii">1932296815614866</pub-id>
          <pub-id pub-id-type="pmcid">PMC5038527</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref45">
        <label>45</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kurasawa</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Waki</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Chiba</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Seki</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Hayashi</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Fujino</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Haga</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Noguchi</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Ohe</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Treatment discontinuation prediction in patients with diabetes using a ranking model: machine learning model development</article-title>
          <source>JMIR Bioinform Biotech</source>
          <year>2022</year>
          <volume>3</volume>
          <issue>1</issue>
          <fpage>e37951</fpage>
          <pub-id pub-id-type="doi">10.2196/37951</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref46">
        <label>46</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kazijevs</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Samad</surname>
              <given-names>MD</given-names>
            </name>
          </person-group>
          <article-title>Deep imputation of missing values in time series health data: a review with benchmarking</article-title>
          <source>J Biomed Inform</source>
          <year>2023</year>
          <volume>144</volume>
          <fpage>104440</fpage>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2023.104440</pub-id>
          <pub-id pub-id-type="medline">37429511</pub-id>
          <pub-id pub-id-type="pii">S1532-0464(23)00161-2</pub-id>
          <pub-id pub-id-type="pmcid">PMC10529422</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref47">
        <label>47</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tashman</surname>
              <given-names>LJ</given-names>
            </name>
          </person-group>
          <article-title>Out-of-sample tests of forecasting accuracy: an analysis and review</article-title>
          <source>Int J Forecast</source>
          <year>2000</year>
          <volume>16</volume>
          <issue>4</issue>
          <fpage>437</fpage>
          <lpage>450</lpage>
          <pub-id pub-id-type="doi">10.1016/s0169-2070(00)00065-0</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref48">
        <label>48</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Seto</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Oyama</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Kitora</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Toki</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Yamamoto</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Kotoku</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Haga</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Shinzawa</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Yamakawa</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Fukui</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Moriyama</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>Author correction: gradient boosting decision tree becomes more reliable than logistic regression in predicting probability for diabetes with big data</article-title>
          <source>Sci Rep</source>
          <year>2022</year>
          <volume>12</volume>
          <issue>1</issue>
          <fpage>22599</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/s41598-022-27052-7"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41598-022-27052-7</pub-id>
          <pub-id pub-id-type="medline">36585468</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41598-022-27052-7</pub-id>
          <pub-id pub-id-type="pmcid">PMC9803642</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref49">
        <label>49</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rufo</surname>
              <given-names>DD</given-names>
            </name>
            <name name-style="western">
              <surname>Debelee</surname>
              <given-names>TG</given-names>
            </name>
            <name name-style="western">
              <surname>Ibenthal</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Negera</surname>
              <given-names>WG</given-names>
            </name>
          </person-group>
          <article-title>Diagnosis of diabetes mellitus using gradient boosting machine (LightGBM)</article-title>
          <source>Diagnostics (Basel)</source>
          <year>2021</year>
          <volume>11</volume>
          <issue>9</issue>
          <fpage>1714</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.mdpi.com/resolver?pii=diagnostics11091714"/>
          </comment>
          <pub-id pub-id-type="doi">10.3390/diagnostics11091714</pub-id>
          <pub-id pub-id-type="medline">34574055</pub-id>
          <pub-id pub-id-type="pii">diagnostics11091714</pub-id>
          <pub-id pub-id-type="pmcid">PMC8467876</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref50">
        <label>50</label>
        <nlm-citation citation-type="web">
          <source>Information about the current study</source>
          <access-date>2023-01-03</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.h.u-tokyo.ac.jp/patient/depts/taisha/pdf/pa_md_md_info-04.pdf">https://www.h.u-tokyo.ac.jp/patient/depts/taisha/pdf/pa_md_md_info-04.pdf</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref51">
        <label>51</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Henighan</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Kaplan</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Katz</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Scaling laws for autoregressive generative modeling</article-title>
          <source>arXiv</source>
          <comment>Preprint posted online on October 28, 2020</comment>
          <pub-id pub-id-type="doi">10.48550/arXiv.2001.08361</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref52">
        <label>52</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Mitra</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Berlowitz</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Yu</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>TransformEHR: transformer-based encoder-decoder generative model to enhance prediction of disease outcomes using electronic health records</article-title>
          <source>Nat Commun</source>
          <year>2023</year>
          <volume>14</volume>
          <issue>1</issue>
          <fpage>7857</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/s41467-023-43715-z"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41467-023-43715-z</pub-id>
          <pub-id pub-id-type="medline">38030638</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41467-023-43715-z</pub-id>
          <pub-id pub-id-type="pmcid">PMC10687211</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref53">
        <label>53</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Li</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Rao</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Solares</surname>
              <given-names>JRA</given-names>
            </name>
            <name name-style="western">
              <surname>Hassaine</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Ramakrishnan</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Canoy</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Zhu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Rahimi</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Salimi-Khorshidi</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>BEHRT: transformer for electronic health records</article-title>
          <source>Sci Rep</source>
          <year>2020</year>
          <volume>10</volume>
          <issue>1</issue>
          <fpage>7155</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/s41598-020-62922-y"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41598-020-62922-y</pub-id>
          <pub-id pub-id-type="medline">32346050</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41598-020-62922-y</pub-id>
          <pub-id pub-id-type="pmcid">PMC7189231</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref54">
        <label>54</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kraljevic</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Bean</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Shek</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Bendayan</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Hemingway</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Yeung</surname>
              <given-names>JA</given-names>
            </name>
            <name name-style="western">
              <surname>Deng</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Baston</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Ross</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Idowu</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Teo</surname>
              <given-names>JT</given-names>
            </name>
            <name name-style="western">
              <surname>Dobson</surname>
              <given-names>RJB</given-names>
            </name>
          </person-group>
          <article-title>Foresight-a generative pretrained transformer for modelling of patient timelines using electronic health records: a retrospective modelling study</article-title>
          <source>Lancet Digit Health</source>
          <year>2024</year>
          <volume>6</volume>
          <issue>4</issue>
          <fpage>e281</fpage>
          <lpage>e290</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S2589-7500(24)00025-6"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/S2589-7500(24)00025-6</pub-id>
          <pub-id pub-id-type="medline">38519155</pub-id>
          <pub-id pub-id-type="pii">S2589-7500(24)00025-6</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref55">
        <label>55</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Feuerriegel</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Frauen</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Melnychuk</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Schweisthal</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Hess</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Curth</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Bauer</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Kilbertus</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Kohane</surname>
              <given-names>IS</given-names>
            </name>
            <name name-style="western">
              <surname>van der Schaar</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Causal machine learning for predicting treatment outcomes</article-title>
          <source>Nat Med</source>
          <year>2024</year>
          <volume>30</volume>
          <issue>4</issue>
          <fpage>958</fpage>
          <lpage>968</lpage>
          <pub-id pub-id-type="doi">10.1038/s41591-024-02902-1</pub-id>
          <pub-id pub-id-type="medline">38641741</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41591-024-02902-1</pub-id>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
