<?xml version="1.0" encoding="UTF-8"?><!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "journalpublishing.dtd"><article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" dtd-version="2.0" xml:lang="en" article-type="research-article"><front><journal-meta><journal-id journal-id-type="nlm-ta">JMIR Med Inform</journal-id><journal-id journal-id-type="publisher-id">medinform</journal-id><journal-id journal-id-type="index">7</journal-id><journal-title>JMIR Medical Informatics</journal-title><abbrev-journal-title>JMIR Med Inform</abbrev-journal-title><issn pub-type="epub">2291-9694</issn><publisher><publisher-name>JMIR Publications</publisher-name><publisher-loc>Toronto, Canada</publisher-loc></publisher></journal-meta><article-meta><article-id pub-id-type="publisher-id">v13i1e67748</article-id><article-id pub-id-type="doi">10.2196/67748</article-id><article-categories><subj-group subj-group-type="heading"><subject>Original Paper</subject></subj-group></article-categories><title-group><article-title>Enhancing Antidiabetic Drug Selection Using Transformers: Machine-Learning Model Development</article-title></title-group><contrib-group><contrib contrib-type="author" equal-contrib="yes"><name name-style="western"><surname>Kurasawa</surname><given-names>Hisashi</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff1">1</xref><xref ref-type="aff" rid="aff2">2</xref><xref ref-type="fn" rid="equal-contrib1">*</xref></contrib><contrib contrib-type="author" corresp="yes" equal-contrib="yes"><name name-style="western"><surname>Waki</surname><given-names>Kayo</given-names></name><degrees>MD, MPH, PhD</degrees><xref ref-type="aff" rid="aff1">1</xref><xref ref-type="fn" rid="equal-contrib1">*</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Seki</surname><given-names>Tomohisa</given-names></name><degrees>MD, PhD</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Nakahara</surname><given-names>Eri</given-names></name><degrees>MS</degrees><xref ref-type="aff" rid="aff1">1</xref><xref ref-type="aff" rid="aff2">2</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Fujino</surname><given-names>Akinori</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff2">2</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Shiomi</surname><given-names>Nagisa</given-names></name><degrees>MS</degrees><xref ref-type="aff" rid="aff2">2</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Nakashima</surname><given-names>Hiroshi</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff2">2</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Ohe</surname><given-names>Kazuhiko</given-names></name><degrees>MD, PhD</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib></contrib-group><aff id="aff1"><institution>The University of Tokyo Hospital</institution><addr-line>7-3-1 Hongo, Bunkyo-ku</addr-line><addr-line>Tokyo</addr-line><country>Japan</country></aff><aff id="aff2"><institution>Nippon Telegraph and Telephone Corporation</institution><country>Japan</country></aff><contrib-group><contrib contrib-type="editor"><name name-style="western"><surname>Coristine</surname><given-names>Andrew</given-names></name></contrib></contrib-group><contrib-group><contrib contrib-type="reviewer"><name name-style="western"><surname>Victor</surname><given-names>Audencio</given-names></name></contrib><contrib contrib-type="reviewer"><name name-style="western"><surname>Mahali</surname><given-names>Lakshmi Priyanka</given-names></name></contrib></contrib-group><author-notes><corresp>Correspondence to Kayo Waki, MD, MPH, PhD, The University of Tokyo Hospital, 7-3-1 Hongo, Bunkyo-ku, Tokyo, Japan, 81 3-5800-6427; <email>kwaki-tky@m.u-tokyo.ac.jp</email></corresp><fn fn-type="equal" id="equal-contrib1"><label>*</label><p>these authors contributed equally</p></fn></author-notes><pub-date pub-type="collection"><year>2025</year></pub-date><pub-date pub-type="epub"><day>2</day><month>6</month><year>2025</year></pub-date><volume>13</volume><elocation-id>e67748</elocation-id><history><date date-type="received"><day>20</day><month>10</month><year>2024</year></date><date date-type="rev-recd"><day>21</day><month>04</month><year>2025</year></date><date date-type="accepted"><day>21</day><month>04</month><year>2025</year></date></history><copyright-statement>&#x00A9; Hisashi Kurasawa, Kayo Waki, Tomohisa Seki, Eri Nakahara, Akinori Fujino, Nagisa Shiomi, Hiroshi Nakashima, Kazuhiko Ohe. Originally published in JMIR Medical Informatics (<ext-link ext-link-type="uri" xlink:href="https://medinform.jmir.org">https://medinform.jmir.org</ext-link>), 2.6.2025. </copyright-statement><copyright-year>2025</copyright-year><license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (<ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">https://creativecommons.org/licenses/by/4.0/</ext-link>), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Medical Informatics, is properly cited. The complete bibliographic information, a link to the original publication on <ext-link ext-link-type="uri" xlink:href="https://medinform.jmir.org/">https://medinform.jmir.org/</ext-link>, as well as this copyright and license information must be included.</p></license><self-uri xlink:type="simple" xlink:href="https://medinform.jmir.org/2025/1/e67748"/><abstract><sec><title>Background</title><p>Diabetes affects millions worldwide. Primary care physicians provide a significant portion of care, and they often struggle with selecting appropriate medications.</p></sec><sec><title>Objective</title><p>This study aimed to develop a model that accurately predicts what drug an endocrinologist would prescribe based on the current measurements. The goal was to create a system that would assist nonspecialists in choosing medications, thereby potentially improving diabetes treatment outcomes. Based on the performance of previous studies, we set a performance target of achieving a receiver operating characteristic area under the curve (ROC-AUC) above 0.95.</p></sec><sec sec-type="methods"><title>Methods</title><p>A transformer-based encoder-decoder model predicts whether 44 types of diabetes drugs will be prescribed. The model uses sequences of age, sex, history for 12 laboratory tests, and prescribed drug history as inputs. We assessed the model using the electronic health records from 7034 patients with diabetes seeing endocrinologists between 2012 and 2022 at the University of Tokyo Hospital. We assessed model performance trained on data subsets spanning different time periods (2, 5, and 10 years) using micro- and macro-averaged ROC-AUC on a hold-out test set comprising data solely from 2022. The model&#x2019;s performance was compared against LightGBM.</p></sec><sec sec-type="results"><title>Results</title><p>The model trained on data from the past 5 years (2017&#x2010;2021) yielded the best predictive performance, achieving a microaverage (95% CI) ROC-AUC of 0.993 (0.992-0.994) and a macroaverage (95% CI) ROC-AUC of 0.988 (0.980-0.993). The model achieved an ROC-AUC above 0.95 for 43 out of 44 drugs. These results surpassed the predefined performance target and outperformed both previous studies and the LightGBM model&#x2019;s microaverage ROC-AUC of 0.988 (0.985-0.990) in terms of prediction accuracy. Furthermore, training the model with short-term data from the past 5 years yielded high accuracy compared to using data from the past 10 years, suggesting that learning from more recent prescribing patterns might be advantageous.</p></sec><sec sec-type="conclusions"><title>Conclusions</title><p>The proposed model demonstrates the feasibility of accurately predicting the next prescribed drugs. This model, trained from the past prescriptions of endocrinologists, has the potential to provide information that can assist nonspecialists in making diabetes-treatment decisions. Future studies will focus on incorporating important factors such as prescription contraindications and constraints to enhance safety, as well as leveraging large-scale clinical data across multiple hospitals to improve the generalizability of the model.</p></sec></abstract><kwd-group><kwd>AI</kwd><kwd>diabetes</kwd><kwd>drug selection</kwd><kwd>machine learning</kwd><kwd>transformer</kwd><kwd>artificial intelligence</kwd></kwd-group></article-meta></front><body><sec id="s1" sec-type="intro"><title>Introduction</title><p>Diabetes affects 529 million people worldwide, with 1 in every 10 adults experiencing the condition [<xref ref-type="bibr" rid="ref1">1</xref>]. Patients with diabetes receive care from primary care physicians, not endocrinologists, in many areas including the United States, Europe [<xref ref-type="bibr" rid="ref2">2</xref>], and Japan [<xref ref-type="bibr" rid="ref3">3</xref>]. This is particularly concerning in the United States, where the endocrinologist shortage is significant: the population-to-endocrinologist ratio within 20 miles was 29,887:1 for adults aged 18&#x2010;64. Rural areas face even greater disparities, with only 55.5% of adults having access to at least 1 endocrinologist within that distance [<xref ref-type="bibr" rid="ref4">4</xref>]. Japan also faces a similar problem. Japan has 11 million patients with diabetes but only about 7000 specialists, and two-thirds of people with type 2 diabetes (T2D) receive care from primary care physicians [<xref ref-type="bibr" rid="ref3">3</xref>]. These nonspecialists may struggle to predict a patient&#x2019;s glycemic control. Approximately 60% of surveyed patients with T2D treated by nonspecialists experienced poor glycemic control (hemoglobin A<sub>1c</sub> [HbA<sub>1c</sub>] &#x2265;8%), with around 30% seeing worsened levels the following year, according to a survey on T2D treatment practices by primary care physicians [<xref ref-type="bibr" rid="ref3">3</xref>].</p><p>One of the difficulties in diabetes treatment for primary care physicians is drug selection [<xref ref-type="bibr" rid="ref5">5</xref>,<xref ref-type="bibr" rid="ref6">6</xref>]. Medications are prescribed either as monotherapy or in combination. Medications need to be chosen [<xref ref-type="bibr" rid="ref7">7</xref>] considering insulin secretion and insulin resistance [<xref ref-type="bibr" rid="ref8">8</xref>], age [<xref ref-type="bibr" rid="ref9">9</xref>,<xref ref-type="bibr" rid="ref10">10</xref>], degree of obesity [<xref ref-type="bibr" rid="ref11">11</xref>], severity of chronic complications [<xref ref-type="bibr" rid="ref12">12</xref>], liver function, and kidney function [<xref ref-type="bibr" rid="ref13">13</xref>]. New diabetes treatments continue to be developed, expanding the options for medication selection. For example, in Japan, sodium&#x2013;glucose cotransporter 2 [<xref ref-type="bibr" rid="ref14">14</xref>], imeglimin [<xref ref-type="bibr" rid="ref15">15</xref>], and tirzepatide [<xref ref-type="bibr" rid="ref16">16</xref>] were introduced in 2014, 2021, and 2023, respectively. The selection of diabetes medications depends on individual patient factors, with guidelines [<xref ref-type="bibr" rid="ref17">17</xref>] and treatment tendencies [<xref ref-type="bibr" rid="ref18">18</xref>] that vary from country to country. A tool supporting drug selection could enhance treatment outcomes. It could provide early warning to physicians and potentially improve treatment outcomes for patients who are being examined by nonspecialized physicians.</p><p>Clinical decision support systems (CDSS) provide physicians with safety tools for drug selection [<xref ref-type="bibr" rid="ref19">19</xref>]. By adopting a knowledge-based approach aligned with clinical guidelines, CDSS help to prevent medication errors such as overdosing, incomplete, or unclear orders [<xref ref-type="bibr" rid="ref20">20</xref>,<xref ref-type="bibr" rid="ref21">21</xref>]. However, replicating the ability of endocrinologists to select drugs for individual patient conditions in a CDSS is complex and challenging for knowledge-based approaches.</p><p>Machine learning (ML) has demonstrated success in predicting patient symptoms, including forecasting the onset of T2D [<xref ref-type="bibr" rid="ref22">22</xref>] and predicting complications [<xref ref-type="bibr" rid="ref23">23</xref>]. Several studies have applied ML to the problem of drug selection for patients with diabetes [<xref ref-type="bibr" rid="ref24">24</xref>]. A study predicting the next prescribed diabetes drugs for 161,497 patients with diabetes using sequential pattern mining demonstrated an accuracy of 89.1%&#x2010;90.5% in guessing from 37 drug classes (eg, DPP-4 inhibitor) and 63.5%&#x2010;64.9% accuracy in guessing from 43 drugs (eg, algliptin) [<xref ref-type="bibr" rid="ref25">25</xref>]. Another study predicted 7 drug classes with an ROC-AUC of 90.6%&#x2010;94.3% using recurrent neural networks (RNN) [<xref ref-type="bibr" rid="ref26">26</xref>]. There are also proposed methods for predicting treatment outcomes after selecting diabetes medications [<xref ref-type="bibr" rid="ref27">27</xref>].</p><p>The field of ML has undergone significant advancement since the introduction of the transformer approach in 2017 [<xref ref-type="bibr" rid="ref28">28</xref>,<xref ref-type="bibr" rid="ref29">29</xref>]. Transformers enable contextual interactions for natural language processing tasks and have become a core technology across diverse domains [<xref ref-type="bibr" rid="ref30">30</xref>-<xref ref-type="bibr" rid="ref32">32</xref>]. The transformer model incorporates an attention mechanism and has shown remarkable performance in tasks involving the extraction of temporal and semantic relationships, leading to success in tasks such as generation and classification [<xref ref-type="bibr" rid="ref33">33</xref>]. Generally, transformers enhance predictive performance through two types of training: pretraining via self-supervised learning and fine-tuning via supervised learning. For example, large language models like GPT and bidirectional encoder representations from transformers (BERT) were pretrained on a task predicting the next or masked word and then fine-tuned on a task generating responses to an instruction [<xref ref-type="bibr" rid="ref34">34</xref>]. Several studies in health care have already used this scheme of 2 types of learning. TransformEHR improved performance on the fine-tuned task of predicting the onset of pancreatic cancer and intentional self-harm among patients with posttraumatic stress disorder by pretraining on the task of predicting randomly-masked diseases and outcomes in time series of 6.5 million patients [<xref ref-type="bibr" rid="ref35">35</xref>]. A deep neural sequence transduction model for electronic health records (BEHRT) [<xref ref-type="bibr" rid="ref36">36</xref>] was pretrained using an electronic health records (EHR) dataset of 1.6 million patients and was fine-tuned to predict diagnosis codes. Recent transformers have also made advancements in learning by combining different modalities of information such as images, audio, and text. Foresight [<xref ref-type="bibr" rid="ref37">37</xref>] was trained with structured data such as laboratory results as well as unstructured data such as free text from 1.5 million patients across three EHR datasets. The transformer approach has not previously been applied to the task of selecting diabetes medications. In addition, while efforts have been made to train models with large amounts of data to improve accuracy [<xref ref-type="bibr" rid="ref38">38</xref>], the impact of the training data period on predictions is largely unexplored.</p><p>Diabetes drug selection involves deciding to prescribe one or more drugs from among many candidates. This selection can be handled by ML as a multichoice task. This study aimed to develop an ML tool that accurately predicts the next prescribed drugs using the patient&#x2019;s medical condition and prescription history over the past year. The objective is to enhance diabetes treatment outcomes for nonspecialists through improved support in drug selection (<xref ref-type="fig" rid="figure1">Figure 1</xref>). Based on the performance of previous studies [<xref ref-type="bibr" rid="ref24">24</xref>-<xref ref-type="bibr" rid="ref26">26</xref>], our goal was to achieve an ROC-AUC above 0.95 when predicting the next prescribed drugs. Drawing on our team&#x2019;s previous work in self-management support for T2D treatment [<xref ref-type="bibr" rid="ref39">39</xref>] and predicting treatment discontinuations [<xref ref-type="bibr" rid="ref40">40</xref>,<xref ref-type="bibr" rid="ref41">41</xref>], we designed this task with the hope of overcoming barriers to nonspecialist diabetes treatment in clinical practice, believing it could significantly improve diabetes treatment outcomes.</p><fig position="float" id="figure1"><label>Figure 1.</label><caption><p>System image of prescription drug selection assistant.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="medinform_v13i1e67748_fig01.png"/></fig></sec><sec id="s2" sec-type="methods"><title>Methods</title><sec id="s2-1"><title>Datasets</title><p>All data were collected from the EHRs at the University of Tokyo Hospital, which included 7034 patients who visited the hospital, had diagnostic codes, and were registered to the Japan diabetes comprehensive database project based on an advanced electronic medical record system (J-DREAMS) cohort [<xref ref-type="bibr" rid="ref42">42</xref>]. The data were recorded in the EHRs between January 1, 2011 and December 31, 2022. The data, including treatment decisions and outcomes, were reflective of care by endocrinologists. Variables extracted from the EHRs included sex, age, 12 kinds of diabetes-related laboratory tests, and drugs. The laboratory tests included numerical values of HbA<sub>1c</sub>, glucose, triacylglycerol, high density lipoprotein cholesterol, total cholesterol [<xref ref-type="bibr" rid="ref43">43</xref>], urinary albumin creatinine ratio, creatinine [<xref ref-type="bibr" rid="ref44">44</xref>], alanine transaminase, aspartate transaminase, and &#x03B3;-glutamyltransferase [<xref ref-type="bibr" rid="ref45">45</xref>], and categorical values of proteins [<xref ref-type="bibr" rid="ref45">45</xref>] and glycogen. Drugs were identified using the list of drug price standards [<xref ref-type="bibr" rid="ref46">46</xref>] provided by the Ministry of Health, Labour and Welfare of Japan, and 44 types prescribed in 2021 were selected.</p></sec><sec id="s2-2"><title>Training and Test Data</title><p>The records used for training were not used for testing to ensure that the same patients were not included in both groups. A total of 80% (5627/7034) of patients were included in the training group, and the remaining 20% (1407/7034) of patients were included in the testing group.</p><p>In order to examine the size of the training data needed to achieve the target prediction accuracy, we extracted three different subsets of training data from the sequences of the 5627 patients in the training group: 2 years from 2020 to 2021 (3013 patients and their 25484 subsequences), 5 years from 2017 to 2021 (4009 patients and their 78,020 subsequences), and 10 years from 2012 to 2021 (4524 patients and their 168,595 subsequences). For testing, we further identified a subset of the testing data that was solely data from 2022 (637 patients and their 2988 subsequences). Thus, there was no overlap in patients or time periods between training and testing. <xref ref-type="table" rid="table1">Table 1</xref> shows the characteristics of the patients. The drugs in the table are the top 5 and bottom 5 in terms of number of prescriptions in the 2-year training data. All characteristics are provided in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>.</p><table-wrap id="t1" position="float"><label>Table 1.</label><caption><p>Characteristics of patients with diabetes included in the training and testing datasets. Characteristics are presented separately for the patient groups belonging to the different training datasets defined by period: 2 years (2020-2021), 5 years (2017-2021), 10 years (2012-2021) and the independent test dataset (data exclusively from 2022).</p></caption><table id="table1" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom"/><td align="left" valign="bottom" colspan="2">2 years of training data</td><td align="left" valign="bottom" colspan="2">5 years of training data</td><td align="left" valign="bottom" colspan="2">10 years of training data</td><td align="left" valign="bottom" colspan="2">1 year of test data</td></tr><tr><td align="left" valign="top">&#x2003;</td><td align="left" valign="top">Records (n=25484)</td><td align="left" valign="top">Patient (n=3013)</td><td align="left" valign="top">Records (n=78020)</td><td align="left" valign="top">Patient (n=4009)</td><td align="left" valign="top">Records (n=168595)</td><td align="left" valign="top">Patient (n=4524)</td><td align="left" valign="top">Records (n=2988)</td><td align="left" valign="top">Patient (n=637)</td></tr></thead><tbody><tr><td align="left" valign="top" colspan="9">Sex</td></tr><tr><td align="left" valign="top">&#x2003;Male, n (%)</td><td align="left" valign="top">16224 (63.66)</td><td align="left" valign="top">1915 (63.56)</td><td align="left" valign="top">49348 (63.25)</td><td align="left" valign="top">2543 (63.43)</td><td align="left" valign="top">106782 (63.34)</td><td align="left" valign="top">2869 (63.42)</td><td align="left" valign="top">1793 (60.01)</td><td align="left" valign="top">381 (59.81)</td></tr><tr><td align="left" valign="top">&#x2003;Female, n (%)</td><td align="left" valign="top">9260 (36.34)</td><td align="left" valign="top">1098 (36.44)</td><td align="left" valign="top">28672 (36.75)</td><td align="left" valign="top">1466 (36.57)</td><td align="left" valign="top">61813 (36.66)</td><td align="left" valign="top">1655 (36.58)</td><td align="left" valign="top">1195 (39.99)</td><td align="left" valign="top">256 (40.19)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Age, mean (SD)</td><td align="left" valign="top">67.62 (12.59)</td><td align="left" valign="top">69.06 (12.50)</td><td align="left" valign="top">67.25 (12.56)</td><td align="left" valign="top">69.17 (12.87)</td><td align="left" valign="top">66.41 (12.30)</td><td align="left" valign="top">68.98 (13.10)</td><td align="left" valign="top">68.80 (12.31)</td><td align="left" valign="top">69.68 (12.26)</td></tr><tr><td align="left" valign="top" colspan="9">HbA1c<sup><xref ref-type="table-fn" rid="table1fn1">a</xref></sup></td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Mean (SD)</td><td align="left" valign="top">7.37 (1.08)</td><td align="left" valign="top">&#x2014;<sup><xref ref-type="table-fn" rid="table1fn2">b</xref></sup></td><td align="left" valign="top">7.31 (1.06)</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">7.25 (1.03)</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">7.31 (1.02)</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>&#x003C;6, n (%)</td><td align="left" valign="top">920 (3.61)</td><td align="left" valign="top">323 (10.72)</td><td align="left" valign="top">3046 (3.90)</td><td align="left" valign="top">754 (18.81)</td><td align="left" valign="top">7286 (4.32)</td><td align="left" valign="top">1345 (29.73)</td><td align="left" valign="top">96 (3.21)</td><td align="left" valign="top">49 (7.69)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>6&#x2010;7, n (%)</td><td align="left" valign="top">8874 (34.82)</td><td align="left" valign="top">1865 (61.90)</td><td align="left" valign="top">29030 (37.21)</td><td align="left" valign="top">3027 (75.51)</td><td align="left" valign="top">66470 (39.43)</td><td align="left" valign="top">3835 (84.77)</td><td align="left" valign="top">1113 (37.25)</td><td align="left" valign="top">370 (58.08)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>7&#x2010;8, n (%)</td><td align="left" valign="top">10177 (39.93)</td><td align="left" valign="top">2135 (70.86)</td><td align="left" valign="top">30493 (39.08)</td><td align="left" valign="top">3157 (78.75)</td><td align="left" valign="top">64355 (38.17)</td><td align="left" valign="top">3830 (84.66)</td><td align="left" valign="top">1189 (39.79)</td><td align="left" valign="top">404 (63.42)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>&#x2265;8, n (%)</td><td align="left" valign="top">5513 (21.63)</td><td align="left" valign="top">1224 (40.62)</td><td align="left" valign="top">15451 (19.80)</td><td align="left" valign="top">2008 (50.09)</td><td align="left" valign="top">30484 (18.08)</td><td align="left" valign="top">2725 (60.23)</td><td align="left" valign="top">590 (19.75)</td><td align="left" valign="top">200 (31.40)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>missing, n (%)</td><td align="left" valign="top">0 (0.00)</td><td align="left" valign="top">0 (0.00)</td><td align="left" valign="top">0 (0.00)</td><td align="left" valign="top">0 (0.00)</td><td align="left" valign="top">0 (0.00)</td><td align="left" valign="top">0 (0.00)</td><td align="left" valign="top">0 (0.00)</td><td align="left" valign="top">0 (0.00)</td></tr><tr><td align="left" valign="top" colspan="9">HDL-C<sup><xref ref-type="table-fn" rid="table1fn3">c</xref></sup></td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Mean (SD)</td><td align="left" valign="top">60.99 (18.23)</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">60.07 (17.94)</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">59.81 (17.80)</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">63.76 (19.79)</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>&#x003C;40, n (%)</td><td align="left" valign="top">1943 (7.62)</td><td align="left" valign="top">512 (16.99)</td><td align="left" valign="top">6633 (8.50)</td><td align="left" valign="top">964 (24.05)</td><td align="left" valign="top">14694 (8.72)</td><td align="left" valign="top">1374 (30.37)</td><td align="left" valign="top">158 (5.29)</td><td align="left" valign="top">67 (10.52)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>40&#x2010;120, n (%)</td><td align="left" valign="top">21304 (83.60)</td><td align="left" valign="top">2737 (90.84)</td><td align="left" valign="top">63249 (81.07)</td><td align="left" valign="top">3644 (90.90)</td><td align="left" valign="top">134924 (80.03)</td><td align="left" valign="top">4195 (92.73)</td><td align="left" valign="top">2564 (85.81)</td><td align="left" valign="top">577 (90.58)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>&#x2265;120, n (%)</td><td align="left" valign="top">195 (0.77)</td><td align="left" valign="top">59 (1.96)</td><td align="left" valign="top">494 (0.63)</td><td align="left" valign="top">100 (2.49)</td><td align="left" valign="top">966 (0.57)</td><td align="left" valign="top">137 (3.03)</td><td align="left" valign="top">44 (1.47)</td><td align="left" valign="top">11 (1.73)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>missing, n (%)</td><td align="left" valign="top">2042 (8.01)</td><td align="left" valign="top">178 (5.91)</td><td align="left" valign="top">7644 (9.80)</td><td align="left" valign="top">243 (6.06)</td><td align="left" valign="top">18011 (10.68)</td><td align="left" valign="top">219 (4.84)</td><td align="left" valign="top">222 (7.43)</td><td align="left" valign="top">40 (6.28)</td></tr><tr><td align="left" valign="top" colspan="9">Cre<sup><xref ref-type="table-fn" rid="table1fn4">d</xref></sup></td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Mean (SD)</td><td align="left" valign="top">0.97 (0.69)</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">0.96 (0.75)</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">0.95 (0.72)</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">1.04 (1.08)</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top" colspan="9">Male</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Mean (SD)</td><td align="left" valign="top">1.08 (0.71)</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">1.07 (0.74)</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">1.05 (0.74)</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">1.18 (1.23)</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>&#x003C;0.65, n (%)</td><td align="left" valign="top">758 (2.97)</td><td align="left" valign="top">191 (6.34)</td><td align="left" valign="top">2675 (3.43)</td><td align="left" valign="top">405 (10.10)</td><td align="left" valign="top">5783 (3.43)</td><td align="left" valign="top">566 (12.51)</td><td align="left" valign="top">111 (3.71)</td><td align="left" valign="top">37 (5.81)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>0.65&#x2010;1.09, n (%)</td><td align="left" valign="top">10672 (41.88)</td><td align="left" valign="top">1482 (49.19)</td><td align="left" valign="top">32766 (42.00)</td><td align="left" valign="top">2057 (51.31)</td><td align="left" valign="top">71870 (42.63)</td><td align="left" valign="top">2456 (54.29)</td><td align="left" valign="top">1145 (38.32)</td><td align="left" valign="top">290 (45.53)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>&#x2265;1.09, n (%)</td><td align="left" valign="top">4543 (17.83)</td><td align="left" valign="top">750 (24.89)</td><td align="left" valign="top">13140 (16.84)</td><td align="left" valign="top">1093 (27.26)</td><td align="left" valign="top">27001 (16.02)</td><td align="left" valign="top">1337 (29.55)</td><td align="left" valign="top">516 (17.27)</td><td align="left" valign="top">129 (20.25)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>missing, n (%)</td><td align="left" valign="top">251 (0.98)</td><td align="left" valign="top">6 (0.20)</td><td align="left" valign="top">767 (0.98)</td><td align="left" valign="top">5 (0.12)</td><td align="left" valign="top">2128 (1.26)</td><td align="left" valign="top">7 (0.15)</td><td align="left" valign="top">21 (0.70)</td><td align="left" valign="top">1 (0.16)</td></tr><tr><td align="left" valign="top" colspan="9">Female</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Mean (SD)</td><td align="left" valign="top">0.78 (0.60)</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">0.78 (0.72)</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">0.77 (0.65)</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">0.82 (0.74)</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>&#x003C;0.46, n (%)</td><td align="left" valign="top">357 (1.40)</td><td align="left" valign="top">89 (2.95)</td><td align="left" valign="top">1160 (1.49)</td><td align="left" valign="top">175 (4.37)</td><td align="left" valign="top">2616 (1.55)</td><td align="left" valign="top">282 (6.23)</td><td align="left" valign="top">28 (0.94)</td><td align="left" valign="top">11 (1.73)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>0.46&#x2010;0.82, n (%)</td><td align="left" valign="top">6596 (25.88)</td><td align="left" valign="top">895 (29.70)</td><td align="left" valign="top">20561 (26.35)</td><td align="left" valign="top">1224 (30.53)</td><td align="left" valign="top">44130 (26.18)</td><td align="left" valign="top">1428 (31.56)</td><td align="left" valign="top">825 (27.61)</td><td align="left" valign="top">194 (30.46)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>&#x2265;0.82, n (%)</td><td align="left" valign="top">2133 (8.37)</td><td align="left" valign="top">372 (12.35)</td><td align="left" valign="top">6370 (8.16)</td><td align="left" valign="top">596 (14.87)</td><td align="left" valign="top">13572 (8.05)</td><td align="left" valign="top">730 (16.14)</td><td align="left" valign="top">326 (10.91)</td><td align="left" valign="top">93 (14.60)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>missing, n (%)</td><td align="left" valign="top">174 (0.68)</td><td align="left" valign="top">11 (0.37)</td><td align="left" valign="top">581 (0.74)</td><td align="left" valign="top">11 (0.27)</td><td align="left" valign="top">1495 (0.89)</td><td align="left" valign="top">16 (0.35)</td><td align="left" valign="top">16 (0.54)</td><td align="left" valign="top">2 (0.31)</td></tr><tr><td align="left" valign="top" colspan="9">Glu<sup><xref ref-type="table-fn" rid="table1fn5">e</xref></sup></td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Mean (SD)</td><td align="left" valign="top">147.68 (51.19)</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">147.00 (51.31)</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">144.12 (50.77)</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">145.47 (48.67)</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>&#x003C;70, n (%)</td><td align="left" valign="top">302 (1.19)</td><td align="left" valign="top">169 (5.61)</td><td align="left" valign="top">979 (1.25)</td><td align="left" valign="top">403 (10.05)</td><td align="left" valign="top">2709 (1.61)</td><td align="left" valign="top">743 (16.42)</td><td align="left" valign="top">28 (0.94)</td><td align="left" valign="top">22 (3.45)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>70&#x2010;110, n (%)</td><td align="left" valign="top">4230 (16.60)</td><td align="left" valign="top">1389 (46.10)</td><td align="left" valign="top">13604 (17.44)</td><td align="left" valign="top">2483 (61.94)</td><td align="left" valign="top">33633 (19.95)</td><td align="left" valign="top">3403 (75.22)</td><td align="left" valign="top">555 (18.57)</td><td align="left" valign="top">260 (40.82)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>&#x2265;110, n (%)</td><td align="left" valign="top">20863 (81.87)</td><td align="left" valign="top">2924 (97.05)</td><td align="left" valign="top">63201 (81.01)</td><td align="left" valign="top">3907 (97.46)</td><td align="left" valign="top">131586 (78.05)</td><td align="left" valign="top">4418 (97.66)</td><td align="left" valign="top">2394 (80.12)</td><td align="left" valign="top">609 (95.60)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>missing, n (%)</td><td align="left" valign="top">89 (0.35)</td><td align="left" valign="top">7 (0.23)</td><td align="left" valign="top">236 (0.30)</td><td align="left" valign="top">5 (0.12)</td><td align="left" valign="top">667 (0.40)</td><td align="left" valign="top">6 (0.13)</td><td align="left" valign="top">11 (0.37)</td><td align="left" valign="top">2 (0.31)</td></tr><tr><td align="left" valign="top" colspan="9">Prescribed drug (top 5)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Metformin hydrochloride, n (%)</td><td align="left" valign="top">11257 (44.17)</td><td align="left" valign="top">1390 (46.13)</td><td align="left" valign="top">33442 (42.86)</td><td align="left" valign="top">1952 (48.69)</td><td align="left" valign="top">72337 (42.91)</td><td align="left" valign="top">2376 (52.52)</td><td align="left" valign="top">1361 (45.55)</td><td align="left" valign="top">297 (46.62)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Sitagliptin phosphate hydrate, n (%)</td><td align="left" valign="top">4963 (19.47)</td><td align="left" valign="top">693 (23.00)</td><td align="left" valign="top">15420 (19.76)</td><td align="left" valign="top">1148 (28.64)</td><td align="left" valign="top">37438 (22.21)</td><td align="left" valign="top">1808 (39.96)</td><td align="left" valign="top">425 (14.22)</td><td align="left" valign="top">101 (15.86)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Insulin aspart (genetical recombination), n (%)</td><td align="left" valign="top">3212 (12.60)</td><td align="left" valign="top">377 (12.51)</td><td align="left" valign="top">10039 (12.87)</td><td align="left" valign="top">603 (15.04)</td><td align="left" valign="top">20149 (11.95)</td><td align="left" valign="top">833 (18.41)</td><td align="left" valign="top">403 (13.49)</td><td align="left" valign="top">85 (13.34)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Glimepiride, n (%)</td><td align="left" valign="top">2885 (11.32)</td><td align="left" valign="top">398 (13.21)</td><td align="left" valign="top">10387 (13.31)</td><td align="left" valign="top">690 (17.21)</td><td align="left" valign="top">28855 (17.11)</td><td align="left" valign="top">1141 (25.22)</td><td align="left" valign="top">358 (11.98)</td><td align="left" valign="top">76 (11.93)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Pioglitazone hydrochloride, n (%)</td><td align="left" valign="top">2731 (10.72)</td><td align="left" valign="top">354 (11.75)</td><td align="left" valign="top">9450 (12.11)</td><td align="left" valign="top">592 (14.77)</td><td align="left" valign="top">24305 (14.42)</td><td align="left" valign="top">910 (20.11)</td><td align="left" valign="top">244 (8.17)</td><td align="left" valign="top">53 (8.32)</td></tr><tr><td align="left" valign="top" colspan="9">Prescribed drug (buttom 5)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Saxagliptin hydrate, n (%)</td><td align="left" valign="top">158 (0.62)</td><td align="left" valign="top">17 (0.56)</td><td align="left" valign="top">586 (0.75)</td><td align="left" valign="top">41 (1.02)</td><td align="left" valign="top">960 (0.57)</td><td align="left" valign="top">52 (1.15)</td><td align="left" valign="top">30 (1.00)</td><td align="left" valign="top">6 (0.94)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Anagliptin, n (%)</td><td align="left" valign="top">142 (0.56)</td><td align="left" valign="top">17 (0.56)</td><td align="left" valign="top">528 (0.68)</td><td align="left" valign="top">34 (0.85)</td><td align="left" valign="top">986 (0.58)</td><td align="left" valign="top">51 (1.13)</td><td align="left" valign="top">5 (0.17)</td><td align="left" valign="top">1 (0.16)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Insulin lispro (genetical recombination) [Insulin lispro Biosimilar 1], n (%)</td><td align="left" valign="top">59 (0.23)</td><td align="left" valign="top">19 (0.63)</td><td align="left" valign="top">59 (0.08)</td><td align="left" valign="top">19 (0.47)</td><td align="left" valign="top">59 (0.03)</td><td align="left" valign="top">19 (0.42)</td><td align="left" valign="top">58 (1.94)</td><td align="left" valign="top">13 (2.04)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Insulin glargine (genetical recombination) [Insulin glargin biosimilar 2], n (%)</td><td align="left" valign="top">39 (0.15)</td><td align="left" valign="top">9 (0.30)</td><td align="left" valign="top">86 (0.11)</td><td align="left" valign="top">14 (0.35)</td><td align="left" valign="top">86 (0.05)</td><td align="left" valign="top">14 (0.31)</td><td align="left" valign="top">1 (0.03)</td><td align="left" valign="top">1 (0.16)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Glibenclamide, n (%)</td><td align="left" valign="top">33 (0.13)</td><td align="left" valign="top">5 (0.17)</td><td align="left" valign="top">280 (0.36)</td><td align="left" valign="top">24 (0.60)</td><td align="left" valign="top">1722 (1.02)</td><td align="left" valign="top">87 (1.92)</td><td align="left" valign="top">11 (0.37)</td><td align="left" valign="top">3 (0.47)</td></tr></tbody></table><table-wrap-foot><fn id="table1fn1"><p><sup>a</sup>HbA<sub>1c</sub>: hemoglobin A<sub>1c</sub>.</p></fn><fn id="table1fn2"><p><sup>b</sup>not applicable.</p></fn><fn id="table1fn3"><p><sup>c</sup>HDL-C: high density lipoprotein cholesterol.</p></fn><fn id="table1fn4"><p><sup>d</sup>Cre: creatinine..</p></fn><fn id="table1fn5"><p><sup>e</sup>Glu: glucose.</p></fn></table-wrap-foot></table-wrap></sec><sec id="s2-3"><title>ML Models</title><p>Patients&#x2019; medical conditions and prescription histories are in general irregularly spaced, reflecting variability in patient care appointment dates, with updates to outpatient EHR occurring before and after clinical visits. We organized the data into Monday-to-Sunday weeks and quantized the data to a single value per week, using the average in the case of multiple measurements and treating weeks with no values as having missing values [<xref ref-type="bibr" rid="ref47">47</xref>]. This approach allowed the ML model to treat irregularly spaced data spanning Y (a natural number) years as regularly spaced data consisting of (Y&#x00D7;365)&#x2044;7 (rounded up to the nearest integer) values, that is we treated all data as weekly data. We did not perform preprocessing, including interpolation, on missing values in the regularly spaced data. No normalization, outlier removal, or dimensionality reduction was performed.</p><p>We designed a transformer-based encoder-decoder model (<xref ref-type="fig" rid="figure2">Figure 2</xref>) that takes as input a time series of drugs prescribed and laboratory tests over the past 1 year, sex, and age. The model approaches drug selection as a multichoice task. With N types of drugs, there are 2^N potential prescription combinations. By setting the number of units in the output layer of the transformer decoder to N, we implemented N binary classifications. The model outputs a set of scores representing the probability of each drug being prescribed on that day and, for each drug and day, a binary prescription decision based on whether the prescription probability is greater than or equal to 0.5.</p><fig position="float" id="figure2"><label>Figure 2.</label><caption><p>Architecture of the transformer-based encoder-decoder model for predicting the next-prescribed diabetes medications. EHRs: electronic health records.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="medinform_v13i1e67748_fig02.png"/></fig><p>We treated age and HbA<sub>1c</sub> values as numerical data, sex as a categorical label, and prescription history as a set of categorical labels. In addition, a time series representing the presence or absence of missing data, called an attention mask, was simultaneously generated. Each data type was transformed into a uniform-dimensional vector using an embedding layer specific to that data type, which was then handled by the transformer model. Time information was converted to a uniform-dimensional vector using a positional embedding layer with a periodic function and added to the output value of the embedding layers.</p><p>The model incorporates two types of attention layers: self-attention in the encoder, designed to extract relationships in time and meaning from the time series of drugs prescribed and laboratory tests, and cross-attention in the decoder, used to predict the next prescribed drugs based on these relationships. Times in the time series that contain missing data are ignored in the self-attention and mutual attention calculation process using the attention mask. This makes it easy to handle without additional processing for missing data completion. The self-attention weights were optimized through self-supervised learning. This involves the task of predicting both the next laboratory test values and drugs prescribed using a time series of past laboratory tests and drugs prescribed. The cross-attention weights were optimized through supervised learning involving the task of predicting a set of scores representing the probability of each drug being prescribed on that day.</p><p>The model consisted of four transformer-encoder layers including four multihead self-attention blocks and four transformer-decoder layers including four multihead cross-attention blocks, along with a hidden layer of dimension 256. Compared to the text data handled by the language model, the prescription drug selection data has a smaller vocabulary (number of drug types) and a shorter time series, so these hyperparameters were set to about one-third the size of the BERT model [<xref ref-type="bibr" rid="ref34">34</xref>]. The parameters were optimized by Adam with a learning rate of 1e-4, a batch size of 256, and 100 epochs. The loss functions for numerical and categorical data were mean squared error and focal loss [<xref ref-type="bibr" rid="ref48">48</xref>], respectively. All implementations were written in Python 3.11 (Python Software Foundation) and PyTorch 2.2 (Meta AI).</p><p>The model was trained using prescription records from endocrinologists at the University of Tokyo Hospital. As a result, the model generates outputs aligned with the treatment approaches of these specialists.</p></sec><sec id="s2-4"><title>Statistical Methods</title><p>We analyzed the characteristics of patients in the dataset using means, SD, and frequency counts. We calculated 95% CI using the bootstrap method where applicable. We performed all statistical analyses using custom Python code.</p><p>We compared our model with an established ML method recognized for high accuracy. There were validations on similar T2D prediction tasks favored LightGBM [<xref ref-type="bibr" rid="ref49">49</xref>,<xref ref-type="bibr" rid="ref50">50</xref>], making it our chosen reference for comparisons. We compared the predictive accuracy of the two methods with the three different training dataset for the prescription prediction of 44 drugs using both macro- and microaverages [<xref ref-type="bibr" rid="ref51">51</xref>] of the receiver operating characteristic area under the curve (ROC-AUC) as metrics. The macroaverage is a measure of the average performance across all classes independently. The method computes the metrics of ROC-AUC for each individual drug, then averages them to obtain an overall score. This analysis method gives equal weight to each drug, regardless of its size or imbalance in the dataset. On the other hand, the microaverage is a measure of the aggregate performance that weights all instances in the dataset equally. This analysis method first aggregates the true positives, false positives, true negatives, and false negatives across all drugs, and then computes each metric using these aggregated values. The microaverage treats every prediction equally, without considering the kinds of drugs.</p><p>The predictive performance of each drug was also evaluated using ROC-AUC.</p></sec><sec id="s2-5"><title>Ethical Considerations</title><p>This study was approved by the institutional review board of the University of Tokyo School of Medicine (approval number: 10705-(4)) and was conducted in accordance with the Declaration of Helsinki. This was a retrospective, noninterventional database study without patient involvement. Confidentiality was safeguarded by the University of Tokyo Hospital. According to the Guidelines for Epidemiological Studies of the Ministry of Health, Labour and Welfare of Japan, written informed consent was not required. Information about the current study was available to patients on a website, and patients have the right to cease registration of their data at any time [<xref ref-type="bibr" rid="ref52">52</xref>].</p></sec></sec><sec id="s3" sec-type="results"><title>Results</title><sec id="s3-1"><title>Prediction Performance for Various Sizes of Training Data</title><p>We assessed different sizes of training data (<xref ref-type="table" rid="table2">Table 2</xref>). The best prediction performance was obtained from training with the 5 years of data from 2017 to 2021. This version achieved a microaverage (95% CI) ROC-AUC of 0.993 (0.992-0.994) and a macroaverage (95% CI) ROC-AUC of 0.988 (0.980-0.993), and we selected it as our model. Performance was similar when trained using the full range of 10 years of data, from 2012 to 2021, producing somewhat worse results. For all sizes of training data, we met the study&#x2019;s objectives of achieving an ROC-AUC above 0.95 from our macro- and microaverage evaluations. The prediction accuracy of LightGBM with the 5 years of data had a microaverage ROC AUC of 0.988 (0.985-0.990), and the transformer outperformed LightGBM.</p><table-wrap id="t2" position="float"><label>Table 2.</label><caption><p>Overall prediction performance of models for the next-prescribed diabetes drugs, stratified by the training data period. This table compares the overall accuracy of the developed transformer model against a LightGBM model.</p></caption><table id="table2" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom"/><td align="left" valign="bottom" colspan="2">Transformer</td><td align="left" valign="bottom" colspan="2">LightGBM</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Microaverage (95% CI)</td><td align="left" valign="top">Macroaverage (95% CI)</td><td align="left" valign="top">Microaverage (95% CI)</td><td align="left" valign="top">Macroaverage (95% CI)</td></tr></thead><tbody><tr><td align="left" valign="top">2 years of training data</td><td align="left" valign="top">0.991 (0.990-0.992)</td><td align="left" valign="top">0.981 (0.975-0.988)</td><td align="left" valign="top">0.987 (0.984-0.989)</td><td align="left" valign="top">0.970 (0.941-0.992)</td></tr><tr><td align="left" valign="top">5 years of training data</td><td align="left" valign="top">0.993 (0.992-0.994)</td><td align="left" valign="top">0.988 (0.980-0.993)</td><td align="left" valign="top">0.988 (0.985-0.990)</td><td align="left" valign="top">0.962 (0.916-0.993)</td></tr><tr><td align="left" valign="top">10 years of training data</td><td align="left" valign="top">0.992 (0.990-0.993)</td><td align="left" valign="top">0.987 (0.976-0.994)</td><td align="left" valign="top">0.984 (0.981-0.986)</td><td align="left" valign="top">0.959 (0.921-0.987)</td></tr></tbody></table></table-wrap></sec><sec id="s3-2"><title>Prediction Performance for Each Drug</title><p>We examined the prediction performance for each of the 44 drugs (<xref ref-type="table" rid="table3">Table 3</xref>). The drugs in the table are the top 5 and bottom 5 in terms of the number of prescriptions in the 2 years of training data. All results are provided in the supplemental file (<xref ref-type="supplementary-material" rid="app2">Multimedia Appendix 2</xref>). We achieved an ROC-AUC above our target of 0.95 for 43 of the 44 drugs when trained with the 5 years of data.</p><table-wrap id="t3" position="float"><label>Table 3.</label><caption><p>Prediction performance for drugs when trained with various sizes of training data. The table shows results for the top 5 and bottom 5 most frequently prescribed drugs, showing a comparison of performance between specific drugs and the impact of the data period of the training data on the prediction accuracy of individual drugs.</p></caption><table id="table3" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom"/><td align="left" valign="bottom">Number of prescriptions in 1 year of test data, n (%)</td><td align="left" valign="bottom" colspan="2">Number of prescriptions in 2 years of training data</td><td align="left" valign="bottom" colspan="2">Number of prescriptions in 5 years of training data</td><td align="left" valign="bottom" colspan="2">Number of prescriptions in 10 years of training data</td></tr><tr><td align="left" valign="top">&#x2003;</td><td align="left" valign="top">&#x2003;</td><td align="left" valign="top">ROC-AUC (95% CI)</td><td align="left" valign="top">Accuracy (95% CI)</td><td align="left" valign="top">ROC-AUC (95% CI)</td><td align="left" valign="top">Accuracy (95% CI)</td><td align="left" valign="top">ROC-AUC (95% CI)</td><td align="left" valign="top">Accuracy (95% CI)</td></tr></thead><tbody><tr><td align="left" valign="top" colspan="8">Prescribed drug (top 5)</td></tr><tr><td align="left" valign="top">Metformin hydrochloride, n (%)</td><td align="left" valign="top">1361 (45.55)</td><td align="left" valign="top">0.992 (0.989-0.995)</td><td align="left" valign="top">0.977 (0.971-0.982)</td><td align="left" valign="top">0.992 (0.989-0.995)</td><td align="left" valign="top">0.982 (0.978-0.987)</td><td align="left" valign="top">0.993 (0.990-0.996)</td><td align="left" valign="top">0.980 (0.975-0.985)</td></tr><tr><td align="left" valign="top">Sitagliptin phosphate hydrate, n (%)</td><td align="left" valign="top">425 (14.22)</td><td align="left" valign="top">0.991 (0.985-0.996)</td><td align="left" valign="top">0.988 (0.985-0.992)</td><td align="left" valign="top">0.994 (0.990-0.997)</td><td align="left" valign="top">0.990 (0.987-0.994)</td><td align="left" valign="top">0.996 (0.994-0.998)</td><td align="left" valign="top">0.992 (0.989-0.995)</td></tr><tr><td align="left" valign="top">Insulin aspart (genetical recombination), n (%)</td><td align="left" valign="top">403 (13.49)</td><td align="left" valign="top">0.993 (0.989-0.997)</td><td align="left" valign="top">0.985 (0.981-0.989)</td><td align="left" valign="top">0.996 (0.993-0.998)</td><td align="left" valign="top">0.985 (0.981-0.989)</td><td align="left" valign="top">0.995 (0.991-0.999)</td><td align="left" valign="top">0.993 (0.990-0.996)</td></tr><tr><td align="left" valign="top">Glimepiride, n (%)</td><td align="left" valign="top">358 (11.98)</td><td align="left" valign="top">0.988 (0.979-0.995)</td><td align="left" valign="top">0.991 (0.988-0.994)</td><td align="left" valign="top">0.991 (0.984-0.996)</td><td align="left" valign="top">0.994 (0.991-0.996)</td><td align="left" valign="top">0.995 (0.990-0.999)</td><td align="left" valign="top">0.992 (0.989-0.995)</td></tr><tr><td align="left" valign="top">Pioglitazone hydrochloride, n (%)</td><td align="left" valign="top">244 (8.17)</td><td align="left" valign="top">0.989 (0.978-0.998)</td><td align="left" valign="top">0.993 (0.990-0.996)</td><td align="left" valign="top">0.990 (0.979-0.999)</td><td align="left" valign="top">0.993 (0.990-0.996)</td><td align="left" valign="top">0.995 (0.992-0.997)</td><td align="left" valign="top">0.985 (0.981-0.989)</td></tr><tr><td align="left" valign="top" colspan="8">Prescribed drug (buttom 5)</td></tr><tr><td align="left" valign="top">Saxagliptin hydrate, n (%)</td><td align="left" valign="top">30 (1.00)</td><td align="left" valign="top">0.978 (0.944-1.000)</td><td align="left" valign="top">0.998 (0.996-0.999)</td><td align="left" valign="top">0.999 (0.999-1.000)</td><td align="left" valign="top">0.999 (0.998-1.000)</td><td align="left" valign="top">0.999 (0.999-1.000)</td><td align="left" valign="top">0.999 (0.998-1.000)</td></tr><tr><td align="left" valign="top">Anagliptin, n (%)</td><td align="left" valign="top">5 (0.17)</td><td align="left" valign="top">0.999 (0.998-1.000)</td><td align="left" valign="top">0.998 (0.996-0.999)</td><td align="left" valign="top">0.999 (0.999-1.000)</td><td align="left" valign="top">0.999 (0.998-1.000)</td><td align="left" valign="top">0.999 (0.998-1.000)</td><td align="left" valign="top">1.000 (0.999-1.000)</td></tr><tr><td align="left" valign="top">Insulin lispro (genetical recombination) [Insulin lispro Biosimilar 1], n (%)</td><td align="left" valign="top">58 (1.94)</td><td align="left" valign="top">0.945 (0.910-0.972)</td><td align="left" valign="top">0.986 (0.981-0.990)</td><td align="left" valign="top">0.848 (0.784-0.904)</td><td align="left" valign="top">0.981 (0.976-0.986)</td><td align="left" valign="top">0.799 (0.735-0.860)</td><td align="left" valign="top">0.981 (0.975-0.986)</td></tr><tr><td align="left" valign="top">Insulin glargine (genetical recombination) [Insulin glargin biosimilar 2], n (%)</td><td align="left" valign="top">1 (0.03)</td><td align="left" valign="top">0.938 (0.500-0.945)</td><td align="left" valign="top">0.996 (0.994-0.998)</td><td align="left" valign="top">0.990 (0.500-0.993)</td><td align="left" valign="top">0.999 (0.998-1.000)</td><td align="left" valign="top">0.938 (0.500-0.945)</td><td align="left" valign="top">1.000 (0.999-1.000)</td></tr><tr><td align="left" valign="top">Glibenclamide, n (%)</td><td align="left" valign="top">11 (0.37)</td><td align="left" valign="top">0.999 (0.999-1.000)</td><td align="left" valign="top">0.999 (0.997-1.000)</td><td align="left" valign="top">0.999 (0.999-1.000)</td><td align="left" valign="top">0.999 (0.997-1.000)</td><td align="left" valign="top">0.973 (0.935-0.999)</td><td align="left" valign="top">0.996 (0.994-0.998)</td></tr></tbody></table></table-wrap><p>The only drug that did not achieve the target value was &#x201C;Insulin lispro (genetical recombination) [Insulin lispro Biosimilar 1].&#x201D; The prescription of this drug began in 2020. Therefore, the same instances of prescription were present in all three training data periods. For this drug, the model trained on just 2 years of data had the highest ROC-AUC.</p></sec><sec id="s3-3"><title>Interpretability</title><p>The proposed model performed as well as other transformer-based models considering the ability for extracting relationships in time and meaning [<xref ref-type="bibr" rid="ref53">53</xref>]. The embedding vectors obtained through training represent the closeness of relationships between vectors as proximity. The embedding vectors in this experiment were the same 256 dimensions as the transformer hidden size. Projecting onto two dimensions using uniform manifold approximation and projection [<xref ref-type="bibr" rid="ref54">54</xref>] allows visualization (<xref ref-type="fig" rid="figure3">Figure 3</xref>). While we did not observe a strong tendency for clustering, several biosimilar drugs, such as insulin glargine (genetical recombination, ie, insulin glargin biosimilar 1), were positioned close to the biosimilar drug.</p><fig position="float" id="figure3"><label>Figure 3.</label><caption><p>Visualization of learned drug embedding vectors using uniform manifold approximation and projection. This plot displays a 2D representation of the relationships between 44 different diabetes drugs, as learned by the transformer model&#x2019;s encoder component. Each point corresponds to a specific diabetes drug. Proximity between points suggests that the model identified similarities in how these drugs were used or in the patient contexts associated with their prescription within the training dataset.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="medinform_v13i1e67748_fig03.png"/></fig></sec></sec><sec id="s4" sec-type="discussion"><title>Discussion</title><sec id="s4-1"><title>Evaluation of the Predictive Accuracy</title><p>The proposed model achieved impressive predictive accuracy, with macroaverages (95% CI) of ROC-AUC of 0.988 (0.980-0.993). In previous studies [<xref ref-type="bibr" rid="ref11">11</xref>,<xref ref-type="bibr" rid="ref12">12</xref>], the ROC-AUC for drugs was less than 0.95, and our model represents a significant improvement relative to this previous work.</p><p>The prediction accuracy was higher when trained with short-term data from 5 years than when trained using data from the past 10 years. We suspect that changes in the treatment environment, such as the introduction of new prescription drugs, are responsible for this difference in prediction accuracy. When training on data from the past N years, the model uniformly learns the prescription selection trends for the past N years. Therefore, when N is large, the model is heavily influenced by the trends of older prescription selections. This suspicion is supported by our results that the prescription drug that did not reach target accuracy, &#x201C;Insulin lispro (genetical recombination) [Insulin lispro Biosimilar 1],&#x201D; was only recently approved and prescribed. Introduced in 2020, this drug has remained relatively rare in the dataset, as demonstrated in <xref ref-type="table" rid="table1">Table 1</xref>. Even when expanding the training data period from 2 to 10 years, the number of prescriptions for this drug has remained stagnant at 59, and its proportion within the overall dataset has decreased from 0.23% to a mere 0.03%. This low frequency and temporal bias in the data have rendered learning this specific drug&#x2019;s patterns challenging. Although ML models generally perform better with more data, for this application it may be better to gather data from more hospitals rather than a longer time span, since it is desirable to learn more fresh data, including new prescription drugs. Transformer models, known for power-law characteristics, benefit from scale-ups [<xref ref-type="bibr" rid="ref38">38</xref>], and expanding the study to multiple hospitals could explore potential performance enhancements and test the applicability of the power-law in the medical field.</p><p>Physicians select drugs considering insulin secretion and insulin resistance, age, obesity, severity of chronic complications, and liver and kidney function. In this experiment, we used age, sex, 12 kinds of diabetes-related laboratory tests, and past prescription history. By adding comprehensive items likely used in medication selection to the model input, performance may be improved.</p><p>Our ultimate goal is to improve the treatment outcomes of diabetes. Merely predicting drug selection alone cannot achieve this goal. Expanding the scope to predict the impact of prescribed drugs could further enhance the model&#x2019;s utility in diabetes treatment.</p></sec><sec id="s4-2"><title>Limitations</title><p>Our study has notable limitations. First, the model uses only age, sex, 12 kinds of diabetes-related laboratory tests, and past prescription history as inputs. It is desirable to fully account for the various constraints and contraindications that physicians consider in real-world clinical practice. For example, when considering patient characteristics, factors such as age (older adults or pediatric), pregnancy, lactation, BMI, type of diabetes, c-peptide, renal and hepatic function, comorbidities, allergies, urinary tract infection history, diabetic ketoacidosis history, cardiac history, and hypoglycemia must be considered. Regarding medications, considerations include adverse effects, drug resistance, and cost. However, despite these limitations, this study demonstrates that it is possible to narrow down treatment options to some extent using a limited set of variables. We believe that this result holds promise for providing primary care physicians with some guidance and direction. Regarding warnings of constraints and contraindications in drug selection, CDSS have traditionally excelled in this [<xref ref-type="bibr" rid="ref20">20</xref>,<xref ref-type="bibr" rid="ref21">21</xref>] and can effectively complement this model. In addition, recent advancements in natural language processing within ML models [<xref ref-type="bibr" rid="ref33">33</xref>,<xref ref-type="bibr" rid="ref34">34</xref>] have enabled the extraction of important information on constraints and contraindications from fresh sources such as research papers published daily. We believe there is substantial potential for future research to integrate these important factors into ML models, and we intend to work on this improvement.</p><p>Second, the data were sourced from a single hospital, limiting generalizability. Potential biases in the results include the race and geography of the patients and the prescribing tendencies of a limited number of endocrinologists at the hospital. ML models tend to learn biases present in the training data, resulting in predictions that reflect those biases. Prediction accuracy is significantly degraded when different biases exist between the training data and the test data. Therefore, in order to generalize the prediction results of the model, a large dataset of data from multiple hospitals containing data on patients with diverse backgrounds is required. However, in reality, it is difficult to build an ideal dataset due to constraints such as privacy protection and data collection costs. As one solution, we believe that it is good to collect training data that resembles the patterns of patients treated by the primary care physicians who are the users of the model, thereby eliminating biase differences between the training data and the test data as much as possible. Specifically, we collect EHRs of patients who have been involved in prescriptions by endocrinologists at multiple hospitals in a specific region, and use this to build the model that selects prescription drugs for patients treated by primary care physicians in the same region. We believe that this approach will reduce the bias differences in regional characteristics between the training data and the test data, and improve generalization performance with realistic data collection. We would like to verify the validity of this solution in the future.</p><p>Third, ML reflects majority characteristics, potentially limiting applicability to diverse patient populations. In the dataset used in the experiment, over 40% (297/637) of patients were prescribed metformin hydrochloride, and patient characteristics are biased. There is a risk that truly effective treatments may not be prescribed correctly to a minority of patients. Prediction failure analysis needs to be further scrutinized, including versus patient characteristics. We should examine this issue by comparing prediction accuracy for each patient cluster.</p><p>Fourth, this was a backward-looking study, using past data, and the essential next phase is to assess the model&#x2019;s predictive capabilities in clinical practice. There is a need for a careful exploration of the model&#x2019;s effectiveness in real clinical scenarios.</p><p>Fifth, while the proposed model requires hyperparameters, we determined these values based on previous studies. Although fine-tuning hyperparameters is generally desirable, transformer models are typically computationally expensive to train, and many previous studies have likewise not fully tuned their parameters. There is potential for performance improvement through hyperparameter tuning, and we intend to investigate this further in future work.</p><p>Sixth, the model has poor interpretability. We investigated the proximity relationship between embedding vectors, but no strong tendency was found. It would be better to use other information obtained from the transformer, such as attention weights, to further improve interpretability.</p><p>These limitations raise important ethical considerations in the development and application of medical artificial intelligence. Physicians who use the model must be aware of these limitations and exercise appropriate clinical judgment. Obtaining appropriate informed consent from patients is important.</p></sec><sec id="s4-3"><title>Conclusions</title><p>The proposed model addresses the challenge of predicting the next prescribed drugs. This model, trained using past prescriptions of endocrinologists, has the potential to improve treatment outcomes for nonspecialists by assisting them in making prescription decisions. Future efforts should focus on improving accuracy by incorporating disease state information beyond current inputs and validating the model on large clinical datasets across multiple hospitals.</p></sec></sec></body><back><ack><p>We thank Daniel Lane for his support in manuscript editing and scientific discussions. We made no use of generative AI in the development of this paper.</p><p>This work was funded by The University of Tokyo and Nippon Telegraph and Telephone Corporation in a joint research program at the University of Tokyo Center of Innovation, Sustainable Life Care, and the Ageless Society dedicated to Self-managing Healthcare in the Aging Society of Japan. The funding source had no role in the design and conduct of the study; collection, management, analysis, and interpretation of the data; preparation, review, or approval of the manuscript; and decision to submit the manuscript for publication. The content is solely the responsibility of the authors and does not necessarily represent the official views of the University of Tokyo Center of Innovation.</p></ack><notes><sec><title>Data Availability</title><p>The datasets analyzed during this study are not publicly available due the restrictions imposed by the research ethics committees that approved this study.</p></sec></notes><fn-group><fn fn-type="conflict"><p>HK, EN, AF, NS, and NN are employees of Nippon Telegraph and Telephone Corporation (NTT), Tokyo, Japan.</p></fn></fn-group><glossary><title>Abbreviations</title><def-list><def-item><term id="abb1">CDSS</term><def><p>clinical decision support system</p></def></def-item><def-item><term id="abb2">EHR</term><def><p>electronic health record</p></def></def-item><def-item><term id="abb3">LightGBM</term><def><p>light gradient boosting machine</p></def></def-item><def-item><term id="abb4">ML</term><def><p> machine learning</p></def></def-item><def-item><term id="abb5">RNN</term><def><p>recurrent neural network</p></def></def-item><def-item><term id="abb6">ROC-AUC</term><def><p> area under the receiver operating characteristic curve</p></def></def-item><def-item><term id="abb7">T2D</term><def><p>type 2 diabete</p></def></def-item></def-list></glossary><ref-list><title>References</title><ref id="ref1"><label>1</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><collab>GBD 2021 Diabetes Collaborators</collab></person-group><article-title>Global, regional, and national burden of diabetes from 1990 to 2021, with projections of prevalence to 2050: a systematic analysis for the Global Burden of Disease Study 2021</article-title><source>Lancet</source><year>2023</year><month>07</month><day>15</day><volume>402</volume><issue>10397</issue><fpage>203</fpage><lpage>234</lpage><pub-id pub-id-type="doi">10.1016/S0140-6736(23)01301-6</pub-id><pub-id pub-id-type="medline">37356446</pub-id></nlm-citation></ref><ref id="ref2"><label>2</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Davies</surname><given-names>MJ</given-names> </name><name name-style="western"><surname>Aroda</surname><given-names>VR</given-names> </name><name name-style="western"><surname>Collins</surname><given-names>BS</given-names> </name><etal/></person-group><article-title>Management of hyperglycaemia in type 2 diabetes, 2022. A consensus report by the American Diabetes Association (ADA) and the European Association for the Study of Diabetes (EASD)</article-title><source>Diabetologia</source><year>2022</year><month>12</month><volume>65</volume><issue>12</issue><fpage>1925</fpage><lpage>1966</lpage><pub-id pub-id-type="doi">10.1007/s00125-022-05787-2</pub-id><pub-id pub-id-type="medline">36151309</pub-id></nlm-citation></ref><ref id="ref3"><label>3</label><nlm-citation citation-type="web"><article-title>Primary care physicians&#x2019; practices in diabetes treatment</article-title><year>2024</year><access-date>2025-05-29</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.jdome.jp/doc/jdome-2021-64jds.pdf">https://www.jdome.jp/doc/jdome-2021-64jds.pdf</ext-link></comment></nlm-citation></ref><ref id="ref4"><label>4</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lu</surname><given-names>H</given-names> </name><name name-style="western"><surname>Holt</surname><given-names>JB</given-names> </name><name name-style="western"><surname>Cheng</surname><given-names>YJ</given-names> </name><name name-style="western"><surname>Zhang</surname><given-names>X</given-names> </name><name name-style="western"><surname>Onufrak</surname><given-names>S</given-names> </name><name name-style="western"><surname>Croft</surname><given-names>JB</given-names> </name></person-group><article-title>Population-based geographic access to endocrinologists in the United States, 2012</article-title><source>BMC Health Serv Res</source><year>2015</year><month>12</month><day>7</day><volume>15</volume><issue>1</issue><fpage>541</fpage><pub-id pub-id-type="doi">10.1186/s12913-015-1185-5</pub-id><pub-id pub-id-type="medline">26644021</pub-id></nlm-citation></ref><ref id="ref5"><label>5</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Bolen</surname><given-names>S</given-names> </name><name name-style="western"><surname>Feldman</surname><given-names>L</given-names> </name><name name-style="western"><surname>Vassy</surname><given-names>J</given-names> </name><etal/></person-group><article-title>Systematic review: comparative effectiveness and safety of oral medications for type 2 diabetes mellitus</article-title><source>Ann Intern Med</source><year>2007</year><month>09</month><day>18</day><volume>147</volume><issue>6</issue><fpage>386</fpage><lpage>399</lpage><pub-id pub-id-type="doi">10.7326/0003-4819-147-6-200709180-00178</pub-id><pub-id pub-id-type="medline">17638715</pub-id></nlm-citation></ref><ref id="ref6"><label>6</label><nlm-citation citation-type="report"><person-group person-group-type="author"><name name-style="western"><surname>Bolen</surname><given-names>S</given-names> </name><name name-style="western"><surname>Tseng</surname><given-names>E</given-names> </name><name name-style="western"><surname>Hutfless</surname><given-names>S</given-names> </name><etal/></person-group><article-title>Diabetes medications for adults with type 2 diabetes: an update [internet]</article-title><year>2016</year><publisher-name>Rockville (MD): Agency for Healthcare Research and Quality (US)</publisher-name><comment>16-EHC013-EF</comment><pub-id pub-id-type="medline">27227214</pub-id></nlm-citation></ref><ref id="ref7"><label>7</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><collab>American Diabetes Association Professional Practice Committee</collab></person-group><article-title>Erratum. 9. Pharmacologic approaches to glycemic treatment: standards of care in diabetes-2024. Diabetes Care 2024;47(Suppl. 1):S158-S178</article-title><source>Diabetes Care</source><year>2024</year><month>07</month><day>1</day><volume>47</volume><issue>7</issue><fpage>S158</fpage><lpage>S178</lpage><pub-id pub-id-type="doi">10.2337/dc24-er07a</pub-id><pub-id pub-id-type="medline">38696224</pub-id></nlm-citation></ref><ref id="ref8"><label>8</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Wilcox</surname><given-names>G</given-names> </name></person-group><article-title>Insulin and insulin resistance</article-title><source>Clin Biochem Rev</source><year>2005</year><month>05</month><volume>26</volume><issue>2</issue><fpage>19</fpage><lpage>39</lpage><pub-id pub-id-type="medline">16278749</pub-id></nlm-citation></ref><ref id="ref9"><label>9</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><collab>American Diabetes Association Professional Practice Committee</collab></person-group><article-title>13. Older adults: standards of care in diabetes-2024</article-title><source>Diabetes Care</source><year>2024</year><month>01</month><day>1</day><volume>47</volume><issue>Suppl 1</issue><fpage>S244</fpage><lpage>S257</lpage><pub-id pub-id-type="doi">10.2337/dc24-S013</pub-id><pub-id pub-id-type="medline">38078580</pub-id></nlm-citation></ref><ref id="ref10"><label>10</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Babiker</surname><given-names>A</given-names> </name><name name-style="western"><surname>Al Dubayee</surname><given-names>M</given-names> </name></person-group><article-title>Anti-diabetic medications: How to make a choice?</article-title><source>Sudan J Paediatr</source><year>2017</year><volume>17</volume><issue>2</issue><fpage>11</fpage><lpage>20</lpage><pub-id pub-id-type="doi">10.24911/SJP.2017.2.12</pub-id><pub-id pub-id-type="medline">29545660</pub-id></nlm-citation></ref><ref id="ref11"><label>11</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><collab>American Diabetes Association Professional Practice Committee</collab></person-group><article-title>8. Obesity and weight management for the prevention and treatment of type 2 diabetes: standards of care in diabetes-2024</article-title><source>Diabetes Care</source><year>2024</year><month>01</month><day>1</day><volume>47</volume><issue>Suppl 1</issue><fpage>S145</fpage><lpage>S157</lpage><pub-id pub-id-type="doi">10.2337/dc24-S008</pub-id><pub-id pub-id-type="medline">38078578</pub-id></nlm-citation></ref><ref id="ref12"><label>12</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Steiger</surname><given-names>K</given-names> </name><name name-style="western"><surname>Herrin</surname><given-names>J</given-names> </name><name name-style="western"><surname>Swarna</surname><given-names>KS</given-names> </name><name name-style="western"><surname>Davis</surname><given-names>EM</given-names> </name><name name-style="western"><surname>McCoy</surname><given-names>RG</given-names> </name></person-group><article-title>Disparities in acute and chronic complications of diabetes along the U.S. rural-urban continuum</article-title><source>Diabetes Care</source><year>2024</year><month>05</month><day>1</day><volume>47</volume><issue>5</issue><fpage>818</fpage><lpage>825</lpage><pub-id pub-id-type="doi">10.2337/dc23-1552</pub-id><pub-id pub-id-type="medline">38387066</pub-id></nlm-citation></ref><ref id="ref13"><label>13</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><collab>American Diabetes Association Professional Practice Committee</collab></person-group><article-title>11. Chronic kidney disease and risk management: standards of care in diabetes-2024</article-title><source>Diabetes Care</source><year>2024</year><month>01</month><day>1</day><volume>47</volume><issue>Suppl 1</issue><fpage>S219</fpage><lpage>S230</lpage><pub-id pub-id-type="doi">10.2337/dc24-S011</pub-id><pub-id pub-id-type="medline">38078574</pub-id></nlm-citation></ref><ref id="ref14"><label>14</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Vasilakou</surname><given-names>D</given-names> </name><name name-style="western"><surname>Karagiannis</surname><given-names>T</given-names> </name><name name-style="western"><surname>Athanasiadou</surname><given-names>E</given-names> </name><etal/></person-group><article-title>Sodium-glucose cotransporter 2 inhibitors for type 2 diabetes: a systematic review and meta-analysis</article-title><source>Ann Intern Med</source><year>2013</year><month>08</month><day>20</day><volume>159</volume><issue>4</issue><fpage>262</fpage><lpage>274</lpage><pub-id pub-id-type="doi">10.7326/0003-4819-159-4-201308200-00007</pub-id><pub-id pub-id-type="medline">24026259</pub-id></nlm-citation></ref><ref id="ref15"><label>15</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Hallakou-Bozec</surname><given-names>S</given-names> </name><name name-style="western"><surname>Vial</surname><given-names>G</given-names> </name><name name-style="western"><surname>Kergoat</surname><given-names>M</given-names> </name><etal/></person-group><article-title>Mechanism of action of Imeglimin: a novel therapeutic agent for type 2 diabetes</article-title><source>Diabetes Obes Metab</source><year>2021</year><month>03</month><volume>23</volume><issue>3</issue><fpage>664</fpage><lpage>673</lpage><pub-id pub-id-type="doi">10.1111/dom.14277</pub-id><pub-id pub-id-type="medline">33269554</pub-id></nlm-citation></ref><ref id="ref16"><label>16</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Karagiannis</surname><given-names>T</given-names> </name><name name-style="western"><surname>Avgerinos</surname><given-names>I</given-names> </name><name name-style="western"><surname>Liakos</surname><given-names>A</given-names> </name><etal/></person-group><article-title>Management of type 2 diabetes with the dual GIP/GLP-1 receptor agonist tirzepatide: a systematic review and meta-analysis</article-title><source>Diabetologia</source><year>2022</year><month>08</month><volume>65</volume><issue>8</issue><fpage>1251</fpage><lpage>1261</lpage><pub-id pub-id-type="doi">10.1007/s00125-022-05715-4</pub-id><pub-id pub-id-type="medline">35579691</pub-id></nlm-citation></ref><ref id="ref17"><label>17</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><collab>American Diabetes Association</collab></person-group><article-title>Standards of Care in Diabetes-2023 Abridged for Primary Care Providers</article-title><source>Clin Diabetes</source><year>2022</year><volume>41</volume><issue>1</issue><fpage>4</fpage><lpage>31</lpage><pub-id pub-id-type="doi">10.2337/cd23-as01</pub-id><pub-id pub-id-type="medline">36714254</pub-id></nlm-citation></ref><ref id="ref18"><label>18</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Bouchi</surname><given-names>R</given-names> </name><name name-style="western"><surname>Sugiyama</surname><given-names>T</given-names> </name><name name-style="western"><surname>Goto</surname><given-names>A</given-names> </name><etal/></person-group><article-title>Retrospective nationwide study on the trends in first-line antidiabetic medication for patients with type&#x2009;2 diabetes in Japan</article-title><source>J Diabetes Investig</source><year>2022</year><month>02</month><volume>13</volume><issue>2</issue><fpage>280</fpage><lpage>291</lpage><pub-id pub-id-type="doi">10.1111/jdi.13636</pub-id><pub-id pub-id-type="medline">34309213</pub-id></nlm-citation></ref><ref id="ref19"><label>19</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Sutton</surname><given-names>RT</given-names> </name><name name-style="western"><surname>Pincock</surname><given-names>D</given-names> </name><name name-style="western"><surname>Baumgart</surname><given-names>DC</given-names> </name><name name-style="western"><surname>Sadowski</surname><given-names>DC</given-names> </name><name name-style="western"><surname>Fedorak</surname><given-names>RN</given-names> </name><name name-style="western"><surname>Kroeker</surname><given-names>KI</given-names> </name></person-group><article-title>An overview of clinical decision support systems: benefits, risks, and strategies for success</article-title><source>NPJ Digit Med</source><year>2020</year><volume>3</volume><fpage>17</fpage><pub-id pub-id-type="doi">10.1038/s41746-020-0221-y</pub-id><pub-id pub-id-type="medline">32047862</pub-id></nlm-citation></ref><ref id="ref20"><label>20</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Helmons</surname><given-names>PJ</given-names> </name><name name-style="western"><surname>Suijkerbuijk</surname><given-names>BO</given-names> </name><name name-style="western"><surname>Nannan Panday</surname><given-names>PV</given-names> </name><name name-style="western"><surname>Kosterink</surname><given-names>JGW</given-names> </name></person-group><article-title>Drug-drug interaction checking assisted by clinical decision support: a return on investment analysis</article-title><source>J Am Med Inform Assoc</source><year>2015</year><month>07</month><volume>22</volume><issue>4</issue><fpage>764</fpage><lpage>772</lpage><pub-id pub-id-type="doi">10.1093/jamia/ocu010</pub-id><pub-id pub-id-type="medline">25670751</pub-id></nlm-citation></ref><ref id="ref21"><label>21</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Koutkias</surname><given-names>V</given-names> </name><name name-style="western"><surname>Bouaud</surname><given-names>J</given-names> </name><collab>Section Editors for the IMIA Yearbook Section on Decision Support</collab></person-group><article-title>Contributions from the 2017 literature on clinical decision support</article-title><source>Yearb Med Inform</source><year>2018</year><month>08</month><volume>27</volume><issue>1</issue><fpage>122</fpage><lpage>128</lpage><pub-id pub-id-type="doi">10.1055/s-0038-1641222</pub-id><pub-id pub-id-type="medline">30157515</pub-id></nlm-citation></ref><ref id="ref22"><label>22</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Zou</surname><given-names>Q</given-names> </name><name name-style="western"><surname>Qu</surname><given-names>K</given-names> </name><name name-style="western"><surname>Luo</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Yin</surname><given-names>D</given-names> </name><name name-style="western"><surname>Ju</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Tang</surname><given-names>H</given-names> </name></person-group><article-title>Predicting diabetes mellitus with machine learning techniques</article-title><source>Front Genet</source><year>2018</year><volume>9</volume><fpage>515</fpage><pub-id pub-id-type="doi">10.3389/fgene.2018.00515</pub-id><pub-id pub-id-type="medline">30459809</pub-id></nlm-citation></ref><ref id="ref23"><label>23</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Dagliati</surname><given-names>A</given-names> </name><name name-style="western"><surname>Marini</surname><given-names>S</given-names> </name><name name-style="western"><surname>Sacchi</surname><given-names>L</given-names> </name><etal/></person-group><article-title>Machine learning methods to predict diabetes complications</article-title><source>J Diabetes Sci Technol</source><year>2018</year><month>03</month><volume>12</volume><issue>2</issue><fpage>295</fpage><lpage>302</lpage><pub-id pub-id-type="doi">10.1177/1932296817706375</pub-id><pub-id pub-id-type="medline">28494618</pub-id></nlm-citation></ref><ref id="ref24"><label>24</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Fujihara</surname><given-names>K</given-names> </name><name name-style="western"><surname>Sone</surname><given-names>H</given-names> </name></person-group><article-title>Machine learning approach to drug treatment strategy for diabetes care</article-title><source>Diabetes Metab J</source><year>2023</year><month>05</month><volume>47</volume><issue>3</issue><fpage>325</fpage><lpage>332</lpage><pub-id pub-id-type="doi">10.4093/dmj.2022.0349</pub-id><pub-id pub-id-type="medline">36631990</pub-id></nlm-citation></ref><ref id="ref25"><label>25</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Wright</surname><given-names>AP</given-names> </name><name name-style="western"><surname>Wright</surname><given-names>AT</given-names> </name><name name-style="western"><surname>McCoy</surname><given-names>AB</given-names> </name><name name-style="western"><surname>Sittig</surname><given-names>DF</given-names> </name></person-group><article-title>The use of sequential pattern mining to predict next prescribed medications</article-title><source>J Biomed Inform</source><year>2015</year><month>02</month><volume>53</volume><fpage>73</fpage><lpage>80</lpage><pub-id pub-id-type="doi">10.1016/j.jbi.2014.09.003</pub-id><pub-id pub-id-type="medline">25236952</pub-id></nlm-citation></ref><ref id="ref26"><label>26</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Mei</surname><given-names>J</given-names> </name><name name-style="western"><surname>Zhao</surname><given-names>S</given-names> </name><name name-style="western"><surname>Jin</surname><given-names>F</given-names> </name><etal/></person-group><article-title>Deep diabetologist: learning to prescribe hypoglycemic medications with recurrent neural networks</article-title><source>Stud Health Technol Inform</source><year>2017</year><volume>245</volume><issue>1277</issue><fpage>29295362</fpage><pub-id pub-id-type="medline">29295362</pub-id></nlm-citation></ref><ref id="ref27"><label>27</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Tarumi</surname><given-names>S</given-names> </name><name name-style="western"><surname>Takeuchi</surname><given-names>W</given-names> </name><name name-style="western"><surname>Chalkidis</surname><given-names>G</given-names> </name><etal/></person-group><article-title>Leveraging artificial intelligence to improve chronic disease care: methods and application to pharmacotherapy decision support for type-2 diabetes mellitus</article-title><source>Methods Inf Med</source><year>2021</year><month>06</month><volume>60</volume><issue>S 01</issue><fpage>e32</fpage><lpage>e43</lpage><pub-id pub-id-type="doi">10.1055/s-0041-1728757</pub-id><pub-id pub-id-type="medline">33975376</pub-id></nlm-citation></ref><ref id="ref28"><label>28</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>Vaswani</surname><given-names>A</given-names> </name><name name-style="western"><surname>Shazeer</surname><given-names>N</given-names> </name><name name-style="western"><surname>Parmar</surname><given-names>N</given-names> </name><etal/></person-group><article-title>Attention is all you need</article-title><year>2017</year><conf-name>Proceedings of the 31st Annual Conference on Neural Information Processing Systems (NIPS&#x2019;17)</conf-name><conf-date>Dec 4-9, 2017</conf-date><conf-loc>Long Beach, California, USA</conf-loc><fpage>6000</fpage><lpage>6010</lpage><comment><ext-link ext-link-type="uri" xlink:href="https://dl.acm.org/doi/10.5555/3295222.3295349">https://dl.acm.org/doi/10.5555/3295222.3295349</ext-link></comment></nlm-citation></ref><ref id="ref29"><label>29</label><nlm-citation citation-type="other"><person-group person-group-type="author"><name name-style="western"><surname>Bommasani</surname><given-names>R</given-names> </name><name name-style="western"><surname>Hudson</surname><given-names>DA</given-names> </name><name name-style="western"><surname>Adeli</surname><given-names>E</given-names> </name><etal/></person-group><article-title>On the opportunities and risks of foundation models</article-title><source>arXiv</source><comment>Preprint posted online on 2021</comment><pub-id pub-id-type="doi">10.48550/arXiv.2108.07258</pub-id></nlm-citation></ref><ref id="ref30"><label>30</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>Lakew</surname><given-names>SM</given-names> </name><name name-style="western"><surname>Cettolo</surname><given-names>M</given-names> </name><name name-style="western"><surname>Federico</surname><given-names>M</given-names> </name></person-group><article-title>A comparison of transformer and recurrent neural networks on multilingual neural machine translation</article-title><conf-name>Proceedings of the 27th International Conference on Computational Linguistics (COLING 2018)</conf-name><conf-date>Aug 20-26, 2018</conf-date><conf-loc>Santa Fe, New Mexico, USA</conf-loc><fpage>641</fpage><lpage>652</lpage><comment><ext-link ext-link-type="uri" xlink:href="https://aclanthology.org/C18-1054/">https://aclanthology.org/C18-1054/</ext-link></comment></nlm-citation></ref><ref id="ref31"><label>31</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>Zerveas</surname><given-names>G</given-names> </name><name name-style="western"><surname>Jayaraman</surname><given-names>S</given-names> </name><name name-style="western"><surname>Patel</surname><given-names>D</given-names> </name><name name-style="western"><surname>Bhamidipaty</surname><given-names>A</given-names> </name><name name-style="western"><surname>Eickhoff</surname><given-names>C</given-names> </name></person-group><article-title>A transformer-based framework for multivariate time series representation learning</article-title><conf-name>KDD &#x2019;21: Proceedings of the 27th ACM SIGKDD Conference on Knowledge Discovery &#x0026; Data Mining</conf-name><conf-date>Aug 14, 2021</conf-date><conf-loc>Virtual Event Singapore</conf-loc><fpage>2114</fpage><lpage>2124</lpage><pub-id pub-id-type="doi">10.1145/3447548.3467401</pub-id></nlm-citation></ref><ref id="ref32"><label>32</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Zhou</surname><given-names>H</given-names> </name><name name-style="western"><surname>Zhang</surname><given-names>S</given-names> </name><name name-style="western"><surname>Peng</surname><given-names>J</given-names> </name><etal/></person-group><article-title>Informer: beyond efficient transformer for long sequence time-series forecasting</article-title><source>AAAI</source><year>2021</year><volume>35</volume><issue>12</issue><fpage>11106</fpage><lpage>11115</lpage><pub-id pub-id-type="doi">10.1609/aaai.v35i12.17325</pub-id></nlm-citation></ref><ref id="ref33"><label>33</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lin</surname><given-names>T</given-names> </name><name name-style="western"><surname>Wang</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Liu</surname><given-names>X</given-names> </name><name name-style="western"><surname>Qiu</surname><given-names>X</given-names> </name></person-group><article-title>A survey of transformers</article-title><source>AI Open</source><year>2022</year><volume>3</volume><fpage>111</fpage><lpage>132</lpage><pub-id pub-id-type="doi">10.1016/j.aiopen.2022.10.001</pub-id></nlm-citation></ref><ref id="ref34"><label>34</label><nlm-citation citation-type="other"><person-group person-group-type="author"><name name-style="western"><surname>Devlin</surname><given-names>J</given-names> </name><name name-style="western"><surname>Chang</surname><given-names>MW</given-names> </name><name name-style="western"><surname>Lee</surname><given-names>K</given-names> </name><name name-style="western"><surname>Toutanova</surname><given-names>K</given-names> </name></person-group><article-title>Bert: pre-training of deep bidirectional transformers for language understanding</article-title><source>arXiv</source><comment>Preprint posted online on 2018</comment><pub-id pub-id-type="doi">10.48550/arXiv.1810.04805</pub-id></nlm-citation></ref><ref id="ref35"><label>35</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Yang</surname><given-names>Z</given-names> </name><name name-style="western"><surname>Mitra</surname><given-names>A</given-names> </name><name name-style="western"><surname>Liu</surname><given-names>W</given-names> </name><name name-style="western"><surname>Berlowitz</surname><given-names>D</given-names> </name><name name-style="western"><surname>Yu</surname><given-names>H</given-names> </name></person-group><article-title>TransformEHR: transformer-based encoder-decoder generative model to enhance prediction of disease outcomes using electronic health records</article-title><source>Nat Commun</source><year>2023</year><month>11</month><day>29</day><volume>14</volume><issue>1</issue><fpage>7857</fpage><pub-id pub-id-type="doi">10.1038/s41467-023-43715-z</pub-id><pub-id pub-id-type="medline">38030638</pub-id></nlm-citation></ref><ref id="ref36"><label>36</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Li</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Rao</surname><given-names>S</given-names> </name><name name-style="western"><surname>Solares</surname><given-names>JRA</given-names> </name><etal/></person-group><article-title>BEHRT: transformer for electronic health records</article-title><source>Sci Rep</source><year>2020</year><volume>10</volume><issue>1</issue><fpage>7155</fpage><pub-id pub-id-type="doi">10.1038/s41598-020-62922-y</pub-id></nlm-citation></ref><ref id="ref37"><label>37</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kraljevic</surname><given-names>Z</given-names> </name><name name-style="western"><surname>Bean</surname><given-names>D</given-names> </name><name name-style="western"><surname>Shek</surname><given-names>A</given-names> </name><etal/></person-group><article-title>Foresight-a generative pretrained transformer for modelling of patient timelines using electronic health records: a retrospective modelling study</article-title><source>Lancet Digit Health</source><year>2024</year><month>04</month><volume>6</volume><issue>4</issue><fpage>e281</fpage><lpage>e290</lpage><pub-id pub-id-type="doi">10.1016/S2589-7500(24)00025-6</pub-id><pub-id pub-id-type="medline">38519155</pub-id></nlm-citation></ref><ref id="ref38"><label>38</label><nlm-citation citation-type="other"><person-group person-group-type="author"><name name-style="western"><surname>Henighan</surname><given-names>T</given-names> </name><name name-style="western"><surname>Kaplan</surname><given-names>J</given-names> </name><name name-style="western"><surname>Katz</surname><given-names>M</given-names> </name><etal/></person-group><article-title>Scaling laws for autoregressive generative modeling</article-title><source>arXiv</source><comment>Preprint posted online on 2020</comment><pub-id pub-id-type="doi">10.48550/arXiv.2010.14701</pub-id></nlm-citation></ref><ref id="ref39"><label>39</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Waki</surname><given-names>K</given-names> </name><name name-style="western"><surname>Fujita</surname><given-names>H</given-names> </name><name name-style="western"><surname>Uchimura</surname><given-names>Y</given-names> </name><etal/></person-group><article-title>DialBetics: a novel smartphone-based self-management support system for type 2 diabetes patients</article-title><source>J Diabetes Sci Technol</source><year>2014</year><month>03</month><volume>8</volume><issue>2</issue><fpage>209</fpage><lpage>215</lpage><pub-id pub-id-type="doi">10.1177/1932296814526495</pub-id><pub-id pub-id-type="medline">24876569</pub-id></nlm-citation></ref><ref id="ref40"><label>40</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kurasawa</surname><given-names>H</given-names> </name><name name-style="western"><surname>Hayashi</surname><given-names>K</given-names> </name><name name-style="western"><surname>Fujino</surname><given-names>A</given-names> </name><etal/></person-group><article-title>Machine-learning-based prediction of a missed scheduled clinical appointment by patients with diabetes</article-title><source>J Diabetes Sci Technol</source><year>2016</year><month>05</month><volume>10</volume><issue>3</issue><fpage>730</fpage><lpage>736</lpage><pub-id pub-id-type="doi">10.1177/1932296815614866</pub-id><pub-id pub-id-type="medline">26555782</pub-id></nlm-citation></ref><ref id="ref41"><label>41</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kurasawa</surname><given-names>H</given-names> </name><name name-style="western"><surname>Waki</surname><given-names>K</given-names> </name><name name-style="western"><surname>Chiba</surname><given-names>A</given-names> </name><etal/></person-group><article-title>Treatment discontinuation prediction in patients with diabetes using a ranking model: machine learning model development</article-title><source>JMIR Bioinform Biotechnol</source><year>2022</year><month>09</month><day>23</day><volume>3</volume><issue>1</issue><fpage>e37951</fpage><pub-id pub-id-type="doi">10.2196/37951</pub-id><pub-id pub-id-type="medline">38935955</pub-id></nlm-citation></ref><ref id="ref42"><label>42</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Sugiyama</surname><given-names>T</given-names> </name><name name-style="western"><surname>Miyo</surname><given-names>K</given-names> </name><name name-style="western"><surname>Tsujimoto</surname><given-names>T</given-names> </name><etal/></person-group><article-title>Design of and rationale for the Japan diabetes comprehensive database project based on an advanced electronic medical record system (J-DREAMS)</article-title><source>Diabetol Int</source><year>2017</year><month>11</month><volume>8</volume><issue>4</issue><fpage>375</fpage><lpage>382</lpage><pub-id pub-id-type="doi">10.1007/s13340-017-0326-y</pub-id><pub-id pub-id-type="medline">30603343</pub-id></nlm-citation></ref><ref id="ref43"><label>43</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Mooradian</surname><given-names>AD</given-names> </name></person-group><article-title>Dyslipidemia in type 2 diabetes mellitus</article-title><source>Nat Clin Pract Endocrinol Metab</source><year>2009</year><month>03</month><volume>5</volume><issue>3</issue><fpage>150</fpage><lpage>159</lpage><pub-id pub-id-type="doi">10.1038/ncpendmet1066</pub-id><pub-id pub-id-type="medline">19229235</pub-id></nlm-citation></ref><ref id="ref44"><label>44</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Thomas</surname><given-names>MC</given-names> </name><name name-style="western"><surname>Brownlee</surname><given-names>M</given-names> </name><name name-style="western"><surname>Susztak</surname><given-names>K</given-names> </name><etal/></person-group><article-title>Diabetic kidney disease</article-title><source>Nat Rev Dis Primers</source><year>2015</year><month>07</month><day>30</day><volume>1</volume><fpage>15018</fpage><pub-id pub-id-type="doi">10.1038/nrdp.2015.18</pub-id><pub-id pub-id-type="medline">27188921</pub-id></nlm-citation></ref><ref id="ref45"><label>45</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>El-Serag</surname><given-names>HB</given-names> </name><name name-style="western"><surname>Tran</surname><given-names>T</given-names> </name><name name-style="western"><surname>Everhart</surname><given-names>JE</given-names> </name></person-group><article-title>Diabetes increases the risk of chronic liver disease and hepatocellular carcinoma</article-title><source>Gastroenterology</source><year>2004</year><month>02</month><volume>126</volume><issue>2</issue><fpage>460</fpage><lpage>468</lpage><pub-id pub-id-type="doi">10.1053/j.gastro.2003.10.065</pub-id><pub-id pub-id-type="medline">14762783</pub-id></nlm-citation></ref><ref id="ref46"><label>46</label><nlm-citation citation-type="web"><article-title>List of drugs covered by the drug price standards and information on generic pharmaceuticals [Website in Japanese]</article-title><year>2024</year><access-date>2025-05-29</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.mhlw.go.jp/topics/2023/04/tp20230401-01.html">https://www.mhlw.go.jp/topics/2023/04/tp20230401-01.html</ext-link></comment></nlm-citation></ref><ref id="ref47"><label>47</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kazijevs</surname><given-names>M</given-names> </name><name name-style="western"><surname>Samad</surname><given-names>MD</given-names> </name></person-group><article-title>Deep imputation of missing values in time series health data: A review with benchmarking</article-title><source>J Biomed Inform</source><year>2023</year><month>08</month><volume>144</volume><fpage>104440</fpage><pub-id pub-id-type="doi">10.1016/j.jbi.2023.104440</pub-id><pub-id pub-id-type="medline">37429511</pub-id></nlm-citation></ref><ref id="ref48"><label>48</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lin</surname><given-names>TY</given-names> </name><name name-style="western"><surname>Goyal</surname><given-names>P</given-names> </name><name name-style="western"><surname>Girshick</surname><given-names>R</given-names> </name><name name-style="western"><surname>He</surname><given-names>K</given-names> </name><name name-style="western"><surname>Dollar</surname><given-names>P</given-names> </name></person-group><article-title>Focal loss for dense object detection</article-title><source>IEEE Trans Pattern Anal Mach Intell</source><year>2020</year><month>02</month><volume>42</volume><issue>2</issue><fpage>318</fpage><lpage>327</lpage><pub-id pub-id-type="doi">10.1109/TPAMI.2018.2858826</pub-id><pub-id pub-id-type="medline">30040631</pub-id></nlm-citation></ref><ref id="ref49"><label>49</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Seto</surname><given-names>H</given-names> </name><name name-style="western"><surname>Oyama</surname><given-names>A</given-names> </name><name name-style="western"><surname>Kitora</surname><given-names>S</given-names> </name><etal/></person-group><article-title>Author Correction: Gradient boosting decision tree becomes more reliable than logistic regression in predicting probability for diabetes with big data</article-title><source>Sci Rep</source><year>2022</year><month>12</month><day>30</day><volume>12</volume><issue>1</issue><fpage>22599</fpage><pub-id pub-id-type="doi">10.1038/s41598-022-27052-7</pub-id><pub-id pub-id-type="medline">36585468</pub-id></nlm-citation></ref><ref id="ref50"><label>50</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Rufo</surname><given-names>DD</given-names> </name><name name-style="western"><surname>Debelee</surname><given-names>TG</given-names> </name><name name-style="western"><surname>Ibenthal</surname><given-names>A</given-names> </name><name name-style="western"><surname>Negera</surname><given-names>WG</given-names> </name></person-group><article-title>Diagnosis of diabetes mellitus using gradient boosting machine (LightGBM)</article-title><source>Diagnostics (Basel)</source><year>2021</year><month>09</month><day>19</day><volume>11</volume><issue>9</issue><fpage>1714</fpage><pub-id pub-id-type="doi">10.3390/diagnostics11091714</pub-id><pub-id pub-id-type="medline">34574055</pub-id></nlm-citation></ref><ref id="ref51"><label>51</label><nlm-citation citation-type="other"><person-group person-group-type="author"><name name-style="western"><surname>Grandini</surname><given-names>M</given-names> </name><name name-style="western"><surname>Bagli</surname><given-names>E</given-names> </name><name name-style="western"><surname>Visani</surname><given-names>G</given-names> </name></person-group><article-title>Metrics for multi-class classification: an overview</article-title><source>arXiv</source><comment>Preprint posted online on 2020</comment><pub-id pub-id-type="doi">10.48550/arXiv.2008.05756</pub-id></nlm-citation></ref><ref id="ref52"><label>52</label><nlm-citation citation-type="web"><source>Information about the current study</source><year>2024</year><access-date>2025-05-29</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.h.u-tokyo.ac.jp/patient/depts/taisha/pdf/pa_md_md_info-04.pdf">https://www.h.u-tokyo.ac.jp/patient/depts/taisha/pdf/pa_md_md_info-04.pdf</ext-link></comment></nlm-citation></ref><ref id="ref53"><label>53</label><nlm-citation citation-type="other"><person-group person-group-type="author"><name name-style="western"><surname>Dar</surname><given-names>G</given-names> </name><name name-style="western"><surname>Geva</surname><given-names>M</given-names> </name><name name-style="western"><surname>Gupta</surname><given-names>A</given-names> </name><name name-style="western"><surname>Berant</surname><given-names>J</given-names> </name></person-group><article-title>Analyzing transformers in embedding space</article-title><source>arXiv</source><comment>Preprint posted online on 2022</comment><pub-id pub-id-type="doi">10.48550/arXiv.2209.02535</pub-id></nlm-citation></ref><ref id="ref54"><label>54</label><nlm-citation citation-type="other"><person-group person-group-type="author"><name name-style="western"><surname>McInnes</surname><given-names>L</given-names> </name></person-group><article-title>Umap: uniform manifold approximation and projection for dimension reduction</article-title><source>arXiv</source><comment>Preprint posted online on 2018</comment><pub-id pub-id-type="doi">10.48550/arXiv.1802.03426</pub-id></nlm-citation></ref></ref-list><app-group><supplementary-material id="app1"><label>Multimedia Appendix 1</label><p>Characteristics of patients with diabetes included in the training and testing datasets. Characteristics are presented separately for the patient groups belonging to the different training datasets defined by period: 2 years (2020-2021), 5 years (2017-2021), 10 years (2012-2021) and the independent test dataset (data exclusively from 2022). Variables shown include patient counts, age, sex distribution, laboratory values, and prescription frequencies of 44 drugs.</p><media xlink:href="medinform_v13i1e67748_app1.docx" xlink:title="DOCX File, 54 KB"/></supplementary-material><supplementary-material id="app2"><label>Multimedia Appendix 2</label><p>Prediction performance for drugs when trained with various sizes of training data. The table shows results for the 44 prescribed drugs, showing a comparison of performance between specific drugs and the impact of the data period of the training data on the prediction accuracy of individual drugs.</p><media xlink:href="medinform_v13i1e67748_app2.docx" xlink:title="DOCX File, 36 KB"/></supplementary-material></app-group></back></article>