<?xml version="1.0" encoding="UTF-8"?><!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "journalpublishing.dtd"><article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" dtd-version="2.0" xml:lang="en" article-type="research-article"><front><journal-meta><journal-id journal-id-type="nlm-ta">JMIR Med Inform</journal-id><journal-id journal-id-type="publisher-id">medinform</journal-id><journal-id journal-id-type="index">7</journal-id><journal-title>JMIR Medical Informatics</journal-title><abbrev-journal-title>JMIR Med Inform</abbrev-journal-title><issn pub-type="epub">2291-9694</issn><publisher><publisher-name>JMIR Publications</publisher-name><publisher-loc>Toronto, Canada</publisher-loc></publisher></journal-meta><article-meta><article-id pub-id-type="publisher-id">v13i1e71539</article-id><article-id pub-id-type="doi">10.2196/71539</article-id><article-categories><subj-group subj-group-type="heading"><subject>Original Paper</subject></subj-group></article-categories><title-group><article-title>Interpretable Machine Learning for Predicting Adverse Pregnancy Outcomes in Gestational Diabetes: Retrospective Cohort Study</article-title></title-group><contrib-group><contrib contrib-type="author" equal-contrib="yes"><name name-style="western"><surname>Li</surname><given-names>Jiaxi</given-names></name><degrees>MD</degrees><xref ref-type="aff" rid="aff1">1</xref><xref ref-type="fn" rid="equal-contrib1">*</xref></contrib><contrib contrib-type="author" equal-contrib="yes"><name name-style="western"><surname>Liu</surname><given-names>Xiali</given-names></name><degrees>MD</degrees><xref ref-type="aff" rid="aff2">2</xref><xref ref-type="fn" rid="equal-contrib1">*</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>He</surname><given-names>Shenyang</given-names></name><degrees>MBBS</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author" corresp="yes" equal-contrib="yes"><name name-style="western"><surname>Ren</surname><given-names>Yan</given-names></name><degrees>MSc</degrees><xref ref-type="aff" rid="aff3">3</xref><xref ref-type="fn" rid="equal-contrib1">*</xref></contrib></contrib-group><aff id="aff1"><institution>Jinniu Maternity and Child Health Hospital of Chengdu</institution><addr-line>Chengdu</addr-line><country>China</country></aff><aff id="aff2"><institution>Department of Anesthesiology, West China Hospital, Sichuan University</institution><addr-line>Chengdu</addr-line><country>China</country></aff><aff id="aff3"><institution>Department of Endocrinology and Metabolism, Adrenal Center, West China Hospital of Sichuan University</institution><addr-line>Number 37 Guoxue Alley, Wuhou District</addr-line><addr-line>Chengdu</addr-line><country>China</country></aff><contrib-group><contrib contrib-type="editor"><name name-style="western"><surname>Benis</surname><given-names>Arriel</given-names></name></contrib></contrib-group><contrib-group><contrib contrib-type="reviewer"><name name-style="western"><surname>Darsareh</surname><given-names>Fatemeh</given-names></name></contrib><contrib contrib-type="reviewer"><name name-style="western"><surname>Khan</surname><given-names>Wasif</given-names></name></contrib></contrib-group><author-notes><corresp>Correspondence to Yan Ren, MSc, Department of Endocrinology and Metabolism, Adrenal Center, West China Hospital of Sichuan University, Number 37 Guoxue Alley, Wuhou District, Chengdu, 610041, China, 86 18227387870; <email>renyan922@163.com</email></corresp><fn fn-type="equal" id="equal-contrib1"><label>*</label><p>these authors contributed equally</p></fn></author-notes><pub-date pub-type="collection"><year>2025</year></pub-date><pub-date pub-type="epub"><day>16</day><month>9</month><year>2025</year></pub-date><volume>13</volume><elocation-id>e71539</elocation-id><history><date date-type="received"><day>21</day><month>01</month><year>2025</year></date><date date-type="rev-recd"><day>21</day><month>05</month><year>2025</year></date><date date-type="accepted"><day>21</day><month>05</month><year>2025</year></date></history><copyright-statement>&#x00A9; Jiaxi Li, Xiali Liu, Shenyang He, Yan Ren. Originally published in JMIR Medical Informatics (<ext-link ext-link-type="uri" xlink:href="https://medinform.jmir.org">https://medinform.jmir.org</ext-link>), 16.9.2025. </copyright-statement><copyright-year>2025</copyright-year><license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (<ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">https://creativecommons.org/licenses/by/4.0/</ext-link>), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Medical Informatics, is properly cited. The complete bibliographic information, a link to the original publication on <ext-link ext-link-type="uri" xlink:href="https://medinform.jmir.org/">https://medinform.jmir.org/</ext-link>, as well as this copyright and license information must be included.</p></license><self-uri xlink:type="simple" xlink:href="https://medinform.jmir.org/2025/1/e71539"/><abstract><sec><title>Background</title><p>Gestational diabetes mellitus (GDM) affects over 5% of pregnancies worldwide, elevating risks of type 2 diabetes post partum and complications such as fetal death, miscarriage, and congenital abnormalities. Effective GDM management is essential to balance glycemic control and pregnancy outcomes.</p></sec><sec><title>Objective</title><p>We aim to develop interpretable machine learning models using GDM datasets for predicting adverse pregnancy outcomes and identifying key factors through the Shapley additive explanations (SHAP) algorithm, thus supporting improved maternal and infant health.</p></sec><sec sec-type="methods"><title>Methods</title><p>Data preprocessing and feature selection were performed, with adaptive synthetic sampling used to address class imbalance. Classification models, including logistic regression, random forest, support vector machine, and extreme gradient boosting, were built and enhanced through the stacking method. Model interpretability was assessed with SHAP to quantify feature contributions.</p></sec><sec sec-type="results"><title>Results</title><p>Among 1670 patients, 200 experienced adverse outcomes. The stacking model outperformed individual models, achieving an accuracy of 85.6%, a sensitivity of 57.8%, a specificity of 95.9%, and an area under the receiver operating characteristic curve of 0.82 on the test set. External validation on 159 patients showed a decline in performance (accuracy 83.6%, area under the receiver operating characteristic curve 0.67). SHAP analysis identified gestational age, glucose control, and diagnosis time among the most influential predictors, providing clinically meaningful insights into risk factors. Additionally, detailed SHAP-based visualization revealed the distribution of different feature values and their nonlinear impact on outcomes, as well as interaction effects between features. These interpretable analyses enabled a deeper understanding of individual and combined feature contributions, thereby enhancing clinical assessment capabilities.</p></sec><sec sec-type="conclusions"><title>Conclusions</title><p>This study underscores the potential of machine learning in predicting adverse outcomes in GDM, with interpretable features offering valuable clinical insights to enhance pregnancy management and maternal-infant health.</p></sec></abstract><kwd-group><kwd>gestational diabetes mellitus</kwd><kwd>adverse pregnancy outcomes</kwd><kwd>interpretable model</kwd><kwd>machine learning</kwd><kwd>risk prediction</kwd><kwd>ensemble learning</kwd></kwd-group></article-meta></front><body><sec id="s1" sec-type="intro"><title>Introduction</title><p>Gestational diabetes mellitus (GDM) is a significant global health concern, affecting at least 5% of pregnancies worldwide [<xref ref-type="bibr" rid="ref1">1</xref>]. It is characterized by impaired glucose tolerance due to an increase in anti-insulin substances and decreased insulin sensitivity, leading to hyperglycemia and other metabolic disturbances [<xref ref-type="bibr" rid="ref2">2</xref>]. Women diagnosed with GDM not only face increased perinatal complications but are also at a significantly higher risk of developing type 2 diabetes mellitus postpartum [<xref ref-type="bibr" rid="ref3">3</xref>]. Moreover, in utero exposure to hyperglycemia has long-term implications for offspring, predisposing them to metabolic disorders, obesity, and cardiovascular diseases later in life.</p><p>Uncontrolled GDM significantly increases the risk of adverse pregnancy outcomes, including fetal macrosomia, preterm birth, neonatal hypoglycemia, and even perinatal mortality [<xref ref-type="bibr" rid="ref4">4</xref>,<xref ref-type="bibr" rid="ref5">5</xref>]. During early pregnancy, poor glycemic control may result in congenital malformations or spontaneous abortion, whereas in later stages, it can contribute to pre-eclampsia, respiratory distress syndrome, and hyperbilirubinemia [<xref ref-type="bibr" rid="ref6">6</xref>,<xref ref-type="bibr" rid="ref7">7</xref>]. Despite advancements in clinical management, the timely identification of high-risk pregnancies remains a challenge. Traditional risk assessment methods, such as clinical scoring systems and conventional regression models, often rely on predefined risk factors and fail to capture complex interactions within high-dimensional clinical data [<xref ref-type="bibr" rid="ref8">8</xref>]. This limitation highlights the need for more advanced predictive tools that can improve early risk stratification and optimize maternal and fetal outcomes.</p><p>Machine learning has emerged as a transformative approach in medical research, offering superior capabilities in analyzing complex, high-dimensional datasets [<xref ref-type="bibr" rid="ref9">9</xref>]. Machine learning models can effectively capture intricate patterns and nonlinear relationships in clinical data, surpassing traditional statistical approaches in predictive accuracy. In a retrospective analysis of 8888 deliveries, random forest classification achieved exceptional accuracy in predicting birth asphyxia, with critical risk factors including maternal hypertension, anemia, preterm birth, and noncephalic presentation [<xref ref-type="bibr" rid="ref10">10</xref>]. Similarly, deep learning showed superior predictive performance for intrauterine growth restriction in another study of 8888 pregnancies, identifying key risk factors such as maternal hypertension, drug addiction, and COVID-19 infection [<xref ref-type="bibr" rid="ref11">11</xref>]. Furthermore, in an analysis of 7166 pregnancies, random forest demonstrated optimal prediction of fetal heart, with significant predictors including primiparity, placental abruption, and male fetal sex [<xref ref-type="bibr" rid="ref12">12</xref>]. However, the use of machine learning models in predicting GDM-related adverse pregnancy outcomes remains relatively limited&#x2014;particularly in the field of interpretable machine learning. Most current studies focus on model predictive accuracy, lacking transparent analysis of feature variable impacts, which makes it difficult to provide clinically reliable risk factor assessments. This lack of interpretability limits the practical application and adoption of such models in real-world medical settings. Therefore, there is an urgent need to develop models that combine high predictive performance with clinical interpretability to identify key risk factors and assist physicians in formulating personalized intervention strategies.</p><p>To address this gap, this study aims to develop an interpretable machine learning model using a publicly available GDM dataset to predict the risk of adverse pregnancy outcomes associated with gestational diabetes. Unlike previous studies that primarily focus on GDM diagnosis, our approach emphasizes predicting maternal and fetal complications, which is crucial for timely intervention. Furthermore, we incorporate Shapley additive explanations (SHAP) analysis to enhance model interpretability, allowing clinicians to identify the most influential factors contributing to adverse pregnancy outcomes. By providing clinically actionable insights, our model aims to support personalized risk assessment and improve maternal and fetal health outcomes.</p></sec><sec id="s2" sec-type="methods"><title>Methods</title><sec id="s2-1"><title>Data</title><p>This study is based on the publicly available GDM dataset. We included pregnant women who met specific diagnostic criteria through the publicly available dataset [<xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref14">14</xref>]. The dataset comprises anonymized electronic health records extracted from the Cerner system at St Mary&#x2019;s Hospital in London, covering pregnancies monitored between April 2016 and November 2019. A total of 1854 records were initially retrieved, including clinical and demographic variables such as maternal age, BMI at booking, ethnicity, glucose tolerance test results (0- and 120-min post-75 g glucose load), mode of delivery, gestational age, neonatal birth weight, and stillbirth outcomes.</p><p>To ensure data quality and reliability, patients with missing values in key variables were excluded. Implausible outliers were identified and corrected when possible; otherwise, they were removed from the dataset. Unit inconsistencies were also standardized. These preprocessing steps were applied to ensure consistency, accuracy, and completeness of the data used for model development and analysis.</p></sec><sec id="s2-2"><title>Subject</title><p>To ensure the accuracy and reliability of this study&#x2019;s results, inclusion criteria (based on the results of the oral glucose tolerance test [OGTT]) were defined as follows: the blood glucose level of pregnant women should reach or exceed 7.8 mmol/L and not exceed 25 mmol/L at 2 hours after OGTT; or the blood glucose level should reach or exceed 5.6 mmol/L and not exceed 25 mmol/L at 10 minutes after OGTT [<xref ref-type="bibr" rid="ref15">15</xref>]. In addition, the study&#x2019;s definition of adverse pregnancy outcomes includes newborn birth weight below 2500 g, severe prematurity, stillbirth, and Apgar score below 4 [<xref ref-type="bibr" rid="ref16">16</xref>]. Additionally, we excluded cases with missing Apgar score data to avoid potential biases that could arise from inaccuracies in assessing pregnancy outcomes. By implementing these strict inclusion and exclusion criteria, we ensured the consistency of this study&#x2019;s population, allowing for a more accurate assessment of the impact of GDM on the health of pregnant women and their offspring.</p></sec><sec id="s2-3"><title>Data Preprocessing</title><p>In this study, we encountered issues with missing values for multiple features in the dataset. To maintain data integrity and the reliability of the analysis, we adopted a cautious approach to handle these missing values. Specifically, when the proportion of missing values for a particular feature exceeded 30%, such as &#x201C;previous obstetric history,&#x201D; &#x201C;presence of meconium,&#x201D; and &#x201C;O_Thyroid function blood,&#x201D; we chose to exclude them from the analysis. For the remaining missing values in the features, we implemented an imputation strategy to enhance the usability of the data.</p><p>In terms of the choice of imputation method, we adopted a differentiated approach based on the type of feature. For numerical features, we used the median or mean for imputation, a method that reduces the impact of extreme values while preserving the distribution characteristics of the data. For categorical features, we used the k-nearest neighbors algorithm for imputation, which estimates the possible values of missing data by finding similar observations based on distance metrics.</p><p>Additionally, some categorical features with sparse or heterogeneous classifications were restructured using domain knowledge to improve statistical interpretability. For instance, antenatal medical factors were originally recorded in 64 different categories. These were clinically reviewed and consolidated into 7 meaningful groups: (1) mental health and neurological disorders, (2) genetic disorders, (3) surgical or operative conditions, (4) infectious and immune-related diseases, (5) obesity-related conditions, (6) chronic diseases, and (7) none.</p><p>Finally, to further meet the requirements of machine learning models, we performed 1-hot encoding on all categorical variables. This helps to avoid potential numerical encoding biases and ensures the effectiveness of model training.</p></sec><sec id="s2-4"><title>Feature Selection</title><p>To mitigate the &#x201C;curse of dimensionality&#x201D; and enhance the practicality of model deployment in clinical settings, we removed redundant features. As shown in <xref ref-type="fig" rid="figure1">Figure 1</xref>, we used the Pearson correlation matrix to identify highly correlated variables. For continuous variables, feature selection was guided by the Pearson correlation coefficient. As the number of categorical variables was relatively small&#x2014;primarily including &#x201C;number of previous C-sections,&#x201D; &#x201C;obesity status,&#x201D; and &#x201C;antenatal medical factors&#x201D;&#x2014;all were retained in the model.</p><fig position="float" id="figure1"><label>Figure 1.</label><caption><p>Pearson correlation matrix of key features for redundancy analysis. IMD: Index of Multiple Deprivation.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="medinform_v13i1e71539_fig01.png"/></fig><p>During the analysis, we identified several pairs of features with relatively high Pearson correlation coefficients, including &#x201C;Index of Multiple Deprivation (IMD) decile&#x201D; and &#x201C;IMD rank,&#x201D; &#x201C;gestation (days)&#x201D; and &#x201C;gestation,&#x201D; as well as &#x201C;body mass index (BMI) at booking&#x201D; and &#x201C;weight measured.&#x201D; Both deprivation-related variables reflect the socioeconomic status of pregnant women; however, given the broader range of values for &#x201C;IMD decile&#x201D; (1012 to 32,742), we considered it more statistically informative and retained this feature.</p><p>Given the direct association between gestational age and adverse pregnancy outcomes, gestational variables were excluded from the model to prevent potential confounding. Likewise, fetal birth weight&#x2014;available only after delivery&#x2014;was excluded to avoid outcome leakage. We recalculated BMI based on height and weight, as it offers a more comprehensive measure of maternal body composition. Consequently, the original &#x201C;height&#x201D; and &#x201C;weight&#x201D; variables were removed due to redundancy. Additionally, although &#x201C;gestation (days),&#x201D; &#x201C;gestation,&#x201D; and &#x201C;Gravida&#x201D; are strongly associated with adverse outcomes such as preterm birth and miscarriage, including them posed a risk of information leakage. Based on both statistical reasoning and clinical expert input, these features were excluded.</p><p>Lastly, &#x201C;vitamin D level in blood&#x201D; was removed due to concerns over data quality and consistency. Vitamin D is not a routine prenatal test, and the lack of standardization in test timing introduced considerable variability, limiting its reliability as a predictive feature.</p></sec><sec id="s2-5"><title>Missing Data</title><p>The final dataset included 10 continuous variables such as pregnancy age, blood glucose levels, and blood pressure. The categorical variables include obesity status, number of previous C-sections, and antenatal medical factors. Several continuous variables had missing values, with the highest rates observed in blood glucose levels (up to 23.1%) and blood pressure measurements (<xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>).</p></sec><sec id="s2-6"><title>Model Construction</title><p>Based on our analysis results, we performed feature selection and data preprocessing and then constructed machine learning models. We used a variety of algorithms, including logistic regression, random forests, support vector machines (SVM), and extreme gradient boosting (XGBoost), to independently build classification prediction models. To further enhance the predictive power of the models, we used the Stacking ensemble learning method, taking the prediction results of these base models as input and training them with a meta-model (also known as a secondary model), thereby achieving superior overall predictive performance. In our study, we chose XGBoost as the meta-model. Considering that only 11.9% of the samples in the dataset manifested adverse pregnancy outcomes, indicating an imbalance in the dataset, we applied the adaptive synthetic sampling (ADASYN) algorithm to address this imbalance and improve the model&#x2019;s generalization ability.</p><p>ADASYN is a machine learning algorithm used to address class imbalance in classification problems [<xref ref-type="bibr" rid="ref17">17</xref>]. In imbalanced datasets, there is a large difference in the number of samples between different classes, which can result in poor classification performance of the model for minority classes. ADASYN balances the dataset by increasing the number of samples of the minority class, thus improving the model&#x2019;s performance. Considering the imbalance between the alive group and the expired group and the impact on the accuracy of the prediction results, we applied the ADASYN method to oversample the training set, while the test set maintained the original sample ratio. To further validate the model&#x2019;s robustness and performance in addressing class imbalance, we conducted supplementary experiments by introducing another widely used oversampling method&#x2014;SMOTE (Synthetic Minority Oversampling Technique) for comparison. SMOTE generates synthetic minority class samples through interpolation in the feature space and has been extensively applied in imbalanced classification tasks. Compared with ADASYN, it is more comprehensive to evaluate the impact of different oversampling strategies on model performance, ensuring the selected method exhibits stronger robustness and generalization capability in practical applications. The overall data was split into a training set and a test set in an 8:2 ratio. To fine-tune the hyperparameters of each algorithm, we used grid search based on 5-fold cross-validation within the training set. The hyperparameters adjusted for each algorithm are as follows (<xref ref-type="table" rid="table1">Table 1</xref>).</p><table-wrap id="t1" position="float"><label>Table 1.</label><caption><p>Hyperparameters adjusted for each algorithm.</p></caption><table id="table1" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Algorithm</td><td align="left" valign="bottom">Hyperparameters</td></tr></thead><tbody><tr><td align="left" valign="bottom">Random forest</td><td align="left" valign="bottom"><list list-type="bullet"><list-item><p>n_estimators: 10, 50, 100</p></list-item><list-item><p>max_features: auto, sqrt, log2</p></list-item><list-item><p>Bootstrap: true, false</p></list-item></list></td></tr><tr><td align="left" valign="top">Extreme Gradient Boosting</td><td align="left" valign="top"><list list-type="bullet"><list-item><p>n_estimators: 20, 50, 100</p></list-item><list-item><p>learning_rate: 0.1, 0.2, 0.3</p></list-item><list-item><p>max_depth: 4, 6, 8</p></list-item><list-item><p>objective: binary: logistic</p></list-item><list-item><p>subsample: 0.6, 0.8, 1</p></list-item></list></td></tr><tr><td align="left" valign="top">Logistic regression</td><td align="left" valign="top"><list list-type="bullet"><list-item><p>C: 0.001, 0.01, 0.1, 1, 10, 100, 1000</p></list-item><list-item><p>Penalty: L1, L2</p></list-item></list></td></tr><tr><td align="left" valign="top">Support vector machine</td><td align="left" valign="top"><list list-type="bullet"><list-item><p>C: 0.1, 1, 10, 100</p></list-item><list-item><p>Kernel: linear, rbf, poly</p></list-item><list-item><p>Gamma: scale, auto</p></list-item></list></td></tr></tbody></table></table-wrap><p>Based on the basic models obtained from training, we introduced the stacking strategy in our model fusion approach to more comprehensively explore the potential correlations between different basic models. We treated the outputs of each basic model as new features and further trained them using the XGBoost gradient boosting framework to construct a highly optimized stacking model with significant synergistic effects.</p><p>In clinical models, the interpretability of the model is crucial because it helps doctors and researchers understand the decision-making process of the model, thereby increasing trust in the model and promoting its application in clinical practice. SHAP is a popular machine learning interpretability tool that can quantify the contribution of each feature to the model&#x2019;s prediction. In our study, we used the SHAP algorithm to perform an interpretability analysis on the gestational diabetes risk prediction model to increase the model&#x2019;s transparency, helping doctors better understand the model&#x2019;s decision-making process and make appropriate interventions when necessary.</p></sec><sec id="s2-7"><title>Ethical Considerations</title><p>This study is based on the publicly available GDM dataset. We included pregnant women who met specific diagnostic criteria, as defined in the dataset documentation. All protected health information has been deidentified to ensure privacy. The dataset is accessible [<ext-link ext-link-type="uri" xlink:href="https://figshare.com/articles/dataset/GDM_Dataset_xlsx/21806472?file=38695140">14</ext-link>], and its use complies with the associated public license and terms of use. Therefore, ethical approval and individual patient consent were not required for this study.</p></sec></sec><sec id="s3" sec-type="results"><title>Results</title><sec id="s3-1"><title>Overview</title><p>A total of 1670 patients were selected from the GDM database for inclusion in this study. The data inclusion and exclusion diagram is shown in <xref ref-type="fig" rid="figure2">Figure 2</xref>. Among them, 200 patients had adverse pregnancy outcomes. Statistical analysis was conducted using SPSS (version 22.0; IBM Corp), while data cleaning, model construction, and performance evaluation were carried out using Python (Python Software Foundation). Continuous variables were expressed as median (IQR), while categorical data were presented as counts (percentages). The Mann-Whitney <italic>U</italic> test was used for analyzing continuous variables, and chi-square test was used to examine significant differences in categorical variables. The patient&#x2019;s baseline is presented in <xref ref-type="table" rid="table2">Table 2</xref>.</p><fig position="float" id="figure2"><label>Figure 2.</label><caption><p>Flowchart of data inclusion and exclusion criteria. GDM: gestational diabetes mellitus.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="medinform_v13i1e71539_fig02.png"/></fig><table-wrap id="t2" position="float"><label>Table 2.</label><caption><p>Comparison of maternal characteristics by outcome group. Statistical significance was defined as <italic>P</italic>&#x003C;.05.</p></caption><table id="table2" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Variable</td><td align="left" valign="bottom">HC<sup><xref ref-type="table-fn" rid="table2fn1">a</xref></sup></td><td align="left" valign="bottom">Adverse outcome</td><td align="left" valign="bottom"><italic>P</italic> value</td></tr></thead><tbody><tr><td align="left" valign="top">IMD<sup><xref ref-type="table-fn" rid="table2fn2">b</xref></sup> decile, median (IQR)</td><td align="left" valign="top">4.00 (3.00&#x2010;6.00)</td><td align="left" valign="top">4.00 (3.00&#x2010;6.00)</td><td align="left" valign="top">.25</td></tr><tr><td align="left" valign="top">Pregnancy age, median (IQR)</td><td align="left" valign="top">34.00 (30.00&#x2010;37.00)</td><td align="left" valign="top">35.00 (31.00&#x2010;38.00)</td><td align="left" valign="top">.04</td></tr><tr><td align="left" valign="top">Glucose level (blood), median (IQR)</td><td align="left" valign="top">4.70 (4.30&#x2010;5.30)</td><td align="left" valign="top">5.00 (4.45&#x2010;5.80)</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top">Glucose level (0 min), median (IQR)</td><td align="left" valign="top">4.60 (4.20&#x2010;5.20)</td><td align="left" valign="top">4.70 (4.30&#x2010;5.65)</td><td align="left" valign="top">.002</td></tr><tr><td align="left" valign="top">Glucose level (120 min), median (IQR)</td><td align="left" valign="top">8.40 (8.00&#x2010;9.10)</td><td align="left" valign="top">8.50 (8.00&#x2010;9.50)</td><td align="left" valign="top">.02</td></tr><tr><td align="left" valign="top">Systolic blood pressure, median (IQR)</td><td align="left" valign="top">111.00 (104.00&#x2010;120.00)</td><td align="left" valign="top">115.00 (107.00&#x2010;125.00)</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top">Diastolic blood pressure, median (IQR)</td><td align="left" valign="top">70.00 (63.00&#x2010;77.00)</td><td align="left" valign="top">72.00 (65.00&#x2010;79.25)</td><td align="left" valign="top">.01</td></tr><tr><td align="left" valign="top">Folic acid dose, median (IQR)</td><td align="left" valign="top">400.00 (0.00&#x2010;400.00)</td><td align="left" valign="top">400.00 (0.00&#x2010;400.00)</td><td align="left" valign="top">.81</td></tr><tr><td align="left" valign="top">Diagnosis time (weeks), median (IQR)</td><td align="left" valign="top">10.00 (10.00&#x2010;12.00)</td><td align="left" valign="top">10.00 (9.75&#x2010;12.00)</td><td align="left" valign="top">.82</td></tr><tr><td align="left" valign="top">BMI (kg/m&#x00B2;), median (IQR)</td><td align="left" valign="top">26.02 (22.81&#x2010;29.75)</td><td align="left" valign="top">26.51 (23.71&#x2010;30.05)</td><td align="left" valign="top">.02</td></tr><tr><td align="left" valign="top" colspan="3">Obese? n (%)</td><td align="left" valign="top">.30</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>No</td><td align="left" valign="top">908 (74.49)</td><td align="left" valign="top">324 (71.84)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Yes</td><td align="left" valign="top">311 (25.51)</td><td align="left" valign="top">127 (28.16)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top" colspan="3">No_of_previous_csections, n (%)</td><td align="left" valign="top">.69</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>0</td><td align="left" valign="top">1003 (82.28)</td><td align="left" valign="top">369 (81.82)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>1</td><td align="left" valign="top">187 (15.34)</td><td align="left" valign="top">72 (15.96)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>2</td><td align="left" valign="top">26 (2.13)</td><td align="left" valign="top">7 (1.55)</td><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content></td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>3</td><td align="left" valign="top">2 (0.16)</td><td align="left" valign="top">2 (0.44)</td><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content></td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>4</td><td align="left" valign="top">1 (0.08)</td><td align="left" valign="top">1 (0.22)</td><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content></td></tr><tr><td align="left" valign="top" colspan="3">Antenatal medical factors, n (%)</td><td align="left" valign="top">.10</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Chronic diseases</td><td align="left" valign="top">117 (9.60)</td><td align="left" valign="top">50 (11.09)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Genetic disorders</td><td align="left" valign="top">5 (0.41)</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content></td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Infectious and immune-related diseases</td><td align="left" valign="top">27 (2.21)</td><td align="left" valign="top">12 (2.66)</td><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content></td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Mental health and neurological disorders</td><td align="left" valign="top">47 (3.86)</td><td align="left" valign="top">30 (6.65)</td><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content></td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Obesity-related conditions</td><td align="left" valign="top">2 (0.16)</td><td align="left" valign="top">2 (0.44)</td><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content></td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Surgical or operative conditions</td><td align="left" valign="top">110 (9.02)</td><td align="left" valign="top">43 (9.53)</td><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content></td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>None</td><td align="left" valign="top">911 (74.73)</td><td align="left" valign="top">314 (69.62)</td><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content></td></tr></tbody></table><table-wrap-foot><fn id="table2fn1"><p><sup>a</sup>HC: healthy control.</p></fn><fn id="table2fn2"><p><sup>b</sup>IMD: Index of Multiple Deprivation.</p></fn></table-wrap-foot></table-wrap><p>In this study, we evaluated 5 different machine learning models: random forest, XGBoost, logistic regression, SVM, and a stacking ensemble model. To address class imbalance in the training data, we applied oversampling techniques such as ADASYN before model training. However, to preserve the clinical authenticity and real-world applicability of the evaluation, no oversampling was applied to the test set. A comprehensive evaluation was conducted using multiple performance metrics, including sensitivity, specificity, positive predictive value (PPV), negative predictive value (NPV), positive likelihood ratio (PLR), negative likelihood ratio (NLR), and overall accuracy. The results obtained on the test set are summarized in <xref ref-type="table" rid="table3">Table 3</xref> below.</p><table-wrap id="t3" position="float"><label>Table 3.</label><caption><p>Comparative performance metrics of machine learning models for predicting GDM<sup><xref ref-type="table-fn" rid="table3fn1">a</xref></sup>-related adverse outcomes.</p></caption><table id="table3" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Model</td><td align="left" valign="bottom">SEN<sup><xref ref-type="table-fn" rid="table3fn2">b</xref></sup></td><td align="left" valign="bottom">SPE<sup><xref ref-type="table-fn" rid="table3fn3">c</xref></sup></td><td align="left" valign="bottom">PPV<sup><xref ref-type="table-fn" rid="table3fn4">d</xref></sup></td><td align="left" valign="bottom">NPV<sup><xref ref-type="table-fn" rid="table3fn5">e</xref></sup></td><td align="left" valign="bottom">PLR<sup><xref ref-type="table-fn" rid="table3fn6">f</xref></sup></td><td align="left" valign="bottom">NLR<sup><xref ref-type="table-fn" rid="table3fn7">g</xref></sup></td><td align="left" valign="bottom">Accuracy</td><td align="left" valign="bottom"><italic>F</italic><sub>1</sub>-score</td></tr></thead><tbody><tr><td align="left" valign="top">Random forest</td><td align="left" valign="top">0.600</td><td align="left" valign="top">0.926</td><td align="left" valign="top">0.750</td><td align="left" valign="top">0.863</td><td align="left" valign="top">8.133</td><td align="left" valign="top">0.432</td><td align="left" valign="top">0.838</td><td align="left" valign="top">0.667</td></tr><tr><td align="left" valign="top">XGBoost<sup><xref ref-type="table-fn" rid="table3fn8">h</xref></sup></td><td align="left" valign="top">0.567</td><td align="left" valign="top">0.955</td><td align="left" valign="top">0.823</td><td align="left" valign="top">0.857</td><td align="left" valign="top">12.570</td><td align="left" valign="top">0.454</td><td align="left" valign="top">0.850</td><td align="left" valign="top">0.671</td></tr><tr><td align="left" valign="top">Logistic regression</td><td align="left" valign="top">0.478</td><td align="left" valign="top">0.721</td><td align="left" valign="top">0.387</td><td align="left" valign="top">0.789</td><td align="left" valign="top">1.714</td><td align="left" valign="top">0.724</td><td align="left" valign="top">0.656</td><td align="left" valign="top">0.428</td></tr><tr><td align="left" valign="top">SVM<sup><xref ref-type="table-fn" rid="table3fn9">i</xref></sup></td><td align="left" valign="top">0.633</td><td align="left" valign="top">0.828</td><td align="left" valign="top">0.576</td><td align="left" valign="top">0.860</td><td align="left" valign="top">3.679</td><td align="left" valign="top">0.443</td><td align="left" valign="top">0.775</td><td align="left" valign="top">0.603</td></tr><tr><td align="left" valign="top">Stacking</td><td align="left" valign="top">0.578</td><td align="left" valign="top">0.959</td><td align="left" valign="top">0.839</td><td align="left" valign="top">0.860</td><td align="left" valign="top">14.098</td><td align="left" valign="top">0.440</td><td align="left" valign="top">0.856</td><td align="left" valign="top">0.684</td></tr></tbody></table><table-wrap-foot><fn id="table3fn1"><p><sup>a</sup>GDM: gestational diabetes mellitus.</p></fn><fn id="table3fn2"><p><sup>b</sup>SEN: sensitivity.</p></fn><fn id="table3fn3"><p><sup>c</sup>SPE: specificity.</p></fn><fn id="table3fn4"><p><sup>d</sup>PPV: positive predictive value.</p></fn><fn id="table3fn5"><p><sup>e</sup>NPV: negative predictive value.</p></fn><fn id="table3fn6"><p><sup>f</sup>PLR: positive likelihood ratio.</p></fn><fn id="table3fn7"><p><sup>g</sup>NLR: negative likelihood ratio.</p></fn><fn id="table3fn8"><p><sup>h</sup>XGBoost: extreme gradient boosting.</p></fn><fn id="table3fn9"><p><sup>i</sup>SVM: support vector machine.</p></fn></table-wrap-foot></table-wrap><p>The results showed that the stacking model outperformed the individual models across several key metrics. Through cross-validation, we evaluated accuracy, recall, precision, and <italic>F</italic><sub>1</sub>-score. The results indicated that the stacking model excelled in specificity (0.959), PPV (0.839), and PLR (14.098). Its sensitivity (0.578) and NPV (0.860) were also strong, with a low NLR (0.440) and an overall accuracy of 0.856, demonstrating the effectiveness of the model fusion approach.</p><p>A total of 334 samples were contained in the test set, including 90 cases with adverse pregnancy outcomes (positive class) and 244 cases with favorable outcomes (negative class). The positive-to-negative ratio is approximately 1:2.7, indicating a moderately imbalanced distribution. Based on this dataset, the model demonstrated a satisfactory performance in identifying adverse outcomes, achieving an area under the receiver operating characteristic curve of 0.82. This suggests that the model exhibits high overall discriminative ability and can effectively differentiate individuals with distinct pregnancy outcomes. The receiver operating characteristic curve and confusion matrix for the stacking model are presented in <xref ref-type="fig" rid="figure3">Figure 3</xref>.</p><fig position="float" id="figure3"><label>Figure 3.</label><caption><p>ROC curve and confusion matrix of the stacking model for predicting GDM-related adverse outcomes. AUC: area under the curve; GDM: gestational diabetes mellitus; HC: healthy control; ROC: receiver operating characteristic.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="medinform_v13i1e71539_fig03.png"/></fig><p>To further investigate the effect of different oversampling techniques on model performance, we conducted a comparative experiment using both ADASYN and SMOTE, focusing on the stacking model, which showed the best overall performance in our main evaluation. The results are presented in <xref ref-type="table" rid="table4">Table 4</xref>.</p><table-wrap id="t4" position="float"><label>Table 4.</label><caption><p>Performance comparison of ADASYN<sup><xref ref-type="table-fn" rid="table4fn1">a</xref></sup> and SMOTE<sup><xref ref-type="table-fn" rid="table4fn2">b</xref></sup>.</p></caption><table id="table4" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Oversampling method</td><td align="left" valign="bottom">SEN<sup><xref ref-type="table-fn" rid="table4fn3">c</xref></sup></td><td align="left" valign="bottom">SPE<sup><xref ref-type="table-fn" rid="table4fn4">d</xref></sup></td><td align="left" valign="bottom">PPV<sup><xref ref-type="table-fn" rid="table4fn5">e</xref></sup></td><td align="left" valign="bottom">NPV<sup><xref ref-type="table-fn" rid="table4fn6">f</xref></sup></td><td align="left" valign="bottom">PLR<sup><xref ref-type="table-fn" rid="table4fn7">g</xref></sup></td><td align="left" valign="bottom">NLR<sup><xref ref-type="table-fn" rid="table4fn8">h</xref></sup></td><td align="left" valign="bottom">Accuracy</td><td align="left" valign="bottom"><italic>F</italic><sub>1</sub>-score</td></tr></thead><tbody><tr><td align="left" valign="top">ADASYN (stacking)</td><td align="left" valign="top">0.578</td><td align="left" valign="top">0.959</td><td align="left" valign="top">0.839</td><td align="left" valign="top">0.860</td><td align="left" valign="top">14.098</td><td align="left" valign="top">0.440</td><td align="left" valign="top">0.856</td><td align="left" valign="top">0.684</td></tr><tr><td align="left" valign="top">SMOTE (stacking)</td><td align="left" valign="top">0.266</td><td align="left" valign="top">0.910</td><td align="left" valign="top">0.477</td><td align="left" valign="top">0.800</td><td align="left" valign="top">2.947</td><td align="left" valign="top">0.807</td><td align="left" valign="top">0.728</td><td align="left" valign="top">0.341</td></tr><tr><td align="left" valign="top">/</td><td align="left" valign="top">0.658</td><td align="left" valign="top">0.506</td><td align="left" valign="top">0.292</td><td align="left" valign="top">0.827</td><td align="left" valign="top">1.332</td><td align="left" valign="top">0.676</td><td align="left" valign="top">0.542</td><td align="left" valign="top">0.405</td></tr></tbody></table><table-wrap-foot><fn id="table4fn1"><p><sup>a</sup>ADASYN: adaptive synthetic sampling.</p></fn><fn id="table4fn2"><p><sup>b</sup>SMOTE: Synthetic Minority Oversampling Technique.</p></fn><fn id="table4fn3"><p><sup>c</sup>SEN: sensitivity.</p></fn><fn id="table4fn4"><p><sup>d</sup>SPE: specificity.</p></fn><fn id="table4fn5"><p><sup>e</sup>PPV: positive predictive value.</p></fn><fn id="table4fn6"><p><sup>f</sup>NPV: negative predictive value.</p></fn><fn id="table4fn7"><p><sup>g</sup>PLR: positive likelihood ratio.</p></fn><fn id="table4fn8"><p><sup>h</sup>NLR: negative likelihood ratio.</p></fn></table-wrap-foot></table-wrap><p>As shown, the stacking model trained with ADASYN achieved superior performance across most metrics, particularly in terms of sensitivity (0.578), PPV (0.839), and <italic>F</italic><sub>1</sub>-score (0.684), suggesting better identification of high-risk cases and overall balance between precision and recall. In contrast, the model trained with SMOTE exhibited a much lower sensitivity (0.266) and <italic>F</italic><sub>1</sub>-score (0.341), indicating its limited ability to correctly identify minority class samples in this setting. We also report the performance of the stacking model trained without any oversampling as a reference, which demonstrated relatively higher sensitivity (0.658) but at the cost of much lower precision (PPV 0.292) and specificity (0.506), further confirming the advantage of using ADASYN in managing class imbalance.</p><p>Additionally, by using the SHAP algorithm, we conducted an in-depth analysis of the model&#x2019;s interpretability. The SHAP values revealed that clinical characteristics significantly impact the prediction of gestational diabetes risk, with specific results as follows. Through the calculation and analysis of SHAP values, we were able to uncover the contribution of each feature to the GDM outcome, thereby gaining a more comprehensive understanding of the risk factors for GDM. This interpretable analysis not only aids in validating the robustness of the model but also provides valuable references for subsequent clinical decision-making. Based on the SHAP algorithm, we were able to perform precise visual analyses for individual patients, as shown in <xref ref-type="fig" rid="figure4">Figure 4</xref>, which includes a global summary of feature importance across all patients (<xref ref-type="fig" rid="figure5">Figure 5A</xref>) and a local explanation for an individual prediction (<xref ref-type="fig" rid="figure5">Figure 5B</xref>).</p><fig position="float" id="figure4"><label>Figure 4.</label><caption><p>SHAP-based visualization of a machine learning model for predicting adverse pregnancy outcomes in patients with GDM. (A) Summary plot of SHAP values for all features, showing their impact and direction of effect on model output across all patients. (B) Local explanation for a single GDM case, highlighting how individual features contributed to the prediction. GDM: gestational diabetes mellitus; IMD: Index of Multiple Deprivation; SHAP: Shapley additive explanations.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="medinform_v13i1e71539_fig04.png"/></fig><fig position="float" id="figure5"><label>Figure 5.</label><caption><p>SHAP-based interpretation of feature effects and interactions in the prediction model. GDM: gestational diabetes mellitus; IMD: Index of Multiple Deprivation; SHAP: Shapley additive explanations.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="medinform_v13i1e71539_fig05.png"/></fig><p>For each feature, we used the shape function to display the distribution of its different values and their impact on the outcome. The influence of individual features was shown in <xref ref-type="fig" rid="figure5">Figure 5A</xref>, which demonstrates the specific impact of changes in a single variable&#x2019;s values on the model&#x2019;s predicted risk, revealing nonlinear relationships. Additionally, we used visualization techniques to illustrate the interaction values between different features, as shown in <xref ref-type="fig" rid="figure5">Figure 5B</xref>. These analyses will enhance our ability to conduct clinical assessments more effectively.</p><p>We further conducted feature interaction analysis to explore the contribution of different feature combinations in predicting adverse pregnancy outcomes in GDM. As shown in <xref ref-type="fig" rid="figure5">Figure 5C</xref>, the plot illustrates the overall importance of each feature in the model and its direction of influence, with each dot representing the SHAP value of an individual patient. The features are ranked by their mean absolute SHAP values, reflecting their average impact magnitude on the model&#x2019;s output. These results also highlight the significance of key variables and their interactions in clinical risk prediction.</p></sec><sec id="s3-2"><title>External Validation</title><p>Based on the integrated model we ultimately obtained, we collected data from some patients with GDM at Jinniu Maternal and Child Health Hospital (from January 2021 to March 2024) through telephone follow-up, focusing on collecting data from patients with adverse pregnancy outcomes. Due to issues such as patient cooperation and the tightness of related human resources, the number of external validation data is relatively small (159 cases, with a positive to negative ratio of 27:132). We used the stacking model for validation, which had a final accuracy of 0.836 and an area under the receiver operating characteristic curve value of 0.669, showing a significant decline compared to the test set. The results are shown in <xref ref-type="supplementary-material" rid="app2">Multimedia Appendix 2</xref>.</p></sec></sec><sec id="s4" sec-type="discussion"><title>Discussion</title><sec id="s4-1"><title>Principal Findings</title><p>According to the latest Global Diabetes Atlas (9th edition) published by the International Diabetes Federation, the number of patients with GDM worldwide is increasing, with approximately 20.4 (15.8%) million women enduring hyperglycemia; among them, around 17.1 (83.6%) million cases are due to GDM [<xref ref-type="bibr" rid="ref18">18</xref>]. Pregnant women affected by GDM face an elevated risk of adverse pregnancy outcomes, which can pose significant threats to both the mother and the infant. Therefore, predicting adverse pregnancy outcomes in the early stages of pregnancy and providing timely feedback and effective clinical management are particularly important.</p><p>The traditional scoring criteria for adverse pregnancy outcomes currently used in clinical practice, such as the IADPSG (International Association of Diabetes and Pregnancy Study Groups) and the NICE (National Institute for Health and Care Excellence) Diagnostic Criteria, exhibit varying levels of predictive efficacy and are prone to regional biases, making it difficult to achieve a consensus on predictive outcomes [<xref ref-type="bibr" rid="ref19">19</xref>,<xref ref-type="bibr" rid="ref20">20</xref>]. Additionally, individual differences, such as physiological variations, hormonal changes, genetics, and dietary structures, also affect the estimated prevalence rates of GDM. However, current clinical strategies for gestational diabetes typically use a one-size-fits-all approach to blood glucose management. Therefore, more comprehensive regular monitoring and earlier preventive and intervention measures should be implemented to reduce the potential for adverse outcomes.</p><p>In this study, we compared 5 machine learning models, random forest, XGBoost, logistic regression, SVM, and stacking, to assess their performance in predicting outcomes related to GDM. The results indicated that the stacking model outperformed the other models across multiple key performance metrics, particularly excelling in specificity (0.959), PPV (0.839), and PLR (14.098). Additionally, the stacking model demonstrated good performance in sensitivity (0.578) and NPV (0.860), with a low NLR (0.44) and overall accuracy (0.856), further proving the significant advantage of model ensemble methods in enhancing predictive performance. The receiver operating characteristic curve and confusion matrix analysis also supported this conclusion, emphasizing the effectiveness of the stacking model in predicting adverse pregnancy outcomes in GDM. However, during external validation, when using domestic patient data, the model&#x2019;s performance significantly declined. This phenomenon may be related to the inconsistent distribution of dataset characteristics, such as differences in demographic characteristics, lifestyle habits, and medical environments between domestic and international datasets. These differences may lead to poor model adaptation when facing new data distributions. Future research should further explore the performance of these models on larger and more diverse datasets to verify their generalization and stability. At the same time, it is recommended to integrate clinical context by introducing more features related to gestational diabetes for analysis, such as real-time vital signs of pregnant women, genetic phenotypes, and other relevant indicators, to enhance the model&#x2019;s predictive power and clinical application value.</p><p>SHAP helps clinicians understand and interpret complex machine learning models. We noticed that adverse pregnancy outcomes have a significant association with gestational age. Previous studies have shown that adverse pregnancy outcomes are directly related to blood glucose control during the perinatal period of gestational diabetes [<xref ref-type="bibr" rid="ref21">21</xref>]. Our results indicate that gestational diabetes with a shorter duration during pregnancy is associated with poorer pregnancy outcomes, which may be related to the early detection of hyperglycemia leading to preterm birth. Therefore, these findings serve as an important alert for clinical practice, suggesting that blood glucose monitoring should be initiated earlier in pregnancy, considering the patient&#x2019;s condition, to conduct earlier glucose monitoring for different individuals. Current clinical guidelines recommend screening for gestational diabetes between 24 and 28 weeks of pregnancy, and screening for and treating gestational diabetes during this period can significantly reduce the risk of adverse pregnancy outcomes [<xref ref-type="bibr" rid="ref4">4</xref>,<xref ref-type="bibr" rid="ref22">22</xref>]. Meanwhile, a large cohort study found that women diagnosed with GDM before 12 weeks of pregnancy had worse pregnancy outcomes compared to those diagnosed between 24&#x2010;28 weeks [<xref ref-type="bibr" rid="ref23">23</xref>]; the research by Mustafa et al [<xref ref-type="bibr" rid="ref7">7</xref>] also found that women with early onset (&#x003C;24 weeks) GDM had higher BMI, significantly increased demand for insulin, and more adverse pregnancy outcomes. Therefore, in addition to recommending universal screening at 24&#x2010;28 weeks, identifying and treating GDM at an earlier stage could reduce the potential perinatal or long-term adverse effects on the mother and the offspring. These findings emphasize the importance of identifying GDM earlier than current practices and exploring other interventions that might improve outcomes beyond blood glucose control.</p><p>Pregnant women with GDM experience insulin resistance, as previously reported in studies, which is associated with preterm birth, and preterm newborns are at a higher risk of being admitted to the neonatal intensive care unit or special care baby unit [<xref ref-type="bibr" rid="ref24">24</xref>]. Due to pregnant women with high blood glucose levels, adverse pregnancy outcomes such as preterm birth, large-for-gestational-age infants, and neonatal hypoglycemia often require care in a neonatal intensive care unit. Excess glucose in the mother&#x2019;s circulation is transferred across the placenta to provide the fetus with energy substrates. The fetus&#x2019;s response to the excess substrates is to produce more insulin, leading to fetal hyperinsulinemia, which can result in a series of consequences, particularly rapid fetal growth [<xref ref-type="bibr" rid="ref25">25</xref>]. In pregnancies with GDM, fetal insulin binds to insulin-like growth factor 1 receptors, exerting growth hormone-like effects and serving as a key factor in promoting fetal growth [<xref ref-type="bibr" rid="ref26">26</xref>]. It is common for children born to women with GDM to be large at birth. Extensive research on this population has shown that the increased birth weight of large-for-gestational-age infants is due to an increase in fat mass, not muscle mass [<xref ref-type="bibr" rid="ref27">27</xref>,<xref ref-type="bibr" rid="ref28">28</xref>]. The impact of GDM on both mother and infant does not end at delivery. Newborns admitted to the neonatal intensive care unit or special care baby unit due to maternal gestational diabetes are often seen with neonatal hypoglycemia, which may occur in 10% of healthy term infants, mainly within the first 24 to 48 hours after birth [<xref ref-type="bibr" rid="ref29">29</xref>]. The high glucose consumption of the brain, coupled with the increased ratio of brain to body mass in newborns compared to adults, increases the demand for glucose in newborns and may expose them to the risk of neurological damage and adverse outcomes.</p><p>Pregnancy hypertension is a common complication of pregnancy and a leading cause of morbidity and mortality in pregnant women and newborns, accounting for about 14% of maternal deaths worldwide [<xref ref-type="bibr" rid="ref30">30</xref>,<xref ref-type="bibr" rid="ref31">31</xref>]. Both pregnancy-induced hypertension and pre-eclampsia are associated with adverse maternal and fetal outcomes, including an increased risk of future maternal cardiovascular diseases, and there is approximately a 17% chance of pregnancy-induced hypertension progressing to pre-eclampsia [<xref ref-type="bibr" rid="ref32">32</xref>]. As many women are asymptomatic at the time of diagnosis, those who do not receive prenatal care may present with more advanced hypertension-related diseases, such as eclampsia, which is associated with higher risks of morbidity and mortality [<xref ref-type="bibr" rid="ref33">33</xref>]. In correlation analyses, GDM is accompanied by increased blood pressure in late pregnancy. GDM is a known risk factor for stillbirth, fetal macrosomia, fetal structural abnormalities, preterm birth, and pregnancy-induced hypertension diseases. GDM is characterized by significantly increased concentrations of inflammatory molecules and the imbalanced expression of genes encoding inflammatory mediators in the placenta, which together lead to the disruption of vascular, metabolic, and inflammatory processes. Over time, this state of hyperglycemia may be associated with the occurrence of pregnancy-induced hypertension diseases and their related complexities. Additionally, diabetes and hypertension often coexist, sharing various risk factors and disease etiologies, including genetics, obesity, insulin resistance, and inflammation [<xref ref-type="bibr" rid="ref34">34</xref>]. Therefore, the management of GDM should not only focus on blood glucose control but also consider the potential risks associated with pregnancy-induced hypertension diseases. In GDM, oxidative stress plays a role in the pathogenesis of the disease, as excessive secretion of insulin during pregnancy leads to the production of lipid peroxidation factors, which also mask the secretion of antioxidants, making reactive oxygen species abundant at the cellular level. In pre-eclampsia and gestational hypertension, oxidative stress leads to inadequate placental perfusion, resulting in a hypoxic placenta, which generally triggers a systemic maternal inflammatory response [<xref ref-type="bibr" rid="ref35">35</xref>-<xref ref-type="bibr" rid="ref37">37</xref>].</p><p>The adverse pregnancy risks associated with GDM are determined by the complex interplay of multiple biomedical, behavioral, and environmental factors&#x201A; rather than a single factor. Therefore, to investigate the contribution of feature interaction to the prognostic risks of GDM, we conducted multifeature interaction analyses. The feature interaction matrix clearly shows that blood glucose levels and time of diagnosis exhibit the highest degree of aggregation, followed by blood pressure. Additionally, gestational age and antenatal medical factors also demonstrate relatively strong clustering patterns. As previously discussed, individualized diagnosis and treatment should be tailored to different individuals. For those with a genetic predisposition to diabetes, earlier diagnosis during pregnancy should be implemented to achieve more timely blood glucose control. Hypertensive disorders in pregnancy and GDM are among the most common metabolic complications during gestation, with prevalence rates having risen significantly over the past decade, now affecting approximately 12%&#x2010;18% of all pregnancies [<xref ref-type="bibr" rid="ref38">38</xref>]. Pregnant women with hyperglycemia generally exhibit a higher overall incidence of requiring insulin therapy, which increases with maternal age, and women over 35 years old have a significantly higher probability of undergoing cesarean delivery [<xref ref-type="bibr" rid="ref39">39</xref>]. Genes are the most important factor in Antenatal Medical Factors. More recent genome-wide association studies focusing on maternal metabolism during pregnancy have revealed overlaps between genes associated with metabolic traits in pregnant and nonpregnant populations, as well as some genes that appear to be uniquely relevant during gestation. Additionally, reduced gene expression has been observed in transcription factors involved in lipid metabolism, such as LXRa, PPARa, PPARd, PPARg, RXRa, and SREBP1c. These findings indicate the importance of maternal oversupply of substrates in determining neonatal fat accumulation in pregnancies complicated by obesity and GDM [<xref ref-type="bibr" rid="ref40">40</xref>].</p></sec><sec id="s4-2"><title>Limitations</title><p>This study has several limitations. As a single-center retrospective study with a relatively small sample size, the generalizability of the findings may be limited. Although multiple machine learning models were used, the features were primarily derived from structured clinical data, lacking unstructured information such as imaging findings and physician notes. And the external validation dataset also limited our research; the model&#x2019;s performance notably declined on domestic datasets, suggesting potential overfitting or insufficient adaptability to different populations. Although we use SHAP for interpretability analysis, the model&#x2019;s clinical transparency remains constrained due to the complex and nonlinear relationships between features and outcomes, which may affect the interpretability of clinical decision-making.</p></sec><sec id="s4-3"><title>Conclusion</title><p>In conclusion, our study highlights the growing prevalence of GDM and its significant association with adverse pregnancy outcomes, including preterm birth, large-for-gestational-age infants, and neonatal hypoglycemia. Through the evaluation of 5 machine learning models, we found that the stacking model exhibited superior performance in predicting adverse outcomes, demonstrating the potential of machine learning to enhance clinical decision-making in managing GDM. The findings emphasize the importance of early identification and personalized management of GDM to mitigate the risks to both mother and infant. Moreover, incorporating additional clinical features, such as real-time maternal vital signs and genetic phenotypes, may further enhance the predictive accuracy and clinical applicability of these models. Future studies should aim to validate these findings across more diverse datasets to ensure the generalizability and robustness of the models, paving the way for more precise and effective interventions in GDM management.</p></sec></sec></body><back><ack><p>We are grateful to the staff in our research groups involved in this study for their valuable contributions and discussions. This work was supported by the Chengdu Medical Research Project (project 2022-387).</p></ack><notes><sec><title>Data Availability</title><p>The datasets generated or analyzed during this study are available in the figshare repository [<xref ref-type="bibr" rid="ref14">14</xref>]. Access to the related code is available from the corresponding author on reasonable request.</p></sec></notes><fn-group><fn fn-type="con"><p>JL conceptualized and designed this study, performed the research, delivered the model analysis, analyzed the data, and wrote this paper. XL and JL delivered the data analysis and clinical analysis. SH contributed to the research execution and data analysis, and provided critical insights for model interpretation. YR conceptualized and designed this study. All authors contributed to editorial changes in this paper, read and approved this final paper, and have participated sufficiently in this work to take responsibility for all aspects of this work.</p></fn><fn fn-type="conflict"><p>None declared.</p></fn></fn-group><glossary><title>Abbreviations</title><def-list><def-item><term id="abb1">ADASYN </term><def><p>adaptive synthetic sampling</p></def></def-item><def-item><term id="abb2">GDM</term><def><p>gestational diabetes mellitus</p></def></def-item><def-item><term id="abb3">IADPSG</term><def><p>International Association of Diabetes and Pregnancy Study Groups</p></def></def-item><def-item><term id="abb4">IMD</term><def><p>Index of Multiple Deprivation</p></def></def-item><def-item><term id="abb5">NICE</term><def><p>National Institute for Health and Care Excellence</p></def></def-item><def-item><term id="abb6">NLR</term><def><p>negative likelihood ratio</p></def></def-item><def-item><term id="abb7">NPV</term><def><p>negative predictive value</p></def></def-item><def-item><term id="abb8">OGTT</term><def><p>oral glucose tolerance test</p></def></def-item><def-item><term id="abb9">PLR</term><def><p>positive likelihood ratio</p></def></def-item><def-item><term id="abb10">PPV</term><def><p>positive predictive value</p></def></def-item><def-item><term id="abb11">SHAP</term><def><p>Shapley additive explanation</p></def></def-item><def-item><term id="abb12">SMOTE</term><def><p>Synthetic Minority Oversampling Technique</p></def></def-item><def-item><term id="abb13">SVM</term><def><p>support vector machine</p></def></def-item><def-item><term id="abb14">XGBoost</term><def><p>extreme gradient boosting</p></def></def-item></def-list></glossary><ref-list><title>References</title><ref id="ref1"><label>1</label><nlm-citation citation-type="book"><person-group person-group-type="author"><name name-style="western"><surname>Rodriguez</surname><given-names>BSQ</given-names> </name><name name-style="western"><surname>Vadakekut</surname><given-names>ES</given-names> </name><name name-style="western"><surname>Mahdy</surname><given-names>H</given-names> </name></person-group><source>Gestational Diabetes</source><year>2023</year><access-date>2025-07-17</access-date><publisher-name>StatPearls</publisher-name><comment><ext-link ext-link-type="uri" xlink:href="https://www.ncbi.nlm.nih.gov/books/NBK545196/">https://www.ncbi.nlm.nih.gov/books/NBK545196/</ext-link></comment></nlm-citation></ref><ref id="ref2"><label>2</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kampmann</surname><given-names>U</given-names> </name><name name-style="western"><surname>Knorr</surname><given-names>S</given-names> </name><name name-style="western"><surname>Fuglsang</surname><given-names>J</given-names> </name><name name-style="western"><surname>Ovesen</surname><given-names>P</given-names> </name></person-group><article-title>Determinants of maternal insulin resistance during pregnancy: an updated overview</article-title><source>J Diabetes Res</source><year>2019</year><volume>2019</volume><fpage>5320156</fpage><pub-id pub-id-type="doi">10.1155/2019/5320156</pub-id><pub-id pub-id-type="medline">31828161</pub-id></nlm-citation></ref><ref id="ref3"><label>3</label><nlm-citation citation-type="book"><person-group person-group-type="author"><name name-style="western"><surname>Magliano</surname><given-names>DJ</given-names> </name><name name-style="western"><surname>Boyko</surname><given-names>EJ</given-names> </name><collab>IDF Diabetes Atlas 10th Edition Scientific Committee</collab></person-group><source>IDF Diabetes Atlas</source><year>2021</year><edition>10</edition><publisher-name>International Diabetes Federation</publisher-name><pub-id pub-id-type="medline">35914061</pub-id></nlm-citation></ref><ref id="ref4"><label>4</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Malaza</surname><given-names>N</given-names> </name><name name-style="western"><surname>Masete</surname><given-names>M</given-names> </name><name name-style="western"><surname>Adam</surname><given-names>S</given-names> </name><name name-style="western"><surname>Dias</surname><given-names>S</given-names> </name><name name-style="western"><surname>Nyawo</surname><given-names>T</given-names> </name><name name-style="western"><surname>Pheiffer</surname><given-names>C</given-names> </name></person-group><article-title>A systematic review to compare adverse pregnancy outcomes in women with pregestational diabetes and gestational diabetes</article-title><source>Int J Environ Res Public Health</source><year>2022</year><month>08</month><day>31</day><volume>19</volume><issue>17</issue><fpage>10846</fpage><pub-id pub-id-type="doi">10.3390/ijerph191710846</pub-id><pub-id pub-id-type="medline">36078559</pub-id></nlm-citation></ref><ref id="ref5"><label>5</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>de la Torre</surname><given-names>NG</given-names> </name><name name-style="western"><surname>Assaf-Balut</surname><given-names>C</given-names> </name><name name-style="western"><surname>Jim&#x00E9;nez Varas</surname><given-names>I</given-names> </name><etal/></person-group><article-title>Effectiveness of following mediterranean diet recommendations in the real world in the incidence of gestational diabetes mellitus (GDM) and adverse maternal-foetal outcomes: a prospective, universal, interventional study with a single group. The St Carlos study</article-title><source>Nutrients</source><year>2019</year><month>05</month><day>28</day><volume>11</volume><issue>6</issue><fpage>1210</fpage><pub-id pub-id-type="doi">10.3390/nu11061210</pub-id><pub-id pub-id-type="medline">31141972</pub-id></nlm-citation></ref><ref id="ref6"><label>6</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Berger</surname><given-names>H</given-names> </name><name name-style="western"><surname>Gagnon</surname><given-names>R</given-names> </name><name name-style="western"><surname>Sermer</surname><given-names>M</given-names> </name><etal/></person-group><article-title>RETIRED: diabetes in pregnancy</article-title><source>J Obstet Gynaecol Can</source><year>2016</year><volume>38</volume><issue>7</issue><fpage>667</fpage><lpage>679</lpage><pub-id pub-id-type="doi">10.1016/j.jogc.2016.04.002</pub-id></nlm-citation></ref><ref id="ref7"><label>7</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Mustafa</surname><given-names>M</given-names> </name><name name-style="western"><surname>Bogdanet</surname><given-names>D</given-names> </name><name name-style="western"><surname>Khattak</surname><given-names>A</given-names> </name><etal/></person-group><article-title>Early gestational diabetes mellitus (GDM) is associated with worse pregnancy outcomes compared with GDM diagnosed at 24-28&#x2009;weeks gestation despite early treatment</article-title><source>QJM</source><year>2021</year><month>02</month><day>18</day><volume>114</volume><issue>1</issue><fpage>17</fpage><lpage>24</lpage><pub-id pub-id-type="doi">10.1093/qjmed/hcaa167</pub-id><pub-id pub-id-type="medline">32413109</pub-id></nlm-citation></ref><ref id="ref8"><label>8</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Bianco</surname><given-names>ME</given-names> </name><name name-style="western"><surname>Josefson</surname><given-names>JL</given-names> </name></person-group><article-title>Hyperglycemia during pregnancy and long-term offspring outcomes</article-title><source>Curr Diab Rep</source><year>2019</year><month>11</month><day>21</day><volume>19</volume><issue>12</issue><fpage>143</fpage><pub-id pub-id-type="doi">10.1007/s11892-019-1267-6</pub-id><pub-id pub-id-type="medline">31754898</pub-id></nlm-citation></ref><ref id="ref9"><label>9</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Choi</surname><given-names>RY</given-names> </name><name name-style="western"><surname>Coyner</surname><given-names>AS</given-names> </name><name name-style="western"><surname>Kalpathy-Cramer</surname><given-names>J</given-names> </name><name name-style="western"><surname>Chiang</surname><given-names>MF</given-names> </name><name name-style="western"><surname>Campbell</surname><given-names>JP</given-names> </name></person-group><article-title>Introduction to machine learning, neural networks, and deep learning</article-title><source>Transl Vis Sci Technol</source><year>2020</year><month>02</month><day>27</day><volume>9</volume><issue>2</issue><fpage>14</fpage><pub-id pub-id-type="doi">10.1167/tvst.9.2.14</pub-id><pub-id pub-id-type="medline">32704420</pub-id></nlm-citation></ref><ref id="ref10"><label>10</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Darsareh</surname><given-names>F</given-names> </name><name name-style="western"><surname>Ranjbar</surname><given-names>A</given-names> </name><name name-style="western"><surname>Farashah</surname><given-names>MV</given-names> </name><name name-style="western"><surname>Mehrnoush</surname><given-names>V</given-names> </name><name name-style="western"><surname>Shekari</surname><given-names>M</given-names> </name><name name-style="western"><surname>Jahromi</surname><given-names>MS</given-names> </name></person-group><article-title>Application of machine learning to identify risk factors of birth asphyxia</article-title><source>BMC Pregnancy Childbirth</source><year>2023</year><month>03</month><day>8</day><volume>23</volume><issue>1</issue><fpage>156</fpage><pub-id pub-id-type="doi">10.1186/s12884-023-05486-9</pub-id><pub-id pub-id-type="medline">36890453</pub-id></nlm-citation></ref><ref id="ref11"><label>11</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Taeidi</surname><given-names>E</given-names> </name><name name-style="western"><surname>Ranjbar</surname><given-names>A</given-names> </name><name name-style="western"><surname>Montazeri</surname><given-names>F</given-names> </name><name name-style="western"><surname>Mehrnoush</surname><given-names>V</given-names> </name><name name-style="western"><surname>Darsareh</surname><given-names>F</given-names> </name></person-group><article-title>Machine learning-based approach to predict intrauterine growth restriction</article-title><source>Cureus</source><year>2023</year><month>07</month><volume>15</volume><issue>7</issue><fpage>e41448</fpage><pub-id pub-id-type="doi">10.7759/cureus.41448</pub-id><pub-id pub-id-type="medline">37546140</pub-id></nlm-citation></ref><ref id="ref12"><label>12</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Roozbeh</surname><given-names>N</given-names> </name><name name-style="western"><surname>Montazeri</surname><given-names>F</given-names> </name><name name-style="western"><surname>Farashah</surname><given-names>MV</given-names> </name><name name-style="western"><surname>Mehrnoush</surname><given-names>V</given-names> </name><name name-style="western"><surname>Darsareh</surname><given-names>F</given-names> </name></person-group><article-title>Proposing a machine learning-based model for predicting nonreassuring fetal heart</article-title><source>Sci Rep</source><year>2025</year><month>03</month><day>6</day><volume>15</volume><issue>1</issue><fpage>7812</fpage><pub-id pub-id-type="doi">10.1038/s41598-025-92810-2</pub-id><pub-id pub-id-type="medline">40050357</pub-id></nlm-citation></ref><ref id="ref13"><label>13</label><nlm-citation citation-type="other"><person-group person-group-type="author"><name name-style="western"><surname>Jeyaparam</surname><given-names>S</given-names> </name><name name-style="western"><surname>Agha-Jaffar</surname><given-names>R</given-names> </name><name name-style="western"><surname>Robinson</surname><given-names>S</given-names> </name><name name-style="western"><surname>Khunti</surname><given-names>K</given-names> </name></person-group><article-title>Association of socioeconomic deprivation on gestational diabetes incidence and perinatal outcomes</article-title><source>Research Square</source><comment>Preprint posted online on 2023</comment><pub-id pub-id-type="doi">10.21203/rs.3.rs-2410272/v1</pub-id></nlm-citation></ref><ref id="ref14"><label>14</label><nlm-citation citation-type="web"><article-title>GDM dataset.xlsx</article-title><source>figshare</source><access-date>2025-06-26</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://figshare.com/articles/dataset/GDM_Dataset_xlsx/21806472?file=38695140">https://figshare.com/articles/dataset/GDM_Dataset_xlsx/21806472?file=38695140</ext-link></comment></nlm-citation></ref><ref id="ref15"><label>15</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Chen</surname><given-names>ME</given-names> </name><name name-style="western"><surname>Aguirre</surname><given-names>RS</given-names> </name><name name-style="western"><surname>Hannon</surname><given-names>TS</given-names> </name></person-group><article-title>Methods for measuring risk for type 2 diabetes in youth: the oral glucose tolerance test (OGTT)</article-title><source>Curr Diab Rep</source><year>2018</year><month>06</month><day>16</day><volume>18</volume><issue>8</issue><fpage>51</fpage><pub-id pub-id-type="doi">10.1007/s11892-018-1023-3</pub-id><pub-id pub-id-type="medline">29909550</pub-id></nlm-citation></ref><ref id="ref16"><label>16</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Fakhraei</surname><given-names>R</given-names> </name><name name-style="western"><surname>Denize</surname><given-names>K</given-names> </name><name name-style="western"><surname>Simon</surname><given-names>A</given-names> </name><etal/></person-group><article-title>Predictors of adverse pregnancy outcomes in pregnant women living with obesity: a systematic review</article-title><source>Int J Environ Res Public Health</source><year>2022</year><month>02</month><day>12</day><volume>19</volume><issue>4</issue><fpage>2063</fpage><pub-id pub-id-type="doi">10.3390/ijerph19042063</pub-id><pub-id pub-id-type="medline">35206265</pub-id></nlm-citation></ref><ref id="ref17"><label>17</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>Garcia</surname><given-names>EA</given-names> </name></person-group><article-title>ADASYN: Adaptive Synthetic Sampling approach for imbalanced learning</article-title><conf-name>2008 IEEE International Joint Conference on Neural Networks (IEEE World Congress on Computational Intelligence)</conf-name><conf-date>Jun 1-8, 2008</conf-date><conf-loc>Hong Kong</conf-loc><pub-id pub-id-type="doi">10.1109/IJCNN.2008.4633969</pub-id></nlm-citation></ref><ref id="ref18"><label>18</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Yuen</surname><given-names>L</given-names> </name><name name-style="western"><surname>Saeedi</surname><given-names>P</given-names> </name><name name-style="western"><surname>Riaz</surname><given-names>M</given-names> </name><etal/></person-group><article-title>Projections of the prevalence of hyperglycaemia in pregnancy in 2019 and beyond: results from the International Diabetes Federation Diabetes Atlas, 9th edition</article-title><source>Diabetes Res Clin Pract</source><year>2019</year><month>11</month><volume>157</volume><fpage>107841</fpage><pub-id pub-id-type="doi">10.1016/j.diabres.2019.107841</pub-id></nlm-citation></ref><ref id="ref19"><label>19</label><nlm-citation citation-type="web"><article-title>Diabetes in pregnancy: management from preconception to the postnatal period</article-title><source>National Institute for Health and Care Excellence</source><access-date>2025-07-17</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.nice.org.uk/guidance/ng3">https://www.nice.org.uk/guidance/ng3</ext-link></comment></nlm-citation></ref><ref id="ref20"><label>20</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>He</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Ma</surname><given-names>RCW</given-names> </name><name name-style="western"><surname>McIntyre</surname><given-names>HD</given-names> </name><etal/></person-group><article-title>Comparing IADPSG and NICE diagnostic criteria for GDM in predicting adverse pregnancy outcomes</article-title><source>Diabetes Care</source><year>2022</year><month>09</month><day>1</day><volume>45</volume><issue>9</issue><fpage>2046</fpage><lpage>2054</lpage><pub-id pub-id-type="doi">10.2337/dc22-0579</pub-id><pub-id pub-id-type="medline">35880808</pub-id></nlm-citation></ref><ref id="ref21"><label>21</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Bogdanet</surname><given-names>D</given-names> </name><name name-style="western"><surname>Egan</surname><given-names>A</given-names> </name><name name-style="western"><surname>Reddin</surname><given-names>C</given-names> </name><name name-style="western"><surname>Kirwan</surname><given-names>B</given-names> </name><name name-style="western"><surname>Carmody</surname><given-names>L</given-names> </name><name name-style="western"><surname>Dunne</surname><given-names>FA</given-names> </name></person-group><article-title>ATLANTIC DIP: despite insulin therapy in women with IADPSG diagnosed GDM, desired pregnancy outcomes are still not achieved. What are we missing?</article-title><source>Diabetes Res Clin Pract</source><year>2018</year><month>02</month><volume>136</volume><fpage>116</fpage><lpage>123</lpage><pub-id pub-id-type="doi">10.1016/j.diabres.2017.12.003</pub-id></nlm-citation></ref><ref id="ref22"><label>22</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><collab>American Diabetes Association Professional Practice Committee</collab></person-group><article-title>15. Management of diabetes in pregnancy: standards of care in diabetes-2024</article-title><source>Diabetes Care</source><year>2024</year><month>01</month><day>1</day><volume>47</volume><issue>Suppl 1</issue><fpage>S282</fpage><lpage>S294</lpage><pub-id pub-id-type="doi">10.2337/dc24-S015</pub-id><pub-id pub-id-type="medline">38078583</pub-id></nlm-citation></ref><ref id="ref23"><label>23</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Sweeting</surname><given-names>AN</given-names> </name><name name-style="western"><surname>Ross</surname><given-names>GP</given-names> </name><name name-style="western"><surname>Hyett</surname><given-names>J</given-names> </name><etal/></person-group><article-title>Gestational diabetes mellitus in early pregnancy: evidence for poor pregnancy outcomes despite treatment</article-title><source>Diabetes Care</source><year>2016</year><month>01</month><volume>39</volume><issue>1</issue><fpage>75</fpage><lpage>81</lpage><pub-id pub-id-type="doi">10.2337/dc15-0433</pub-id><pub-id pub-id-type="medline">26645084</pub-id></nlm-citation></ref><ref id="ref24"><label>24</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Harreiter</surname><given-names>J</given-names> </name><name name-style="western"><surname>Simmons</surname><given-names>D</given-names> </name><name name-style="western"><surname>Desoye</surname><given-names>G</given-names> </name><etal/></person-group><article-title>IADPSG and WHO 2013 gestational diabetes mellitus criteria identify obese women with marked insulin resistance in early pregnancy</article-title><source>Diabetes Care</source><year>2016</year><month>07</month><volume>39</volume><issue>7</issue><fpage>e90</fpage><lpage>2</lpage><pub-id pub-id-type="doi">10.2337/dc16-0200</pub-id><pub-id pub-id-type="medline">27208336</pub-id></nlm-citation></ref><ref id="ref25"><label>25</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Fasoulakis</surname><given-names>Z</given-names> </name><name name-style="western"><surname>Koutras</surname><given-names>A</given-names> </name><name name-style="western"><surname>Antsaklis</surname><given-names>P</given-names> </name><etal/></person-group><article-title>Intrauterine growth restriction due to gestational diabetes: from pathophysiology to diagnosis and management</article-title><source>Medicina (Kaunas)</source><year>2023</year><month>06</month><day>13</day><volume>59</volume><issue>6</issue><fpage>1139</fpage><pub-id pub-id-type="doi">10.3390/medicina59061139</pub-id><pub-id pub-id-type="medline">37374343</pub-id></nlm-citation></ref><ref id="ref26"><label>26</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Hiden</surname><given-names>U</given-names> </name><name name-style="western"><surname>Glitzner</surname><given-names>E</given-names> </name><name name-style="western"><surname>Hartmann</surname><given-names>M</given-names> </name><name name-style="western"><surname>Desoye</surname><given-names>G</given-names> </name></person-group><article-title>Insulin and the IGF system in the human placenta of normal and diabetic pregnancies</article-title><source>J Anat</source><year>2009</year><month>07</month><volume>215</volume><issue>1</issue><fpage>60</fpage><lpage>68</lpage><pub-id pub-id-type="doi">10.1111/j.1469-7580.2008.01035.x</pub-id><pub-id pub-id-type="medline">19467150</pub-id></nlm-citation></ref><ref id="ref27"><label>27</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Moore</surname><given-names>TR</given-names> </name></person-group><article-title>A comparison of amniotic fluid fetal pulmonary phospholipids in normal and diabetic pregnancy</article-title><source>Am J Obstet Gynecol</source><year>2002</year><month>04</month><volume>186</volume><issue>4</issue><fpage>641</fpage><lpage>650</lpage><pub-id pub-id-type="doi">10.1067/mob.2002.122851</pub-id><pub-id pub-id-type="medline">11967485</pub-id></nlm-citation></ref><ref id="ref28"><label>28</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Metzger</surname><given-names>BE</given-names> </name><name name-style="western"><surname>Persson</surname><given-names>B</given-names> </name><name name-style="western"><surname>Lowe</surname><given-names>LP</given-names> </name><etal/></person-group><article-title>Hyperglycemia and adverse pregnancy outcome study: neonatal glycemia</article-title><source>Pediatrics</source><year>2010</year><month>12</month><volume>126</volume><issue>6</issue><fpage>e1545</fpage><lpage>52</lpage><pub-id pub-id-type="doi">10.1542/peds.2009-2257</pub-id><pub-id pub-id-type="medline">21078733</pub-id></nlm-citation></ref><ref id="ref29"><label>29</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Dani</surname><given-names>C</given-names> </name><name name-style="western"><surname>Corsini</surname><given-names>I</given-names> </name></person-group><article-title>Guidelines for management of neonatal hypoglycemia: are they actually applicable?</article-title><source>JAMA Pediatr</source><year>2020</year><month>07</month><day>1</day><volume>174</volume><issue>7</issue><fpage>638</fpage><lpage>639</lpage><pub-id pub-id-type="doi">10.1001/jamapediatrics.2020.0632</pub-id><pub-id pub-id-type="medline">32391888</pub-id></nlm-citation></ref><ref id="ref30"><label>30</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Burton</surname><given-names>GJ</given-names> </name><name name-style="western"><surname>Redman</surname><given-names>CW</given-names> </name><name name-style="western"><surname>Roberts</surname><given-names>JM</given-names> </name><name name-style="western"><surname>Moffett</surname><given-names>A</given-names> </name></person-group><article-title>Pre-eclampsia: pathophysiology and clinical implications</article-title><source>BMJ</source><year>2019</year><month>07</month><day>15</day><volume>366</volume><fpage>l2381</fpage><pub-id pub-id-type="doi">10.1136/bmj.l2381</pub-id><pub-id pub-id-type="medline">31307997</pub-id></nlm-citation></ref><ref id="ref31"><label>31</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Jiang</surname><given-names>L</given-names> </name><name name-style="western"><surname>Tang</surname><given-names>K</given-names> </name><name name-style="western"><surname>Magee</surname><given-names>LA</given-names> </name><etal/></person-group><article-title>A global view of hypertensive disorders and diabetes mellitus during pregnancy</article-title><source>Nat Rev Endocrinol</source><year>2022</year><month>12</month><volume>18</volume><issue>12</issue><fpage>760</fpage><lpage>775</lpage><pub-id pub-id-type="doi">10.1038/s41574-022-00734-y</pub-id><pub-id pub-id-type="medline">36109676</pub-id></nlm-citation></ref><ref id="ref32"><label>32</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Riise</surname><given-names>HKR</given-names> </name><name name-style="western"><surname>Sulo</surname><given-names>G</given-names> </name><name name-style="western"><surname>Tell</surname><given-names>GS</given-names> </name><etal/></person-group><article-title>Association between gestational hypertension and risk of cardiovascular disease among 617 589 Norwegian women</article-title><source>J Am Heart Assoc</source><year>2018</year><month>05</month><day>13</day><volume>7</volume><issue>10</issue><fpage>e008337</fpage><pub-id pub-id-type="doi">10.1161/JAHA.117.008337</pub-id><pub-id pub-id-type="medline">29755034</pub-id></nlm-citation></ref><ref id="ref33"><label>33</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Sinkey</surname><given-names>RG</given-names> </name><name name-style="western"><surname>Battarbee</surname><given-names>AN</given-names> </name><name name-style="western"><surname>Bello</surname><given-names>NA</given-names> </name><name name-style="western"><surname>Ives</surname><given-names>CW</given-names> </name><name name-style="western"><surname>Oparil</surname><given-names>S</given-names> </name><name name-style="western"><surname>Tita</surname><given-names>ATN</given-names> </name></person-group><article-title>Prevention, diagnosis, and management of hypertensive disorders of pregnancy: a comparison of international guidelines</article-title><source>Curr Hypertens Rep</source><year>2020</year><month>08</month><day>27</day><volume>22</volume><issue>9</issue><fpage>66</fpage><pub-id pub-id-type="doi">10.1007/s11906-020-01082-w</pub-id><pub-id pub-id-type="medline">32852691</pub-id></nlm-citation></ref><ref id="ref34"><label>34</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Cheung</surname><given-names>BMY</given-names> </name><name name-style="western"><surname>Li</surname><given-names>C</given-names> </name></person-group><article-title>Diabetes and hypertension: is there a common metabolic pathway?</article-title><source>Curr Atheroscler Rep</source><year>2012</year><month>04</month><volume>14</volume><issue>2</issue><fpage>160</fpage><lpage>166</lpage><pub-id pub-id-type="doi">10.1007/s11883-012-0227-2</pub-id><pub-id pub-id-type="medline">22281657</pub-id></nlm-citation></ref><ref id="ref35"><label>35</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Chiarello</surname><given-names>DI</given-names> </name><name name-style="western"><surname>Abad</surname><given-names>C</given-names> </name><name name-style="western"><surname>Rojas</surname><given-names>D</given-names> </name><etal/></person-group><article-title>Oxidative stress: normal pregnancy versus preeclampsia</article-title><source>Biochim Biophys Acta Mol Basis Dis</source><year>2020</year><month>02</month><day>1</day><volume>1866</volume><issue>2</issue><fpage>165354</fpage><pub-id pub-id-type="doi">10.1016/j.bbadis.2018.12.005</pub-id><pub-id pub-id-type="medline">30590104</pub-id></nlm-citation></ref><ref id="ref36"><label>36</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Rani</surname><given-names>N</given-names> </name><name name-style="western"><surname>Dhingra</surname><given-names>R</given-names> </name><name name-style="western"><surname>Arya</surname><given-names>DS</given-names> </name><name name-style="western"><surname>Kalaivani</surname><given-names>M</given-names> </name><name name-style="western"><surname>Bhatla</surname><given-names>N</given-names> </name><name name-style="western"><surname>Kumar</surname><given-names>R</given-names> </name></person-group><article-title>Role of oxidative stress markers and antioxidants in the placenta of preeclamptic patients</article-title><source>J Obstet Gynaecol Res</source><year>2010</year><month>12</month><volume>36</volume><issue>6</issue><fpage>1189</fpage><lpage>1194</lpage><pub-id pub-id-type="doi">10.1111/j.1447-0756.2010.01303.x</pub-id><pub-id pub-id-type="medline">21114571</pub-id></nlm-citation></ref><ref id="ref37"><label>37</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Phoswa</surname><given-names>WN</given-names> </name><name name-style="western"><surname>Khaliq</surname><given-names>OP</given-names> </name></person-group><article-title>The role of oxidative stress in hypertensive disorders of pregnancy (preeclampsia, gestational hypertension) and metabolic disorder of pregnancy (gestational diabetes mellitus)</article-title><source>Oxid Med Cell Longev</source><year>2021</year><volume>2021</volume><fpage>5581570</fpage><pub-id pub-id-type="doi">10.1155/2021/5581570</pub-id><pub-id pub-id-type="medline">34194606</pub-id></nlm-citation></ref><ref id="ref38"><label>38</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Dalfr&#x00E0;</surname><given-names>MG</given-names> </name><name name-style="western"><surname>Burlina</surname><given-names>S</given-names> </name><name name-style="western"><surname>Del Vescovo</surname><given-names>GG</given-names> </name><name name-style="western"><surname>Lapolla</surname><given-names>A</given-names> </name></person-group><article-title>Genetics and epigenetics: new insight on gestational diabetes mellitus</article-title><source>Front Endocrinol (Lausanne)</source><year>2020</year><volume>11</volume><fpage>602477</fpage><pub-id pub-id-type="doi">10.3389/fendo.2020.602477</pub-id><pub-id pub-id-type="medline">33335512</pub-id></nlm-citation></ref><ref id="ref39"><label>39</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lappas</surname><given-names>M</given-names> </name></person-group><article-title>Effect of pre-existing maternal obesity, gestational diabetes and adipokines on the expression of genes involved in lipid metabolism in adipose tissue</article-title><source>Metab Clin Exp</source><year>2014</year><month>02</month><volume>63</volume><issue>2</issue><fpage>250</fpage><lpage>262</lpage><pub-id pub-id-type="doi">10.1016/j.metabol.2013.10.001</pub-id><pub-id pub-id-type="medline">24262292</pub-id></nlm-citation></ref><ref id="ref40"><label>40</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Koenigbauer</surname><given-names>JT</given-names> </name><name name-style="western"><surname>Fangmann</surname><given-names>L</given-names> </name><name name-style="western"><surname>Rostin</surname><given-names>P</given-names> </name><etal/></person-group><article-title>Advanced maternal age (AMA) and 75&#x202F;g OGTT glucose levels are pedictors for insulin therapy in women with gestational diabetes (GDM)</article-title><source>J Perinat Med</source><year>2023</year><month>11</month><day>27</day><volume>51</volume><issue>9</issue><fpage>1154</fpage><lpage>1162</lpage><pub-id pub-id-type="doi">10.1515/jpm-2023-0170</pub-id><pub-id pub-id-type="medline">37466452</pub-id></nlm-citation></ref></ref-list><app-group><supplementary-material id="app1"><label>Multimedia Appendix 1</label><p>Missing value rates of variables in the final dataset.</p><media xlink:href="medinform_v13i1e71539_app1.png" xlink:title="PNG File, 112 KB"/></supplementary-material><supplementary-material id="app2"><label>Multimedia Appendix 2</label><p>External validation outcomes for the stacking model in patients with gestational diabetes mellitus.</p><media xlink:href="medinform_v13i1e71539_app2.png" xlink:title="PNG File, 85 KB"/></supplementary-material></app-group></back></article>