<?xml version="1.0" encoding="UTF-8"?><!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "journalpublishing.dtd"><article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" dtd-version="2.0" xml:lang="en" article-type="review-article"><front><journal-meta><journal-id journal-id-type="nlm-ta">JMIR Med Inform</journal-id><journal-id journal-id-type="publisher-id">medinform</journal-id><journal-id journal-id-type="index">7</journal-id><journal-title>JMIR Medical Informatics</journal-title><abbrev-journal-title>JMIR Med Inform</abbrev-journal-title><issn pub-type="epub">2291-9694</issn><publisher><publisher-name>JMIR Publications</publisher-name><publisher-loc>Toronto, Canada</publisher-loc></publisher></journal-meta><article-meta><article-id pub-id-type="publisher-id">v14i1e80930</article-id><article-id pub-id-type="doi">10.2196/80930</article-id><article-categories><subj-group subj-group-type="heading"><subject>Review</subject></subj-group></article-categories><title-group><article-title>Machine Learning for Intraoperative Bleeding Prediction in Patients Undergoing Surgery: Scoping Review</article-title></title-group><contrib-group><contrib contrib-type="author" equal-contrib="yes"><name name-style="western"><surname>Yan</surname><given-names>Shiqiong</given-names></name><degrees>MA</degrees><xref ref-type="aff" rid="aff1">1</xref><xref ref-type="fn" rid="equal-contrib1">*</xref></contrib><contrib contrib-type="author" equal-contrib="yes"><name name-style="western"><surname>Zhang</surname><given-names>Ping</given-names></name><degrees>DA</degrees><xref ref-type="aff" rid="aff1">1</xref><xref ref-type="fn" rid="equal-contrib1">*</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Qiao</surname><given-names>Wanwan</given-names></name><degrees>MA</degrees><xref ref-type="aff" rid="aff2">2</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Xie</surname><given-names>Sijia</given-names></name><degrees>MA</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Hu</surname><given-names>Huan</given-names></name><degrees>DA</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Gao</surname><given-names>Yi</given-names></name><degrees>MA</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Xie</surname><given-names>Linli</given-names></name><degrees>MA</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author" corresp="yes"><name name-style="western"><surname>Jing</surname><given-names>Jie</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib></contrib-group><aff id="aff1"><institution>Department of Nursing, Sichuan Provincial People&#x2019;s Hospital, University of Electronic Science and Technology of China</institution><addr-line>No. 32, West Section 2, First Ring Road, Qingyang District</addr-line><addr-line>Chengdu</addr-line><country>China</country></aff><aff id="aff2"><institution>Department of nursing, Chengdu University of Traditional Chinese Medicine</institution><addr-line>Chengdu</addr-line><country>China</country></aff><contrib-group><contrib contrib-type="editor"><name name-style="western"><surname>Benis</surname><given-names>Arriel</given-names></name></contrib></contrib-group><contrib-group><contrib contrib-type="reviewer"><name name-style="western"><surname>Beunza</surname><given-names>Juan-Jose</given-names></name></contrib><contrib contrib-type="reviewer"><name name-style="western"><surname>Sawesi</surname><given-names>Suhila</given-names></name></contrib></contrib-group><author-notes><corresp>Correspondence to Jie Jing, PhD, Department of Nursing, Sichuan Provincial People&#x2019;s Hospital, University of Electronic Science and Technology of China, No. 32, West Section 2, First Ring Road, Qingyang District, Chengdu, 610072, China, 86 028-87393999, 86 028-87393999; <email>jingjie_1130@163.com</email></corresp><fn fn-type="equal" id="equal-contrib1"><label>*</label><p>these authors contributed equally</p></fn></author-notes><pub-date pub-type="collection"><year>2026</year></pub-date><pub-date pub-type="epub"><day>10</day><month>6</month><year>2026</year></pub-date><volume>14</volume><elocation-id>e80930</elocation-id><history><date date-type="received"><day>18</day><month>07</month><year>2025</year></date><date date-type="rev-recd"><day>08</day><month>01</month><year>2026</year></date><date date-type="accepted"><day>08</day><month>01</month><year>2026</year></date></history><copyright-statement>&#x00A9; Shiqiong Yan, Ping Zhang, Wanwan Qiao, Sijia Xie, Huan Hu, Yi Gao, Linli Xie, Jie Jing. Originally published in JMIR Medical Informatics (<ext-link ext-link-type="uri" xlink:href="https://medinform.jmir.org">https://medinform.jmir.org</ext-link>), 10.6.2026. </copyright-statement><copyright-year>2026</copyright-year><license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (<ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">https://creativecommons.org/licenses/by/4.0/</ext-link>), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Medical Informatics, is properly cited. The complete bibliographic information, a link to the original publication on <ext-link ext-link-type="uri" xlink:href="https://medinform.jmir.org/">https://medinform.jmir.org/</ext-link>, as well as this copyright and license information must be included.</p></license><self-uri xlink:type="simple" xlink:href="https://medinform.jmir.org/2026/1/e80930"/><abstract><sec><title>Background</title><p>Intraoperative bleeding is a critical event that impacts surgical safety and patient outcomes. Machine learning (ML) has demonstrated potential in prediction tasks, yet its methodological rigor and clinical translation face challenges.</p></sec><sec><title>Objective</title><p>This scoping review aims to systematically synthesize the current state of development, performance, and validation of ML models for predicting intraoperative bleeding, and to identify key barriers to their clinical implementation.</p></sec><sec sec-type="methods"><title>Methods</title><p>Following the PRISMA-ScR (Preferred Reporting Items for Systematic Reviews and Meta-Analyses extension for Scoping Reviews) guidelines, we systematically searched 7 databases (PubMed, Web of Science, Embase, CINAHL, CNKI [China National Knowledge Infrastructure], Wanfang, and VIP [China Science and Technology Journal Database]) from their inception to April 2025. Moreover, 2 reviewers (SY and PZ) independently screened studies, extracted data using the Checklist for Critical Appraisal and Data Extraction for Systematic Reviews of Prediction Modeling Studies (CHARMS), and assessed the risk of bias using the Prediction Model Risk Of Bias Assessment Tool (PROBAST). A narrative synthesis was used for data analysis.</p></sec><sec sec-type="results"><title>Results</title><p>Out of 2651 screened records, 23 studies were included (sample sizes ranging from 48 to 48,543). Tree-based ensemble models (eg, random forests and extreme gradient boosting) were the most frequently used (16/23, 70%), followed by logistic regression (13/23, 57%), and deep learning (11/23, 48%). Model discrimination varied widely (mean area under the curve [AUC] 0.82, SD 0.08, range 0.63&#x2010;0.93). Integration of multimodal data (electronic health records+imaging) was associated with higher performance. However, model validation was often inadequate; only 6 studies (6/23, 26%) performed external validation, and performance often declined (eg, AUC decreased from 0.85 to 0.63 in 1 study). Reporting exhibited selective bias; AUC was commonly reported (19/23, 83%), whereas key classification metrics, such as calibration (10/23, 43%) and precision (4/23, 17%), were often omitted. PROBAST assessment indicated a high risk of bias in all included studies (23/23, 100%).</p></sec><sec sec-type="conclusions"><title>Conclusions</title><p>While ML models demonstrate technical promise for predicting intraoperative bleeding, our PROBAST assessment revealed a universally high risk of bias across all included studies. This fundamental methodological limitation, coupled with a severe lack of external validation and poor transparency in reporting, severely constrains the current clinical reliability of these models. Future research must prioritize prospective multicenter validation, adherence to Transparent Reporting of a Multivariable Prediction Model for Individual Prognosis or Diagnosis (TRIPOD) reporting guidelines, and enhanced model interpretability to bridge the gap toward clinical utility.</p></sec></abstract><kwd-group><kwd>intraoperative bleeding</kwd><kwd>machine learning</kwd><kwd>scoping review</kwd><kwd>clinical decision support</kwd><kwd>predictive models</kwd></kwd-group></article-meta></front><body><sec id="s1" sec-type="intro"><title>Introduction</title><sec id="s1-1"><title>Background</title><p>Perioperative bleeding is a significant risk factor for surgical procedures and is strongly linked to increased patient mortality, higher rates of postoperative complications, and excessive use of health care resources [<xref ref-type="bibr" rid="ref1">1</xref>]. Intraoperative bleeding control effectiveness directly impacts both surgical safety and patient outcomes [<xref ref-type="bibr" rid="ref2">2</xref>]. Excessive blood loss compromises the surgical field. It prolongs the duration of surgery [<xref ref-type="bibr" rid="ref3">3</xref>] while also increasing the risk of severe adverse events, such as myocardial infarction and acute kidney injury [<xref ref-type="bibr" rid="ref4">4</xref>]. While patient blood management strategies focus on optimizing preoperative risk assessment, facilitating real-time intraoperative interventions, and guiding postoperative transfusion decisions through accurate predictions of blood loss [<xref ref-type="bibr" rid="ref5">5</xref>], current clinical practice still struggles with the reliability of predictive tools.</p><p>Intraoperative blood loss, quantified as estimated blood loss, is a fundamental quantitative metric in perioperative management, providing critical evidence to guide fluid resuscitation strategies, transfusion decisions, and the prevention and control of postoperative complications. Consequently, monitoring accuracy is regarded as a quality standard for perioperative care [<xref ref-type="bibr" rid="ref6">6</xref>]. However, current clinical assessment methods exhibit dual limitations&#x2014;subjective assessment techniques (eg, visual estimation of soaked gauze or suction canister volume) are susceptible to operator experience, resulting in high error rates, and calculation-based methods (relying on material weight differences) struggle to capture the dynamic blood loss process in real time [<xref ref-type="bibr" rid="ref2">2</xref>]. Such inaccuracies can lead to erroneous transfusion decisions. Research has confirmed that inappropriate transfusion is an independent risk factor for postoperative infection and organ dysfunction [<xref ref-type="bibr" rid="ref7">7</xref>]. Although existing risk assessment tools (the surgical blood loss score) are widely used [<xref ref-type="bibr" rid="ref5">5</xref>,<xref ref-type="bibr" rid="ref8">8</xref>,<xref ref-type="bibr" rid="ref9">9</xref>], their inherent weaknesses, namely heterogeneous scoring criteria and a lag in advances in surgical techniques, are becoming increasingly apparent.</p><p>Although traditional prediction models (such as logistic regression) are widely used, they are constrained by linear assumptions and fail to effectively capture complex nonlinear interactions and multicollinearity among variables. Evidence suggests that predictive accuracy based on clinical experience is significantly lower than that achieved by machine learning (ML) methods [<xref ref-type="bibr" rid="ref10">10</xref>]. With the advancement of hospital information platforms, vast amounts of high-dimensional, heterogeneous clinical data have been accumulated. Due to its unique advantages in processing such data and identifying nonlinear patterns [<xref ref-type="bibr" rid="ref11">11</xref>], ML has rapidly emerged as a research hotspot in the field of intraoperative bleeding prediction. However, the existing body of research evidence exhibits significant fragmentation. Studies predominantly concentrate on single surgical procedures (eg, cesarean section [<xref ref-type="bibr" rid="ref12">12</xref>] and spinal surgery [<xref ref-type="bibr" rid="ref13">13</xref>]), resulting in a scarcity of cross-scenario algorithm comparisons; equally important, the methodological quality and validation rigor of these models are highly variable and often inadequate. Methodological limitations (such as inconsistent data preprocessing and the absence of standardized validation frameworks) have yet to be systematically evaluated and standardized. More critically, the clinical translation pathway is severely hindered by inadequate model generalizability, largely due to a pervasive lack of robust external validation. This fragmented landscape and lack of comprehensive evaluation, coupled with unaddressed methodological concerns, critically impede the understanding of ML&#x2019;s actual value and the identification of optimal implementation pathways for intraoperative bleeding prediction, necessitating the urgent integration and assessment of these methodologies through systematic approaches.</p></sec><sec id="s1-2"><title>Research Objective</title><p>Therefore, based on the PRISMA-Scr (Preferred Reporting Items for Systematic Reviews and Meta-Analyses extension for Scoping Reviews) framework [<xref ref-type="bibr" rid="ref14">14</xref>], this study establishes the following objectives:</p><list list-type="order"><list-item><p>To show how ML algorithms are used to predict bleeding during surgery in different settings;</p></list-item><list-item><p>To look at how ways of building and testing models (like picking features or choosing algorithms) affect their results (such as sensitivity and specificity);</p></list-item><list-item><p>To find the best-performing algorithms and define the criteria to judge them in specific fields; and</p></list-item><list-item><p>To highlight key problems that slow real-world use and suggest practical steps for future research and practice.</p></list-item></list></sec></sec><sec id="s2" sec-type="methods"><title>Methods</title><sec id="s2-1"><title>Overview</title><p>This scoping review was conducted following the methodological framework proposed by Arksey and O&#x2019;Malley [<xref ref-type="bibr" rid="ref15">15</xref>] and reported in accordance with the PRISMA-ScR guidelines [<xref ref-type="bibr" rid="ref14">14</xref>] to ensure transparency and consistency. Given the focus on prediction models, the Checklist for Critical Appraisal and Data Extraction for Systematic Reviews of Prediction Modeling Studies (CHARMS) [<xref ref-type="bibr" rid="ref16">16</xref>] was used to guide data extraction.</p></sec><sec id="s2-2"><title>Search Strategy</title><p>A systematic literature search was conducted on April 10, 2025. The search followed the Population, Intervention, Comparator, Outcome, and Study design (PICOS) framework. Both controlled vocabularies (eg, Medical Subject Headings for PubMed and Emtree for Embase) and free-text terms were used. Searches focused on three concepts&#x2014;population (patients undergoing surgery), predictive tool (ML models), and outcome (risk of bleeding during surgery). In total, seven databases were searched&#x2014;PubMed, Web of Science, Embase, CINAHL Complete, CNKI (China National Knowledge Infrastructure), Wanfang Data, and VIP (China Science and Technology Journal Database). <xref ref-type="table" rid="table1">Table 1</xref> details search strategies for each database. Reference lists of included studies and leading journals were also manually screened.</p><table-wrap id="t1" position="float"><label>Table 1.</label><caption><p>Search terms used to find studies.</p></caption><table id="table1" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Database</td><td align="left" valign="bottom">Hits, n</td><td align="left" valign="bottom">Search strategy</td></tr></thead><tbody><tr><td align="left" valign="top">PubMed</td><td align="left" valign="top">86</td><td align="left" valign="top">(&#x201C;Machine Learning&#x201D;[Mesh] OR &#x201C;Artificial Intelligence&#x201D;[Mesh] OR &#x201C;machine learning&#x201D;[tiab] OR &#x201C;deep learning&#x201D;[tiab]) AND (&#x201C;Surgery&#x201D;[Mesh] OR &#x201C;Surgical Procedures, Operative&#x201D;[Mesh] OR surg[tiab] OR intraoperative[tiab]) AND (&#x201C;Intraoperative Complications&#x201D;[Mesh] OR &#x201C;Hemorrhage&#x201D;[Mesh] OR &#x201C;Blood Loss, Surgical&#x201D;[Mesh] OR bleed[tiab] OR &#x201C;blood loss&#x201D;[tiab])</td></tr><tr><td align="left" valign="top">Web of Science</td><td align="left" valign="top">79</td><td align="left" valign="top">TS=((&#x201C;machine learning&#x201D; OR &#x201C;artificial intelligence&#x201D;) AND (surg* OR intraoperative) AND (bleed* OR &#x201C;blood loss&#x201D; OR hemorrhag*))</td></tr><tr><td align="left" valign="top">Embase</td><td align="left" valign="top">220</td><td align="left" valign="top">(&#x2018;machine learning&#x2019;/exp OR &#x2018;artificial intelligence&#x2019;/exp OR &#x2018;machine learning&#x2019;:ab,ti) AND (&#x2018;surgery&#x2019;/exp OR &#x2018;intraoperative period&#x2019;/exp OR surg:ab,ti) AND (&#x2018;intraoperative bleeding&#x2019;/exp OR &#x2018;surgical blood loss&#x2019;/exp OR bleed:ab,ti)</td></tr><tr><td align="left" valign="top">CINAHL Complete</td><td align="left" valign="top">1709</td><td align="left" valign="top">(MH &#x201C;Machine Learning+&#x201D; OR TI &#x201C;machine learning&#x201D; OR AB &#x201C;artificial intelligence&#x201D;) AND (MH &#x201C;Surgery, Operative+&#x201D; OR TI surg* OR AB intraoperative) AND (MH &#x201C;Intraoperative Complications+&#x201D; OR MH &#x201C;Blood Loss, Surgical+&#x201D; OR TI bleed* OR AB &#x201C;blood loss&#x201D;)</td></tr><tr><td align="left" valign="top">CNKI<sup><xref ref-type="table-fn" rid="table1fn1">a</xref></sup></td><td align="left" valign="top">212</td><td align="left" valign="top">(SU=(&#x2018;machine learning&#x2019; OR &#x2018;deep learning&#x2019; OR &#x2018;artificial intelligence&#x2019;)) AND (SU=(&#x2018;surgery&#x2019; OR &#x2018;intraoperative&#x2019; OR &#x2018;surgical procedure&#x2019;)) AND (SU=(&#x2018;intraoperative bleeding&#x2019; OR &#x2018;surgical bleeding&#x2019; OR &#x2018;blood loss&#x2019;))</td></tr><tr><td align="left" valign="top">Wanfang Data</td><td align="left" valign="top">331</td><td align="left" valign="top">(Subject:(&#x201C;machine learning&#x201D; OR &#x201C;artificial intelligence&#x201D;)) AND (Subject:(&#x201C;surgery&#x201D; OR &#x201C;surgical&#x201D;)) AND (Subject:(&#x201C;intraoperative bleeding&#x201D; OR &#x201C;surgical bleeding&#x201D;))</td></tr><tr><td align="left" valign="top">VIP<sup><xref ref-type="table-fn" rid="table1fn2">b</xref></sup></td><td align="left" valign="top">12</td><td align="left" valign="top">(U=(&#x2018;machine learning&#x2019; OR &#x2018;artificial intelligence&#x2019;)) AND (U=(&#x2018;intraoperative bleeding&#x2019; OR &#x2018;surgical blood loss&#x2019;)) AND (M=(&#x2018;surgery&#x2019;) OR T=(&#x2018;surgical patients&#x2019;))</td></tr></tbody></table><table-wrap-foot><fn id="table1fn1"><p><sup>a</sup>CNKI: China National Knowledge Infrastructure.</p></fn><fn id="table1fn2"><p><sup>b</sup>VIP: China Science and Technology Journal Database.</p></fn></table-wrap-foot></table-wrap></sec><sec id="s2-3"><title>Study Selection</title><p>Initial search records were imported into EndNote X9 (Clarivate). Duplicates were removed using automated and manual deduplication. Moreover, 2 reviewers (SY and PZ) independently screened titles and abstracts for relevance, recording decisions separately. For records retained after screening, both assessed full-text articles for eligibility and recorded decisions independently. Assessment was blind to ensure objectivity. Disagreements were resolved through discussion or, if needed, a third senior researcher (HH). A systematic review decision matrix (<xref ref-type="table" rid="table2">Table 2</xref>) guided the application of eligibility criteria.</p><table-wrap id="t2" position="float"><label>Table 2.</label><caption><p>Eligibility criteria.</p></caption><table id="table2" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Category</td><td align="left" valign="bottom">Inclusion criteria</td><td align="left" valign="bottom">Exclusion criteria</td></tr></thead><tbody><tr><td align="left" valign="top">Population</td><td align="left" valign="top">Adult patients (&#x2265;18 y) undergoing surgery</td><td align="left" valign="top">&#x2015;<sup><xref ref-type="table-fn" rid="table2fn1">a</xref></sup></td></tr><tr><td align="left" valign="top">Predictive tool</td><td align="left" valign="top">ML-based models explicitly developed to predict intraoperative bleeding risk</td><td align="left" valign="top">Models predicting only postoperative bleeding or failing to distinguish intraoperative or postoperative outcomes</td></tr><tr><td align="left" valign="top">Outcome reporting</td><td align="left" valign="top">Reported at least one performance metric: area under the curve (AUC), sensitivity, or specificity</td><td align="left" valign="top">&#x2015;</td></tr><tr><td align="left" valign="top">Study design</td><td align="left" valign="top">Primary research: retrospective or prospective cohort studies, case-control studies</td><td align="left" valign="top">Conference abstracts, reviews, case reports, editorials, letters</td></tr><tr><td align="left" valign="top">Publication status</td><td align="left" valign="top">Full text in Chinese or English (including peer-reviewed preprints)</td><td align="left" valign="top">Non&#x2013;peer-reviewed manuscripts, publications not in Chinese or English</td></tr><tr><td align="left" valign="top">Data source</td><td align="left" valign="top">&#x2015;</td><td align="left" valign="top">Nonclinical or invalid sources: animal experiments, simulated datasets, nonhospital data</td></tr></tbody></table><table-wrap-foot><fn id="table2fn1"><p><sup>a</sup>Not applicable.</p></fn></table-wrap-foot></table-wrap></sec><sec id="s2-4"><title>Eligibility Criteria</title><p>Studies that did not meet the inclusion criteria were excluded during screening. Eligibility was determined using predefined criteria outlined in <xref ref-type="table" rid="table2">Table 2</xref>. The review decision matrix applied these criteria to the full texts to determine whether studies reported outcomes of intraoperative bleeding prediction.</p></sec><sec id="s2-5"><title>Data Extraction and Synthesis</title><p>Data extraction was performed independently by 2 reviewers (SY and PZ) using a standardized electronic form based on the aforementioned CHARMS checklist. The reviewers extracted data on the following: (1) study characteristics (author, year, country, design, sample size, surgical type, and data source), (2) model development (candidate and final predictors, data preprocessing, and ML algorithms), and (3) model performance and validation (validation method, performance metrics such as area under the curve [AUC], sensitivity, specificity, precision, and calibration). Any discrepancies were resolved through discussion or by consultation with a third reviewer (HH). Given methodological heterogeneity across studies, including differences in algorithms, validation strategies, and outcome reporting, a narrative synthesis was used for data analysis. The primary studies in this review reported model performance metrics (eg, AUC and sensitivity) and their CIs, not traditional hypothesis-testing <italic>P</italic> values for intergroup comparisons. Therefore, <italic>P</italic> values were neither extracted nor assessed. This approach aligns with the methodological focus of prediction model research.</p></sec><sec id="s2-6"><title>Risk of Bias and Quality Assessment</title><p>The risk of bias and applicability of the included studies were rigorously assessed using the Prediction model Risk of Bias Assessment Tool (PROBAST) [<xref ref-type="bibr" rid="ref17">17</xref>]. PROBAST tool covers 4 domains&#x2014;participants, predictors, outcome, and analysis. Furthermore, 2 reviewers (SY and PZ) independently assessed each study, with disagreements resolved by consensus or consultation with a third researcher (HH). The results of this assessment are summarized descriptively in the Results section.</p></sec><sec id="s2-7"><title>Ethical Considerations</title><p>This study did not require ethical approval. We did not study any human or animal subjects, and we did not collect personal information or sensitive data.</p></sec></sec><sec id="s3" sec-type="results"><title>Results</title><sec id="s3-1"><title>Search Results</title><p>The systematic search initially identified 2651 records. After removing 143 duplicates, 2508 records were screened based on titles and abstracts. Of these, 2429 records were excluded. The full texts of the remaining 79 articles were assessed for eligibility, of which 56 were excluded for reasons detailed in <xref ref-type="fig" rid="figure1">Figure 1</xref>. Consequently, 23 studies [<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref12">12</xref>,<xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref18">18</xref>-<xref ref-type="bibr" rid="ref37">37</xref>] met the inclusion criteria and were included in this scoping review (<xref ref-type="fig" rid="figure1">Figure 1</xref>).</p><fig position="float" id="figure1"><label>Figure 1.</label><caption><p>Flow diagram of the review process and the identification of studies via databases. ML: machine learning.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="medinform_v14i1e80930_fig01.png"/></fig></sec><sec id="s3-2"><title>Characteristics of Included Studies</title><p>The detailed characteristics of the 23 included studies [<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref12">12</xref>,<xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref18">18</xref>-<xref ref-type="bibr" rid="ref37">37</xref>] are presented in <xref ref-type="table" rid="table3">Table 3</xref>. The sample sizes varied widely, ranging from 48 to 48,543 cases. All studies were retrospective in design, with 17 (74%) [<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref20">20</xref>,<xref ref-type="bibr" rid="ref21">21</xref>,<xref ref-type="bibr" rid="ref23">23</xref>-<xref ref-type="bibr" rid="ref31">31</xref>,<xref ref-type="bibr" rid="ref33">33</xref>-<xref ref-type="bibr" rid="ref37">37</xref>] being single-center investigations. The publication years were concentrated between 2019 and 2025, and the geographical distribution was highly skewed, with studies from China dominating (17/23, 74% [<xref ref-type="bibr" rid="ref12">12</xref>,<xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref20">20</xref>-<xref ref-type="bibr" rid="ref22">22</xref>,<xref ref-type="bibr" rid="ref24">24</xref>,<xref ref-type="bibr" rid="ref26">26</xref>,<xref ref-type="bibr" rid="ref27">27</xref>,<xref ref-type="bibr" rid="ref29">29</xref>-<xref ref-type="bibr" rid="ref37">37</xref>]). The main surgical contexts were obstetric procedures (10/23, 43% [<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref12">12</xref>,<xref ref-type="bibr" rid="ref18">18</xref>,<xref ref-type="bibr" rid="ref21">21</xref>,<xref ref-type="bibr" rid="ref27">27</xref>,<xref ref-type="bibr" rid="ref29">29</xref>,<xref ref-type="bibr" rid="ref32">32</xref>,<xref ref-type="bibr" rid="ref34">34</xref>,<xref ref-type="bibr" rid="ref36">36</xref>,<xref ref-type="bibr" rid="ref37">37</xref>]), orthopedic surgery (4/23, 17% [<xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref19">19</xref>,<xref ref-type="bibr" rid="ref26">26</xref>,<xref ref-type="bibr" rid="ref31">31</xref>]), and hepato-biliary surgery (4/23, 17% [<xref ref-type="bibr" rid="ref20">20</xref>,<xref ref-type="bibr" rid="ref23">23</xref>,<xref ref-type="bibr" rid="ref30">30</xref>,<xref ref-type="bibr" rid="ref35">35</xref>]). Considerable heterogeneity was observed in the definitions of intraoperative major bleeding across studies, ranging from &#x2265;200 mL to &#x003E;5000 mL.</p><table-wrap id="t3" position="float"><label>Table 3.</label><caption><p>Characteristics of the included studies (n=23).</p></caption><table id="table3" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Author, year</td><td align="left" valign="bottom">Country</td><td align="left" valign="bottom">Study design</td><td align="left" valign="bottom">Surgical type (Specific procedure)</td><td align="left" valign="bottom">Sample size (Development/Validation)</td><td align="left" valign="bottom">Data source</td><td align="left" valign="bottom">EBL<sup><xref ref-type="table-fn" rid="table3fn1">a</xref></sup> definition</td></tr></thead><tbody><tr><td align="left" valign="top">Akazawa and Hashimoto [<xref ref-type="bibr" rid="ref10">10</xref>], 2023</td><td align="left" valign="top">Japan</td><td align="left" valign="top">Single-Center Retrospective Cohort Study</td><td align="left" valign="top">Obstetric (Cesarean section)</td><td align="left" valign="top">48</td><td align="left" valign="top">MRI<sup><xref ref-type="table-fn" rid="table3fn2">b</xref></sup> + EMR<sup><xref ref-type="table-fn" rid="table3fn3">c</xref></sup></td><td align="left" valign="top">&#x2265;2000 mL</td></tr><tr><td align="left" valign="top">Akazawa and Hashimoto [<xref ref-type="bibr" rid="ref18">18</xref>], 2024</td><td align="left" valign="top">Japan</td><td align="left" valign="top">Multi-Center Retrospective Cohort Study</td><td align="left" valign="top">Obstetric (Cesarean section)</td><td align="left" valign="top">63 (50/13)</td><td align="left" valign="top">MRI + EMR</td><td align="left" valign="top">&#xFF1E;2000 mL</td></tr><tr><td align="left" valign="top">Chen et al [<xref ref-type="bibr" rid="ref12">12</xref>], 2024</td><td align="left" valign="top">China</td><td align="left" valign="top">Multi-Center Retrospective Cohort Study</td><td align="left" valign="top">Obstetric (Cesarean section)</td><td align="left" valign="top">1975 (1680/295)</td><td align="left" valign="top">EMR</td><td align="left" valign="top">&#x2265;300 mL</td></tr><tr><td align="left" valign="top">de Reus DC et al [<xref ref-type="bibr" rid="ref19">19</xref>], 2025</td><td align="left" valign="top">United States, Netherlands, and United Kingdom</td><td align="left" valign="top">Multi-center Retrospective Cohort Study</td><td align="left" valign="top">Orthopedic (Spinal decompression)</td><td align="left" valign="top">880</td><td align="left" valign="top">EMR</td><td align="left" valign="top">&#x003E;2500 mL</td></tr><tr><td align="left" valign="top">Li et al [<xref ref-type="bibr" rid="ref20">20</xref>], 2024</td><td align="left" valign="top">China</td><td align="left" valign="top">Single-Center Retrospective Study</td><td align="left" valign="top">Hepatic (Tumor resection)</td><td align="left" valign="top">406 (284/122)</td><td align="left" valign="top">EMR</td><td align="left" valign="top">&#x2265;1000 mL</td></tr><tr><td align="left" valign="top">Liu et al [<xref ref-type="bibr" rid="ref21">21</xref>], 2020</td><td align="left" valign="top">China</td><td align="left" valign="top">Single-Center Retrospective Study</td><td align="left" valign="top">Obstetric (Cesarean section)</td><td align="left" valign="top">210</td><td align="left" valign="top">MRI</td><td align="left" valign="top">&#x2265;500 mL</td></tr><tr><td align="left" valign="top">Mo et al [<xref ref-type="bibr" rid="ref22">22</xref>], 2023</td><td align="left" valign="top">China</td><td align="left" valign="top">Multi-center Retrospective Study</td><td align="left" valign="top">Gynecological (Hysteroscopic surgery)</td><td align="left" valign="top">200 (120/80)</td><td align="left" valign="top">EMR</td><td align="left" valign="top">&#x2265;200 mL</td></tr><tr><td align="left" valign="top">Park et al [<xref ref-type="bibr" rid="ref23">23</xref>], 2022</td><td align="left" valign="top">South Korea</td><td align="left" valign="top">Single-Center Retrospective Study</td><td align="left" valign="top">Hepatic (Transplantation)</td><td align="left" valign="top">414</td><td align="left" valign="top">EMR</td><td align="left" valign="top">&#x2265;5000 mL</td></tr><tr><td align="left" valign="top">Shi et al [<xref ref-type="bibr" rid="ref13">13</xref>], 2024</td><td align="left" valign="top">China</td><td align="left" valign="top">Multi-center Observational Cohort Study</td><td align="left" valign="top">Orthopedic (Spinal decompression)</td><td align="left" valign="top">276 (200/76)</td><td align="left" valign="top">EMR</td><td align="left" valign="top">&#x2265;2500 mL</td></tr><tr><td align="left" valign="top">Shi et al [<xref ref-type="bibr" rid="ref24">24</xref>], 2023</td><td align="left" valign="top">China</td><td align="left" valign="top">Single-Center Retrospective Cohort Study</td><td align="left" valign="top">Multi-departmental surgeries</td><td align="left" valign="top">48,543</td><td align="left" valign="top">EMR</td><td align="left" valign="top">&#x003E;200 mL</td></tr><tr><td align="left" valign="top">Stehrer et al [<xref ref-type="bibr" rid="ref25">25</xref>], 2019</td><td align="left" valign="top">Austria</td><td align="left" valign="top">Single-Center Retrospective Study</td><td align="left" valign="top">Craniofacial (Orthognathic surgery)</td><td align="left" valign="top">950 (760/190)</td><td align="left" valign="top">EMR</td><td align="left" valign="top">Calculated using hemoglobin balance method</td></tr><tr><td align="left" valign="top">Sun et al [<xref ref-type="bibr" rid="ref26">26</xref>], 2025</td><td align="left" valign="top">China</td><td align="left" valign="top">Single-Center Retrospective Study</td><td align="left" valign="top">Orthopedic (Lumbar fusion)</td><td align="left" valign="top">2054 (1437/617)</td><td align="left" valign="top">EMR</td><td align="left" valign="top">&#x2265;500 mL</td></tr><tr><td align="left" valign="top">Wang [<xref ref-type="bibr" rid="ref27">27</xref>], 2023</td><td align="left" valign="top">China</td><td align="left" valign="top">Single-Center Retrospective Study</td><td align="left" valign="top">Obstetric (Cesarean section)</td><td align="left" valign="top">168 (117/51)</td><td align="left" valign="top">EMR</td><td align="left" valign="top">&#x003E;1000 mL</td></tr><tr><td align="left" valign="top">Wakiya et al [<xref ref-type="bibr" rid="ref28">28</xref>], 2021</td><td align="left" valign="top">Japan</td><td align="left" valign="top">Single-Center Retrospective Cohort Study</td><td align="left" valign="top">General (Pancreatic cancer resection)</td><td align="left" valign="top">175 (128/47)</td><td align="left" valign="top">EMR</td><td align="left" valign="top">&#x003E;20% of circulating blood volume</td></tr><tr><td align="left" valign="top">Xu [<xref ref-type="bibr" rid="ref29">29</xref>], 2024</td><td align="left" valign="top">China</td><td align="left" valign="top">Single-Center Retrospective Study</td><td align="left" valign="top">Obstetric (Cesarean section)</td><td align="left" valign="top">249 (149/50/50)</td><td align="left" valign="top">MRI + EMR</td><td align="left" valign="top">&#x2265;1000 mL</td></tr><tr><td align="left" valign="top">Xue et al [<xref ref-type="bibr" rid="ref30">30</xref>], 2021</td><td align="left" valign="top">China</td><td align="left" valign="top">Single-Center Retrospective Study</td><td align="left" valign="top">Hepatic (Tumor resection)</td><td align="left" valign="top">665 (466/199)</td><td align="left" valign="top">EMR</td><td align="left" valign="top">&#x2265;800 mL</td></tr><tr><td align="left" valign="top">Yang et al [<xref ref-type="bibr" rid="ref31">31</xref>], 2022</td><td align="left" valign="top">China</td><td align="left" valign="top">Single-Center Retrospective Study</td><td align="left" valign="top">Orthopedic (Spinal fracture)</td><td align="left" valign="top">161</td><td align="left" valign="top">EMR</td><td align="left" valign="top">Hidden blood loss (no explicit quantitative threshold)</td></tr><tr><td align="left" valign="top">Yang et al [<xref ref-type="bibr" rid="ref32">32</xref>], 2023</td><td align="left" valign="top">China</td><td align="left" valign="top">Multi-center Retrospective Cohort Study</td><td align="left" valign="top">Obstetric (Cesarean section)</td><td align="left" valign="top">125 (85/40)</td><td align="left" valign="top">MRI + EMR</td><td align="left" valign="top">&#x2265;1500 mL</td></tr><tr><td align="left" valign="top">Yin et al [<xref ref-type="bibr" rid="ref33">33</xref>], 2021</td><td align="left" valign="top">China</td><td align="left" valign="top">Single-Center Retrospective Study</td><td align="left" valign="top">Oncological (Pelvic/sacral tumors)</td><td align="left" valign="top">810</td><td align="left" valign="top">CT<sup><xref ref-type="table-fn" rid="table3fn4">d</xref></sup> + EMR</td><td align="left" valign="top">&#x003E;3000 mL</td></tr><tr><td align="left" valign="top">Zheng et al [<xref ref-type="bibr" rid="ref34">34</xref>], 2024</td><td align="left" valign="top">China</td><td align="left" valign="top">Single-Center Retrospective Study</td><td align="left" valign="top">Obstetric (Cesarean section)</td><td align="left" valign="top">346 (156/68/122)</td><td align="left" valign="top">MRI + Coagulation tests + EMR</td><td align="left" valign="top">&#x003E;1000 mL</td></tr><tr><td align="left" valign="top">Zheng et al [<xref ref-type="bibr" rid="ref35">35</xref>], 2022</td><td align="left" valign="top">China</td><td align="left" valign="top">Single-Center Retrospective Study</td><td align="left" valign="top">Hepatic (Tumor resection)</td><td align="left" valign="top">336 (268/68)</td><td align="left" valign="top">EMR</td><td align="left" valign="top">&#x2265;300 mL</td></tr><tr><td align="left" valign="top">Zong et al [<xref ref-type="bibr" rid="ref36">36</xref>], 2024</td><td align="left" valign="top">China</td><td align="left" valign="top">Single-Center Retrospective Cohort Study</td><td align="left" valign="top">Obstetric (Cesarean section)</td><td align="left" valign="top">323 (227/96)</td><td align="left" valign="top">MRI + EMR</td><td align="left" valign="top">&#x2265;1500 mL</td></tr><tr><td align="left" valign="top">Li [<xref ref-type="bibr" rid="ref37">37</xref>], 2024</td><td align="left" valign="top">China</td><td align="left" valign="top">Single-Center Retrospective Case-Control Study</td><td align="left" valign="top">Obstetric (Cesarean section)</td><td align="left" valign="top">231</td><td align="left" valign="top">EMR</td><td align="left" valign="top">&#x2265;1500 mL</td></tr></tbody></table><table-wrap-foot><fn id="table3fn1"><p><sup>a</sup>EBL: estimated blood loss.</p></fn><fn id="table3fn2"><p><sup>b</sup>MRI: magnetic resonance imaging.</p></fn><fn id="table3fn3"><p><sup>c</sup>EMR: electronic medical record.</p></fn><fn id="table3fn4"><p><sup>d</sup>CT: computed tomography.</p></fn></table-wrap-foot></table-wrap></sec><sec id="s3-3"><title>Technical Features and Performance of Prediction Models</title><p>All models were based on electronic health records (EHRs). A total of 8 studies (35%) [<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref18">18</xref>,<xref ref-type="bibr" rid="ref21">21</xref>,<xref ref-type="bibr" rid="ref29">29</xref>,<xref ref-type="bibr" rid="ref32">32</xref>-<xref ref-type="bibr" rid="ref34">34</xref>,<xref ref-type="bibr" rid="ref36">36</xref>] further integrated medical imaging data, including magnetic resonance imaging (MRI) or computed tomography, of which 7 (30%) [<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref18">18</xref>,<xref ref-type="bibr" rid="ref21">21</xref>,<xref ref-type="bibr" rid="ref29">29</xref>,<xref ref-type="bibr" rid="ref32">32</xref>,<xref ref-type="bibr" rid="ref34">34</xref>,<xref ref-type="bibr" rid="ref36">36</xref>] focused on predicting obstetric bleeding. In terms of algorithms, tree-based ensemble models were most frequently applied (12/23, 52% [<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref12">12</xref>,<xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref23">23</xref>-<xref ref-type="bibr" rid="ref25">25</xref>,<xref ref-type="bibr" rid="ref27">27</xref>,<xref ref-type="bibr" rid="ref30">30</xref>-<xref ref-type="bibr" rid="ref32">32</xref>,<xref ref-type="bibr" rid="ref35">35</xref>,<xref ref-type="bibr" rid="ref37">37</xref>]), especially random forests (8/23, 34% [<xref ref-type="bibr" rid="ref12">12</xref>,<xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref23">23</xref>,<xref ref-type="bibr" rid="ref25">25</xref>,<xref ref-type="bibr" rid="ref27">27</xref>,<xref ref-type="bibr" rid="ref31">31</xref>,<xref ref-type="bibr" rid="ref32">32</xref>,<xref ref-type="bibr" rid="ref35">35</xref>]) and extreme gradient boosting (9/23, 39% [<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref12">12</xref>,<xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref23">23</xref>,<xref ref-type="bibr" rid="ref24">24</xref>,<xref ref-type="bibr" rid="ref30">30</xref>,<xref ref-type="bibr" rid="ref32">32</xref>,<xref ref-type="bibr" rid="ref37">37</xref>]); logistic regression (13/23, 57% [<xref ref-type="bibr" rid="ref12">12</xref>,<xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref18">18</xref>,<xref ref-type="bibr" rid="ref20">20</xref>,<xref ref-type="bibr" rid="ref23">23</xref>,<xref ref-type="bibr" rid="ref24">24</xref>,<xref ref-type="bibr" rid="ref26">26</xref>,<xref ref-type="bibr" rid="ref27">27</xref>,<xref ref-type="bibr" rid="ref30">30</xref>-<xref ref-type="bibr" rid="ref33">33</xref>,<xref ref-type="bibr" rid="ref37">37</xref>]) and deep learning (6/23, 26% [<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref21">21</xref>,<xref ref-type="bibr" rid="ref22">22</xref>,<xref ref-type="bibr" rid="ref30">30</xref>,<xref ref-type="bibr" rid="ref33">33</xref>,<xref ref-type="bibr" rid="ref36">36</xref>]) models were also commonly used. Model discrimination performance is illustrated in <xref ref-type="table" rid="table4">Table 4</xref>. The AUC ranged from 0.63 to 0.93, with a mean of 0.82 (SD 0.08). Models incorporating multimodal data (eg, EHR+imaging) showed a performance advantage (mean AUC&#x2248;0.84, SD 0.075) over unimodal models relying solely on EHR (mean AUC&#x2248;0.82, SD 0.069). For instance, the support vector machine model by Xu [<xref ref-type="bibr" rid="ref29">29</xref>], which fused MRI radiomic features with clinical data, achieved an AUC of 0.87.</p><table-wrap id="t4" position="float"><label>Table 4.</label><caption><p>Characteristics and validation performance of ML<sup><xref ref-type="table-fn" rid="table4fn1">a</xref></sup> prediction models in included studies (n=23).</p></caption><table id="table4" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Author</td><td align="left" valign="bottom">Predictors categories</td><td align="left" valign="bottom">ML algorithms</td><td align="left" valign="bottom">Best model</td><td align="left" valign="bottom">Internal validation (test set performance)</td><td align="left" valign="bottom">External validation performance</td><td align="left" valign="bottom">Validation methods</td></tr></thead><tbody><tr><td align="left" valign="top">Akazawa and Hashimoto [<xref ref-type="bibr" rid="ref10">10</xref>]</td><td align="left" valign="top">MRI<sup><xref ref-type="table-fn" rid="table4fn2">b</xref></sup>, laboratory parameters, demographic characteristics</td><td align="left" valign="top">Multimodal DL<sup><xref ref-type="table-fn" rid="table4fn3">c</xref></sup>, XGBoost<sup><xref ref-type="table-fn" rid="table4fn4">d</xref></sup>, VGG16<sup><xref ref-type="table-fn" rid="table4fn5">e</xref></sup></td><td align="left" valign="top">Multimodal DL</td><td align="left" valign="top">AUC<sup><xref ref-type="table-fn" rid="table4fn6">f</xref></sup>=0.73 (95% CI 0.66&#x2010;0.80), Accuracy=0.68</td><td align="left" valign="top">Not reported</td><td align="left" valign="top">Random split (8:2), cross-validation</td></tr><tr><td align="left" valign="top">Akazawa and Hashimoto [<xref ref-type="bibr" rid="ref18">18</xref>]</td><td align="left" valign="top">Radiomics features, clinical variables</td><td align="left" valign="top">LR<sup><xref ref-type="table-fn" rid="table4fn7">g</xref></sup></td><td align="left" valign="top">LR</td><td align="left" valign="top">AUC=0.69 (95% CI 0.62&#x2010;0.75)</td><td align="left" valign="top">AUC=0.70 (95% CI 0.66&#x2010;0.73)</td><td align="left" valign="top">Internal: random split (7:3), external: another institution</td></tr><tr><td align="left" valign="top">Chen et al [<xref ref-type="bibr" rid="ref12">12</xref>]</td><td align="left" valign="top">Clinical variables</td><td align="left" valign="top">Bayes<sup><xref ref-type="table-fn" rid="table4fn8">h</xref></sup>, MLP<sup><xref ref-type="table-fn" rid="table4fn9">i</xref></sup>, DT<sup><xref ref-type="table-fn" rid="table4fn10">j</xref></sup>, KNN<sup><xref ref-type="table-fn" rid="table4fn11">k</xref></sup>, LR, RF<sup><xref ref-type="table-fn" rid="table4fn12">l</xref></sup>, SVM<sup><xref ref-type="table-fn" rid="table4fn13">m</xref></sup>, XGBoost</td><td align="left" valign="top">Bayes</td><td align="left" valign="top">AUC=0.82 (95% CI 0.80&#x2010;0.84), Sensitivity=0.93, Specificity=0.42, <italic>F</italic> score=0.92</td><td align="left" valign="top">AUC=0.85 (95% CI 0.83&#x2010;0.87), Sensitivity=0.95, Specificity=0.50, <italic>F</italic> score=0.96</td><td align="left" valign="top">Internal validation: 10-fold cross-validation, (8:2 split), multicenter external validation</td></tr><tr><td align="left" valign="top">de Reus DC et al [<xref ref-type="bibr" rid="ref19">19</xref>]</td><td align="left" valign="top">Tumor type, ECOG<sup><xref ref-type="table-fn" rid="table4fn14">n</xref></sup> score, surgical procedure, preoperative platelet count</td><td align="left" valign="top">Not reported</td><td align="left" valign="top">Not reported</td><td align="left" valign="top">Not reported</td><td align="left" valign="top">AUC=0.63 (95% CI 0.58&#x2010;0.68), Sensitivity=0.74, Specificity=0.41, <italic>F</italic> score=0.33</td><td align="left" valign="top">Multicenter external validation</td></tr><tr><td align="left" valign="top">Li et al [<xref ref-type="bibr" rid="ref20">20</xref>]</td><td align="left" valign="top">Demographic characteristics, laboratory parameters, imaging characteristics, pathological characteristics</td><td align="left" valign="top">LR</td><td align="left" valign="top">LR</td><td align="left" valign="top">AUC=0.80</td><td align="left" valign="top">Not reported</td><td align="left" valign="top">Random split (training set:test set=7:3)</td></tr><tr><td align="left" valign="top">Liu et al [<xref ref-type="bibr" rid="ref21">21</xref>]</td><td align="left" valign="top">MRI</td><td align="left" valign="top">DL</td><td align="left" valign="top">VGG16</td><td align="left" valign="top">Accuracy=0.75, Sensitivity=0.73, Specificity=0.77</td><td align="left" valign="top">Not reported</td><td align="left" valign="top">5-fold cross-validation</td></tr><tr><td align="left" valign="top">Mo et al [<xref ref-type="bibr" rid="ref22">22</xref>]</td><td align="left" valign="top">Clinical variables</td><td align="left" valign="top">DNN<sup><xref ref-type="table-fn" rid="table4fn15">o</xref></sup></td><td align="left" valign="top">DNN</td><td align="left" valign="top">Accuracy=0.91, Sensitivity=0.89, Specificity=0.92, Precision=0.92</td><td align="left" valign="top">Not reported</td><td align="left" valign="top">Training:test=6:4</td></tr><tr><td align="left" valign="top">Park et al [<xref ref-type="bibr" rid="ref23">23</xref>]</td><td align="left" valign="top">Laboratory parameters, surgical parameters, MELD<sup><xref ref-type="table-fn" rid="table4fn16">p</xref></sup> score, demographic characteristics</td><td align="left" valign="top">LR, Elastic Net, SVM, RF, XGBoost, NN<sup><xref ref-type="table-fn" rid="table4fn17">q</xref></sup></td><td align="left" valign="top">LR</td><td align="left" valign="top">AUROC<sup><xref ref-type="table-fn" rid="table4fn18">r</xref></sup>=0.84, AUPR<sup><xref ref-type="table-fn" rid="table4fn19">s</xref></sup>=0.82</td><td align="left" valign="top">Not reported</td><td align="left" valign="top">Training:test=7:3, feature selection via nested cross-validation</td></tr><tr><td align="left" valign="top">Shi et al [<xref ref-type="bibr" rid="ref13">13</xref>]</td><td align="left" valign="top">Tumor type, ECOG score, surgical procedure, preoperative platelet count</td><td align="left" valign="top">LR, KNN, DT, XGBoost, RF, SVM</td><td align="left" valign="top">XGBoost</td><td align="left" valign="top">AUC=0.85 (95% CI 0.82&#x2010;0.87), Accuracy=0.77, Recall=0.85, <italic>F</italic> score=0.78, Precision=0.72</td><td align="left" valign="top">AUC=0.80(95% CI 0.77&#x2010;0.86), Accuracy=0.73, Recall=0.73,<break/><italic>F</italic> score=0.73, Precision=0.73</td><td align="left" valign="top">Internal validation: random split (7:3 ratio),<break/>external validation: independent cohort</td></tr><tr><td align="left" valign="top">Shi et al [<xref ref-type="bibr" rid="ref24">24</xref>]</td><td align="left" valign="top">Surgical parameters, laboratory parameters, demographic characteristics</td><td align="left" valign="top">LGB<sup><xref ref-type="table-fn" rid="table4fn20">t</xref></sup>, XGBoost, CatB<sup><xref ref-type="table-fn" rid="table4fn21">u</xref></sup>, AdaB<sup><xref ref-type="table-fn" rid="table4fn22">v</xref></sup>, LR, LSTM<sup><xref ref-type="table-fn" rid="table4fn23">w</xref></sup>, MLP</td><td align="left" valign="top">LGB</td><td align="left" valign="top">AUC=0.93, Accuracy=0.87, Sensitivity=0.8, Specificity=0.85</td><td align="left" valign="top">Not reported</td><td align="left" valign="top">Training:test =2:1, ADASYN<sup><xref ref-type="table-fn" rid="table4fn24">x</xref></sup> was used to address data imbalance</td></tr><tr><td align="left" valign="top">Stehrer et al [<xref ref-type="bibr" rid="ref25">25</xref>]</td><td align="left" valign="top">Surgical parameters, laboratory parameters, demographic characteristics</td><td align="left" valign="top">RF</td><td align="left" valign="top">RF</td><td align="left" valign="top">Regression performance: significant correlation between predicted and actual values; mean error 7.4 (SD 172.3) mL</td><td align="left" valign="top">Not reported</td><td align="left" valign="top">Random split (training:test=8:2), performance evaluation: correlation and mean error between predicted and actual values</td></tr><tr><td align="left" valign="top">Sun et al [<xref ref-type="bibr" rid="ref26">26</xref>]</td><td align="left" valign="top">Surgical parameters, laboratory parameters, demographic characteristics</td><td align="left" valign="top">LR</td><td align="left" valign="top">LR</td><td align="left" valign="top">AUC=0.73 (95% CI 0.67&#x2010;0.79), Accuracy=0.88</td><td align="left" valign="top">Not reported</td><td align="left" valign="top">Random split (training set:test set=7:3), 5-fold cross-validation</td></tr><tr><td align="left" valign="top">Wang [<xref ref-type="bibr" rid="ref27">27</xref>]</td><td align="left" valign="top">Radiomics features, clinical variables</td><td align="left" valign="top">LR, SVM, RF, SGD<sup><xref ref-type="table-fn" rid="table4fn25">y</xref></sup>, KNN</td><td align="left" valign="top">LR</td><td align="left" valign="top">AUC=0.83, Accuracy=0.80, Sensitivity=0.75, Specificity=0.83</td><td align="left" valign="top">Not reported</td><td align="left" valign="top">Random split (training set:test set=7:3), 5-fold cross-validation</td></tr><tr><td align="left" valign="top">Wakiya et al [<xref ref-type="bibr" rid="ref28">28</xref>]</td><td align="left" valign="top">Surgical parameters, laboratory parameters, tumor markers</td><td align="left" valign="top">DT</td><td align="left" valign="top">DT</td><td align="left" valign="top">Accuracy=0.80, Sensitivity=1, Specificity=0.66</td><td align="left" valign="top">Not reported</td><td align="left" valign="top">Random split (training set:test set=3:1)</td></tr><tr><td align="left" valign="top">Xu [<xref ref-type="bibr" rid="ref29">29</xref>]</td><td align="left" valign="top">Radiomics features, clinical features</td><td align="left" valign="top">SVM</td><td align="left" valign="top">SVM</td><td align="left" valign="top">AUC=0.87, Accuracy=0.85, Sensitivity=0.72, Specificity=0.89</td><td align="left" valign="top">Not reported</td><td align="left" valign="top">Random split: training:validation:test=6:2:2</td></tr><tr><td align="left" valign="top">Xue et al [<xref ref-type="bibr" rid="ref30">30</xref>]</td><td align="left" valign="top">Laboratory parameters</td><td align="left" valign="top">LR, DT, XGBoost, CNN<sup><xref ref-type="table-fn" rid="table4fn26">z</xref></sup>, LSTM</td><td align="left" valign="top">XGBoost</td><td align="left" valign="top">AUC=0.72, Accuracy=0.87, Precision=1, Recall=0.18, <italic>F</italic> score=0.31</td><td align="left" valign="top">Not reported</td><td align="left" valign="top">Random split (training set:test set=7:3), 5-fold cross-validation</td></tr><tr><td align="left" valign="top">Yang et al [<xref ref-type="bibr" rid="ref31">31</xref>]</td><td align="left" valign="top">Demographic characteristics, surgical parameters, laboratory parameters</td><td align="left" valign="top">XGBoost, LR, LGBM, RF, SVM</td><td align="left" valign="top">RF</td><td align="left" valign="top">AUC=0.86, Accuracy=0.78, Sensitivity=0.86, Specificity=0.81</td><td align="left" valign="top">Not reported</td><td align="left" valign="top">Random split into training and internal validation sets; 15-fold cross-validation conducted on the training set</td></tr><tr><td align="left" valign="top">Yang et al [<xref ref-type="bibr" rid="ref32">32</xref>]</td><td align="left" valign="top">MRI-anatomical-clinical features, morphological features</td><td align="left" valign="top">LR, SVM, RF, XGBoost</td><td align="left" valign="top">XGBoost</td><td align="left" valign="top">AUROC=0.88 (95% CI 0.74&#x2010;1.00), Accuracy=0.85, Sensitivity=0.90, Specificity=0.81</td><td align="left" valign="top">AUROC=0.82 (95% CI 0.68&#x2010;0.96), Accuracy=0.78, Sensitivity=0.81, Specificity=0.75</td><td align="left" valign="top">Data from 2 medical centers</td></tr><tr><td align="left" valign="top">Yin et al [<xref ref-type="bibr" rid="ref33">33</xref>]</td><td align="left" valign="top">CT<sup><xref ref-type="table-fn" rid="table4fn28">ab</xref></sup>-based radiomics features, clinical factors</td><td align="left" valign="top">DNN, LR</td><td align="left" valign="top">DNN</td><td align="left" valign="top">AUC=0.92, Accuracy=0.75, Sensitivity=0.30, Specificity=0.83</td><td align="left" valign="top">Not reported</td><td align="left" valign="top">Random split (training set:test set=7:3), temporal split, class imbalance handling: SMOTE<sup><xref ref-type="table-fn" rid="table4fn27">aa</xref></sup></td></tr><tr><td align="left" valign="top">Zheng et al [<xref ref-type="bibr" rid="ref34">34</xref>]</td><td align="left" valign="top">Radiomics features, clinical factors, laboratory parameters</td><td align="left" valign="top">SVM</td><td align="left" valign="top">SVM</td><td align="left" valign="top">AUC=0.87 (95% CI 0.76&#x2010;0.94), Accuracy=0.76, Sensitivity=1, Specificity=0.65</td><td align="left" valign="top">AUC=0.81 (95% CI 0.72&#x2010;0.87), Accuracy=0.79, Sensitivity=0.87, Specificity=0.65</td><td align="left" valign="top">Center 1: partitioned into training and internal test sets.<break/>Center 2: designated as the external test set.</td></tr><tr><td align="left" valign="top">Zheng et al [<xref ref-type="bibr" rid="ref35">35</xref>]</td><td align="left" valign="top">Tumor characteristics, surgical parameters, laboratory parameters</td><td align="left" valign="top">RF, MDN<sup><xref ref-type="table-fn" rid="table4fn29">ac</xref></sup></td><td align="left" valign="top">RF</td><td align="left" valign="top">AUC=0.79 (95% CI 0.65&#x2010;0.93), Accuracy=0.82</td><td align="left" valign="top">Not reported</td><td align="left" valign="top">Random split (training set:test set=8:2), bootstrap</td></tr><tr><td align="left" valign="top">Zong et al [<xref ref-type="bibr" rid="ref36">36</xref>]</td><td align="left" valign="top">Multiparametric MRI</td><td align="left" valign="top">DL</td><td align="left" valign="top">MS-3D-ResNet<sup><xref ref-type="table-fn" rid="table4fn30">ad</xref></sup></td><td align="left" valign="top">AUC=0.87 (95% CI 0.86&#x2010;0.89), Accuracy=0.85, Sensitivity=0.86, Specificity=0.85</td><td align="left" valign="top">Not reported</td><td align="left" valign="top">Random split (training set:test set=7:3)</td></tr><tr><td align="left" valign="top">Li [<xref ref-type="bibr" rid="ref37">37</xref>]</td><td align="left" valign="top">Clinical risk factors in obstetrics</td><td align="left" valign="top">LR, DT, KNN, BPNN<sup><xref ref-type="table-fn" rid="table4fn31">ae</xref></sup>, XGBoost, LGBM</td><td align="left" valign="top">LR</td><td align="left" valign="top">AUC=0.88 (95% CI 0.83&#x2010;0.92), Accuracy=0.77, Sensitivity=0.84, Specificity=0.67, PPV<sup><xref ref-type="table-fn" rid="table4fn32">af</xref></sup>=0.78, NPV<sup><xref ref-type="table-fn" rid="table4fn33">ag</xref></sup>=0.75</td><td align="left" valign="top">Not reported</td><td align="left" valign="top">5-fold cross-validation</td></tr></tbody></table><table-wrap-foot><fn id="table4fn1"><p><sup>a</sup>ML: machine learning.</p></fn><fn id="table4fn2"><p><sup>b</sup>MRI: magnetic resonance imaging.</p></fn><fn id="table4fn3"><p><sup>c</sup>DL: deep learning.</p></fn><fn id="table4fn4"><p><sup>d</sup>XGBoost: extreme gradient boosting.</p></fn><fn id="table4fn5"><p><sup>e</sup>VGG-16: visual geometry group - 16 layers.</p></fn><fn id="table4fn6"><p><sup>f</sup>AUC: area under the curve.</p></fn><fn id="table4fn7"><p><sup>g</sup>LR: logistic regression.</p></fn><fn id="table4fn8"><p><sup>h</sup>Bayes: na&#x00EF;ve Bayes.</p></fn><fn id="table4fn9"><p><sup>i</sup>MLP: multilayer perceptron.</p></fn><fn id="table4fn10"><p><sup>j</sup>DT: decision tree.</p></fn><fn id="table4fn11"><p><sup>k</sup>KNN: k-nearest neighbors.</p></fn><fn id="table4fn12"><p><sup>l</sup>RF: random forest.</p></fn><fn id="table4fn13"><p><sup>m</sup>SVM: support vector machine.</p></fn><fn id="table4fn14"><p><sup>n</sup>ECOG: eastern cooperative oncology group.</p></fn><fn id="table4fn15"><p><sup>o</sup>DNN: deep neural network.</p></fn><fn id="table4fn16"><p><sup>p</sup>MELD: model for end-stage liver disease.</p></fn><fn id="table4fn17"><p><sup>q</sup>NN: neural network.</p></fn><fn id="table4fn18"><p><sup>r</sup>AUROC: area under receiver operating characteristic curve.</p></fn><fn id="table4fn19"><p><sup>s</sup>AUPR: area under the precision versus recall curve.</p></fn><fn id="table4fn20"><p><sup>t</sup>LGB: light gradient boosting machine (LightGBM).</p></fn><fn id="table4fn21"><p><sup>u</sup>CatB: categorical boosting (CatBoost).</p></fn><fn id="table4fn22"><p><sup>v</sup>AdaB: adaptive boosting (AdaBoost).</p></fn><fn id="table4fn23"><p><sup>w</sup>LSTM: long short-term memory.</p></fn><fn id="table4fn24"><p><sup>x</sup>ADASYN: adaptive synthetic sampling.</p></fn><fn id="table4fn25"><p><sup>y</sup>SGD: stochastic gradient descent.</p></fn><fn id="table4fn26"><p><sup>z</sup>CNN: convolutional neural networks.</p></fn><fn id="table4fn27"><p><sup>aa</sup>SMOTE: synthetic minority over-sampling technique.</p></fn><fn id="table4fn28"><p><sup>ab</sup>CT: computed tomography.</p></fn><fn id="table4fn29"><p><sup>ac</sup>MDN: mixture density network.</p></fn><fn id="table4fn30"><p><sup>ad</sup>MS-3D-ResNet: multi-stream 3D residual network.</p></fn><fn id="table4fn31"><p><sup>ae</sup>BPNN: back propagation neural network.</p></fn><fn id="table4fn32"><p><sup>af</sup>PPV: positive predictive value.</p></fn><fn id="table4fn33"><p><sup>ag</sup>NPV: negative predictive value.</p></fn></table-wrap-foot></table-wrap></sec><sec id="s3-4"><title>Model Validation Strategies</title><p>Although internal validation was widely applied (22/23, 96% [<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref12">12</xref>,<xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref18">18</xref>,<xref ref-type="bibr" rid="ref20">20</xref>-<xref ref-type="bibr" rid="ref37">37</xref>]), its methodological rigor was insufficient (<xref ref-type="table" rid="table4">Table 4</xref>). Only half of the studies (12/23, 52% [<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref12">12</xref>,<xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref18">18</xref>,<xref ref-type="bibr" rid="ref20">20</xref>,<xref ref-type="bibr" rid="ref22">22</xref>-<xref ref-type="bibr" rid="ref27">27</xref>,<xref ref-type="bibr" rid="ref33">33</xref>]) established an independent test set to evaluate final performance; even fewer used cross-validation (9/23, 39% [<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref12">12</xref>,<xref ref-type="bibr" rid="ref21">21</xref>,<xref ref-type="bibr" rid="ref26">26</xref>,<xref ref-type="bibr" rid="ref27">27</xref>,<xref ref-type="bibr" rid="ref30">30</xref>,<xref ref-type="bibr" rid="ref31">31</xref>,<xref ref-type="bibr" rid="ref33">33</xref>,<xref ref-type="bibr" rid="ref37">37</xref>]). External validation was notably lacking, implemented in only 6 studies (26%) [<xref ref-type="bibr" rid="ref12">12</xref>,<xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref18">18</xref>,<xref ref-type="bibr" rid="ref19">19</xref>,<xref ref-type="bibr" rid="ref32">32</xref>,<xref ref-type="bibr" rid="ref34">34</xref>]. Critically, among the limited external validations, model performance generally declined. For example, the model by Shi et al [<xref ref-type="bibr" rid="ref13">13</xref>] dropped from an internal AUC of 0.85 to an external AUC of 0.80; when de Reus et al [<xref ref-type="bibr" rid="ref19">19</xref>] independently validated the same model in a multinational, multicenter setting, the AUC further decreased to 0.63.</p></sec><sec id="s3-5"><title>Completeness of Performance Metric Reporting</title><p>There was substantial selective bias in the reporting of key performance metrics (<xref ref-type="table" rid="table4">Table 4</xref>). Discrimination metrics AUC were reported most frequently (19/23, 83% [<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref12">12</xref>,<xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref18">18</xref>-<xref ref-type="bibr" rid="ref20">20</xref>,<xref ref-type="bibr" rid="ref23">23</xref>,<xref ref-type="bibr" rid="ref24">24</xref>,<xref ref-type="bibr" rid="ref26">26</xref>,<xref ref-type="bibr" rid="ref27">27</xref>,<xref ref-type="bibr" rid="ref29">29</xref>-<xref ref-type="bibr" rid="ref37">37</xref>]), whereas reporting of essential classification metrics was incomplete: sensitivity (16/23, 70% [<xref ref-type="bibr" rid="ref12">12</xref>,<xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref19">19</xref>,<xref ref-type="bibr" rid="ref21">21</xref>,<xref ref-type="bibr" rid="ref22">22</xref>,<xref ref-type="bibr" rid="ref24">24</xref>,<xref ref-type="bibr" rid="ref27">27</xref>-<xref ref-type="bibr" rid="ref34">34</xref>,<xref ref-type="bibr" rid="ref36">36</xref>,<xref ref-type="bibr" rid="ref37">37</xref>]), specificity (14/23, 61% [<xref ref-type="bibr" rid="ref12">12</xref>,<xref ref-type="bibr" rid="ref19">19</xref>,<xref ref-type="bibr" rid="ref21">21</xref>,<xref ref-type="bibr" rid="ref22">22</xref>,<xref ref-type="bibr" rid="ref24">24</xref>,<xref ref-type="bibr" rid="ref27">27</xref>-<xref ref-type="bibr" rid="ref29">29</xref>,<xref ref-type="bibr" rid="ref31">31</xref>-<xref ref-type="bibr" rid="ref34">34</xref>,<xref ref-type="bibr" rid="ref36">36</xref>,<xref ref-type="bibr" rid="ref37">37</xref>]). Reporting rates for precision (4/23, 17% [<xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref22">22</xref>,<xref ref-type="bibr" rid="ref30">30</xref>,<xref ref-type="bibr" rid="ref37">37</xref>]) and <italic>F</italic><sub>1</sub>-score (4/23, 17% [<xref ref-type="bibr" rid="ref12">12</xref>,<xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref19">19</xref>,<xref ref-type="bibr" rid="ref30">30</xref>]) were very low. Furthermore, only 10/23 (43%) [<xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref18">18</xref>,<xref ref-type="bibr" rid="ref19">19</xref>,<xref ref-type="bibr" rid="ref25">25</xref>,<xref ref-type="bibr" rid="ref26">26</xref>,<xref ref-type="bibr" rid="ref28">28</xref>,<xref ref-type="bibr" rid="ref32">32</xref>-<xref ref-type="bibr" rid="ref34">34</xref>,<xref ref-type="bibr" rid="ref36">36</xref>] of the studies reported model calibration (eg, calibration curves).</p></sec><sec id="s3-6"><title>Data Preprocessing and Interpretability</title><p>Reporting of data-preprocessing pipelines was seriously deficient (<xref ref-type="table" rid="table5">Table 5</xref>). In total, 11 studies (47%) [<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref20">20</xref>,<xref ref-type="bibr" rid="ref21">21</xref>,<xref ref-type="bibr" rid="ref23">23</xref>,<xref ref-type="bibr" rid="ref30">30</xref>-<xref ref-type="bibr" rid="ref34">34</xref>,<xref ref-type="bibr" rid="ref36">36</xref>,<xref ref-type="bibr" rid="ref37">37</xref>] did not describe any method for handling missing data. Only 3 studies (13%) [<xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref24">24</xref>,<xref ref-type="bibr" rid="ref33">33</xref>] reported strategies to address class imbalance (eg, using the synthetic minority oversampling technique [SMOTE]). The vast majority of studies neither applied nor reported any model interpretability analyses (eg, Shapley Additive Explanations [SHAP] and local interpretable model-agnostic explanations), rendering the models essentially &#x201C;black-box.&#x201D;</p><table-wrap id="t5" position="float"><label>Table 5.</label><caption><p>Summary of data preprocessing methods in included studies (n=23).</p></caption><table id="table5" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Author</td><td align="left" valign="bottom">Missing data handling</td><td align="left" valign="bottom">Class imbalance handling</td><td align="left" valign="bottom">Data normalization or standardization</td></tr></thead><tbody><tr><td align="left" valign="top">Akazawa and Hashimoto [<xref ref-type="bibr" rid="ref10">10</xref>]</td><td align="left" valign="top">Not reported</td><td align="left" valign="top">Not reported</td><td align="left" valign="top">Not reported</td></tr><tr><td align="left" valign="top">Akazawa and Hashimoto [<xref ref-type="bibr" rid="ref18">18</xref>]</td><td align="left" valign="top">Exclusion of cases with missing data</td><td align="left" valign="top">Not reported</td><td align="left" valign="top">Standardization of all radiomic features</td></tr><tr><td align="left" valign="top">Chen et al [<xref ref-type="bibr" rid="ref12">12</xref>]</td><td align="left" valign="top">Multiple imputation using MICE<sup><xref ref-type="table-fn" rid="table5fn1">a</xref></sup> package</td><td align="left" valign="top">Not reported</td><td align="left" valign="top">Standardization: numerical variables were standardized</td></tr><tr><td align="left" valign="top">de Reus DC et al [<xref ref-type="bibr" rid="ref19">19</xref>]</td><td align="left" valign="top">Multiple imputation combined with exclusion</td><td align="left" valign="top">Not reported</td><td align="left" valign="top">Not reported</td></tr><tr><td align="left" valign="top">Li et al [<xref ref-type="bibr" rid="ref20">20</xref>]</td><td align="left" valign="top">Not reported</td><td align="left" valign="top">Not reported</td><td align="left" valign="top">Not reported</td></tr><tr><td align="left" valign="top">Liu et al [<xref ref-type="bibr" rid="ref21">21</xref>]</td><td align="left" valign="top">Not reported</td><td align="left" valign="top">Not reported</td><td align="left" valign="top">Not reported</td></tr><tr><td align="left" valign="top">Mo et al [<xref ref-type="bibr" rid="ref22">22</xref>]</td><td align="left" valign="top">Missing values were filled with 0</td><td align="left" valign="top">Not reported</td><td align="left" valign="top">Not reported</td></tr><tr><td align="left" valign="top">Park et al [<xref ref-type="bibr" rid="ref23">23</xref>]</td><td align="left" valign="top">Not reported</td><td align="left" valign="top">Not reported</td><td align="left" valign="top">Not reported</td></tr><tr><td align="left" valign="top">Shi et al [<xref ref-type="bibr" rid="ref13">13</xref>]</td><td align="left" valign="top">Median imputation</td><td align="left" valign="top">SMOTE<sup><xref ref-type="table-fn" rid="table5fn2">b</xref></sup> Tomek</td><td align="left" valign="top">Not reported</td></tr><tr><td align="left" valign="top">Shi et al [<xref ref-type="bibr" rid="ref24">24</xref>]</td><td align="left" valign="top">KNN<sup><xref ref-type="table-fn" rid="table5fn3">c</xref></sup> imputation</td><td align="left" valign="top">ADASYN<sup><xref ref-type="table-fn" rid="table5fn4">d</xref></sup></td><td align="left" valign="top">Not reported</td></tr><tr><td align="left" valign="top">Stehrer et al [<xref ref-type="bibr" rid="ref25">25</xref>]</td><td align="left" valign="top">Exclusion if &#x003E;25% missing; mean or mode imputation if &#x003C;25%</td><td align="left" valign="top">Not reported</td><td align="left" valign="top">Not reported</td></tr><tr><td align="left" valign="top">Sun et al [<xref ref-type="bibr" rid="ref26">26</xref>]</td><td align="left" valign="top">Exclusion of patients with missing key indicators</td><td align="left" valign="top">Not reported</td><td align="left" valign="top">Not reported</td></tr><tr><td align="left" valign="top">Wang [<xref ref-type="bibr" rid="ref27">27</xref>]</td><td align="left" valign="top">Not reported</td><td align="left" valign="top">Not reported</td><td align="left" valign="top">Z-score normalization</td></tr><tr><td align="left" valign="top">Wakiya et al [<xref ref-type="bibr" rid="ref28">28</xref>]</td><td align="left" valign="top">Not reported</td><td align="left" valign="top">Not reported</td><td align="left" valign="top">Not reported</td></tr><tr><td align="left" valign="top">Xu [<xref ref-type="bibr" rid="ref29">29</xref>]</td><td align="left" valign="top">Exclusion of patients with missing key indicators</td><td align="left" valign="top">Not reported</td><td align="left" valign="top">MRI<sup><xref ref-type="table-fn" rid="table5fn5">e</xref></sup> pixel values scaled to [0,1]</td></tr><tr><td align="left" valign="top">Xue et al [<xref ref-type="bibr" rid="ref30">30</xref>]</td><td align="left" valign="top">Not reported</td><td align="left" valign="top">Not reported</td><td align="left" valign="top">Not reported</td></tr><tr><td align="left" valign="top">Yang et al [<xref ref-type="bibr" rid="ref31">31</xref>]</td><td align="left" valign="top">Not reported</td><td align="left" valign="top">Not reported</td><td align="left" valign="top">Not reported</td></tr><tr><td align="left" valign="top">Yang et al [<xref ref-type="bibr" rid="ref32">32</xref>]</td><td align="left" valign="top">Not reported</td><td align="left" valign="top">Not reported</td><td align="left" valign="top">Not reported</td></tr><tr><td align="left" valign="top">Yin et al [<xref ref-type="bibr" rid="ref33">33</xref>]</td><td align="left" valign="top">Not reported</td><td align="left" valign="top">SMOTE</td><td align="left" valign="top">Not reported</td></tr><tr><td align="left" valign="top">Zheng et al [<xref ref-type="bibr" rid="ref34">34</xref>]</td><td align="left" valign="top">Not reported</td><td align="left" valign="top">Not reported</td><td align="left" valign="top">Not reported</td></tr><tr><td align="left" valign="top">Zheng et al [<xref ref-type="bibr" rid="ref35">35</xref>]</td><td align="left" valign="top">Not reported</td><td align="left" valign="top">Not reported</td><td align="left" valign="top">Standardization and normalization applied</td></tr><tr><td align="left" valign="top">Zong et al [<xref ref-type="bibr" rid="ref36">36</xref>]</td><td align="left" valign="top">Not reported</td><td align="left" valign="top">Not reported</td><td align="left" valign="top">Not reported</td></tr><tr><td align="left" valign="top">Li [<xref ref-type="bibr" rid="ref37">37</xref>]</td><td align="left" valign="top">Not reported</td><td align="left" valign="top">Not reported</td><td align="left" valign="top">Not reported</td></tr></tbody></table><table-wrap-foot><fn id="table5fn1"><p><sup>a</sup>MICE: multivariate imputation by chained equations.</p></fn><fn id="table5fn2"><p><sup>b</sup>SMOTE: synthetic minority oversampling technique.</p></fn><fn id="table5fn3"><p><sup>c</sup>KNN: k-nearest neighbors.</p></fn><fn id="table5fn4"><p><sup>d</sup>ADASYN: adaptive synthetic sampling.</p></fn><fn id="table5fn5"><p><sup>e</sup>MRI: magnetic resonance imaging.</p></fn></table-wrap-foot></table-wrap></sec><sec id="s3-7"><title>Risk-of-Bias Assessment of Included Studies</title><p>Based on a systematic evaluation using the PROBAST (<xref ref-type="table" rid="table6">Table 6</xref>), all included studies (23/23, 100% [<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref12">12</xref>,<xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref18">18</xref>-<xref ref-type="bibr" rid="ref37">37</xref>]) were judged to have an overall &#x201C;high&#x201D; risk of bias. High risk primarily stemmed from 2 domains&#x2014;the &#x201C;participants&#x201D; domain (23/23, 100% [<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref12">12</xref>,<xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref18">18</xref>-<xref ref-type="bibr" rid="ref37">37</xref>], due to selection bias inherent in retrospective designs) and the &#x201C;analysis&#x201D; domain (20/23, 87% [<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref18">18</xref>,<xref ref-type="bibr" rid="ref20">20</xref>-<xref ref-type="bibr" rid="ref25">25</xref>,<xref ref-type="bibr" rid="ref27">27</xref>-<xref ref-type="bibr" rid="ref37">37</xref>], mainly attributable to inconsistent data preprocessing and shortcomings in validation strategies).</p><table-wrap id="t6" position="float"><label>Table 6.</label><caption><p>Risk of bias assessment of included models (n=23 studies).</p></caption><table id="table6" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Author</td><td align="left" valign="bottom">Participants</td><td align="left" valign="bottom">Predictors</td><td align="left" valign="bottom">Outcome</td><td align="left" valign="bottom">Analysis</td><td align="left" valign="bottom">Overall</td></tr></thead><tbody><tr><td align="left" valign="top">Akazawa and Hashimoto [<xref ref-type="bibr" rid="ref10">10</xref>]</td><td align="left" valign="top">High</td><td align="left" valign="top">Low</td><td align="left" valign="top">Unclear</td><td align="left" valign="top">High</td><td align="left" valign="top">High</td></tr><tr><td align="left" valign="top">Akazawa and Hashimoto [<xref ref-type="bibr" rid="ref18">18</xref>]</td><td align="left" valign="top">High</td><td align="left" valign="top">Low</td><td align="left" valign="top">Unclear</td><td align="left" valign="top">High</td><td align="left" valign="top">High</td></tr><tr><td align="left" valign="top">Chen et al [<xref ref-type="bibr" rid="ref12">12</xref>]</td><td align="left" valign="top">High</td><td align="left" valign="top">Unclear</td><td align="left" valign="top">Unclear</td><td align="left" valign="top">Low</td><td align="left" valign="top">High</td></tr><tr><td align="left" valign="top">de Reus DC et al [<xref ref-type="bibr" rid="ref19">19</xref>]</td><td align="left" valign="top">High</td><td align="left" valign="top">Unclear</td><td align="left" valign="top">Unclear</td><td align="left" valign="top">Low</td><td align="left" valign="top">High</td></tr><tr><td align="left" valign="top">Li et al [<xref ref-type="bibr" rid="ref20">20</xref>]</td><td align="left" valign="top">High</td><td align="left" valign="top">Low</td><td align="left" valign="top">Low</td><td align="left" valign="top">High</td><td align="left" valign="top">High</td></tr><tr><td align="left" valign="top">Liu et al [<xref ref-type="bibr" rid="ref21">21</xref>]</td><td align="left" valign="top">High</td><td align="left" valign="top">Unclear</td><td align="left" valign="top">Unclear</td><td align="left" valign="top">High</td><td align="left" valign="top">High</td></tr><tr><td align="left" valign="top">Mo et al [<xref ref-type="bibr" rid="ref22">22</xref>]</td><td align="left" valign="top">High</td><td align="left" valign="top">Unclear</td><td align="left" valign="top">Low</td><td align="left" valign="top">High</td><td align="left" valign="top">High</td></tr><tr><td align="left" valign="top">Park et al [<xref ref-type="bibr" rid="ref23">23</xref>]</td><td align="left" valign="top">High</td><td align="left" valign="top">Low</td><td align="left" valign="top">Low</td><td align="left" valign="top">High</td><td align="left" valign="top">High</td></tr><tr><td align="left" valign="top">Shi et al [<xref ref-type="bibr" rid="ref13">13</xref>]</td><td align="left" valign="top">High</td><td align="left" valign="top">Low</td><td align="left" valign="top">Low</td><td align="left" valign="top">High</td><td align="left" valign="top">High</td></tr><tr><td align="left" valign="top">Shi et al [<xref ref-type="bibr" rid="ref24">24</xref>]</td><td align="left" valign="top">High</td><td align="left" valign="top">Unclear</td><td align="left" valign="top">Unclear</td><td align="left" valign="top">High</td><td align="left" valign="top">High</td></tr><tr><td align="left" valign="top">Stehrer et al [<xref ref-type="bibr" rid="ref25">25</xref>]</td><td align="left" valign="top">High</td><td align="left" valign="top">Low</td><td align="left" valign="top">High</td><td align="left" valign="top">High</td><td align="left" valign="top">High</td></tr><tr><td align="left" valign="top">Sun et al [<xref ref-type="bibr" rid="ref26">26</xref>]</td><td align="left" valign="top">High</td><td align="left" valign="top">Low</td><td align="left" valign="top">Low</td><td align="left" valign="top">Low</td><td align="left" valign="top">High</td></tr><tr><td align="left" valign="top">Wang [<xref ref-type="bibr" rid="ref27">27</xref>]</td><td align="left" valign="top">High</td><td align="left" valign="top">High</td><td align="left" valign="top">Low</td><td align="left" valign="top">High</td><td align="left" valign="top">High</td></tr><tr><td align="left" valign="top">Wakiya et al [<xref ref-type="bibr" rid="ref28">28</xref>]</td><td align="left" valign="top">High</td><td align="left" valign="top">High</td><td align="left" valign="top">High</td><td align="left" valign="top">High</td><td align="left" valign="top">High</td></tr><tr><td align="left" valign="top">Xu [<xref ref-type="bibr" rid="ref29">29</xref>]</td><td align="left" valign="top">High</td><td align="left" valign="top">High</td><td align="left" valign="top">High</td><td align="left" valign="top">High</td><td align="left" valign="top">High</td></tr><tr><td align="left" valign="top">Xue et al [<xref ref-type="bibr" rid="ref30">30</xref>]</td><td align="left" valign="top">High</td><td align="left" valign="top">High</td><td align="left" valign="top">High</td><td align="left" valign="top">High</td><td align="left" valign="top">High</td></tr><tr><td align="left" valign="top">Yang et al [<xref ref-type="bibr" rid="ref31">31</xref>]</td><td align="left" valign="top">High</td><td align="left" valign="top">High</td><td align="left" valign="top">High</td><td align="left" valign="top">High</td><td align="left" valign="top">High</td></tr><tr><td align="left" valign="top">Yang et al [<xref ref-type="bibr" rid="ref32">32</xref>]</td><td align="left" valign="top">High</td><td align="left" valign="top">Low</td><td align="left" valign="top">High</td><td align="left" valign="top">High</td><td align="left" valign="top">High</td></tr><tr><td align="left" valign="top">Yin et al [<xref ref-type="bibr" rid="ref33">33</xref>]</td><td align="left" valign="top">High</td><td align="left" valign="top">Unclear</td><td align="left" valign="top">High</td><td align="left" valign="top">High</td><td align="left" valign="top">High</td></tr><tr><td align="left" valign="top">Zheng et al [<xref ref-type="bibr" rid="ref34">34</xref>]</td><td align="left" valign="top">High</td><td align="left" valign="top">Low</td><td align="left" valign="top">Low</td><td align="left" valign="top">High</td><td align="left" valign="top">High</td></tr><tr><td align="left" valign="top">Zheng et al [<xref ref-type="bibr" rid="ref35">35</xref>]</td><td align="left" valign="top">High</td><td align="left" valign="top">Low</td><td align="left" valign="top">Low</td><td align="left" valign="top">High</td><td align="left" valign="top">High</td></tr><tr><td align="left" valign="top">Zong et al [<xref ref-type="bibr" rid="ref36">36</xref>]</td><td align="left" valign="top">High</td><td align="left" valign="top">Low</td><td align="left" valign="top">Low</td><td align="left" valign="top">High</td><td align="left" valign="top">High</td></tr><tr><td align="left" valign="top">Li [<xref ref-type="bibr" rid="ref37">37</xref>]</td><td align="left" valign="top">High</td><td align="left" valign="top">High</td><td align="left" valign="top">High</td><td align="left" valign="top">High</td><td align="left" valign="top">High</td></tr></tbody></table></table-wrap></sec></sec><sec id="s4" sec-type="discussion"><title>Discussion</title><sec id="s4-1"><title>Principal Findings</title><p>This systematic scoping review synthesizes the current state of ML in predicting intraoperative bleeding in patients undergoing surgery. The results indicate that ML models demonstrate good discriminative ability (mean AUC 0.82, SD 0.008) and, in some scenarios, outperform traditional methods [<xref ref-type="bibr" rid="ref10">10</xref>]. Multimodal data (eg, EHR combined with medical imaging) can further enhance predictive efficacy, aligning with the paradigm shift from &#x201C;unimodal perception&#x201D; to &#x201C;multimodal cognition&#x201D; [<xref ref-type="bibr" rid="ref38">38</xref>]. However, the PROBAST assessment reveals a fundamental contradiction; despite significant technical potential, current studies exhibit a universally high risk of bias, particularly in the analysis domain (22/23, 87% of the included studies [<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref18">18</xref>,<xref ref-type="bibr" rid="ref20">20</xref>-<xref ref-type="bibr" rid="ref25">25</xref>,<xref ref-type="bibr" rid="ref27">27</xref>-<xref ref-type="bibr" rid="ref37">37</xref>]). This raises serious concerns that the reported performance metrics are likely overestimated. Specifically, this systematic risk of overestimation stems from three interconnected methodological shortcomings: (1) selective reporting and optimization bias, whereby studies tend to report only the best-performing models and favorable metrics (eg, AUC) while omitting critical measures such as calibration; (2) inadequate internal validation strategies, characterized by reliance on simple data splitting without temporal validation, which may lead to overfitting and overly optimistic performance estimates; and (3) insufficient handling of critical data issues, like class imbalance and missing data, which can artificially inflate discrimination metrics. Collectively, these flaws indicate that the reported mean AUC of 0.82 (SD 0.008) likely reflects optimal laboratory performance under ideal conditions, rather than the true generalizability of the models to independent, prospectively collected clinical data. This view is corroborated by the commonly observed performance degradation in the limited external validations available, where models often exhibit significant drops in AUC when applied to independent cohorts [<xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref19">19</xref>]. Based on this, the subsequent discussion of this review will systematically focus on these three core aspects&#x2014;the completeness of model performance reporting, the rigor of validation strategies, and the transparency of data preprocessing and interpretability.</p><p>First, there is severe selective bias in the reporting of model performance, which limits a comprehensive assessment of their clinical applicability. Current research is overly focused on reporting discrimination metrics (AUC reported in 19/23, 83% of studies [<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref18">18</xref>,<xref ref-type="bibr" rid="ref20">20</xref>-<xref ref-type="bibr" rid="ref25">25</xref>,<xref ref-type="bibr" rid="ref27">27</xref>-<xref ref-type="bibr" rid="ref37">37</xref>]), while seriously neglecting calibration (reported in 10/23, 43% [<xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref18">18</xref>,<xref ref-type="bibr" rid="ref19">19</xref>,<xref ref-type="bibr" rid="ref25">25</xref>,<xref ref-type="bibr" rid="ref26">26</xref>,<xref ref-type="bibr" rid="ref28">28</xref>,<xref ref-type="bibr" rid="ref32">32</xref>-<xref ref-type="bibr" rid="ref34">34</xref>,<xref ref-type="bibr" rid="ref36">36</xref>]) and key classification metrics (eg, precision and <italic>F</italic><sub>1</sub>-score, reported in 4/23, 17% [<xref ref-type="bibr" rid="ref12">12</xref>,<xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref19">19</xref>,<xref ref-type="bibr" rid="ref30">30</xref>]). This bias obscures two core issues. First, the widespread absence of model calibration assessment undermines the clinical credibility of predicted probabilities. Calibration reflects the consistency between predicted probabilities and actual risks, serving as the direct basis for risk stratification [<xref ref-type="bibr" rid="ref39">39</xref>]. However, only a minority of studies reported calibration results [<xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref18">18</xref>,<xref ref-type="bibr" rid="ref19">19</xref>,<xref ref-type="bibr" rid="ref25">25</xref>,<xref ref-type="bibr" rid="ref26">26</xref>,<xref ref-type="bibr" rid="ref28">28</xref>,<xref ref-type="bibr" rid="ref32">32</xref>-<xref ref-type="bibr" rid="ref34">34</xref>,<xref ref-type="bibr" rid="ref36">36</xref>]. More critically, calibration performance is unstable and cannot be inferred from a high AUC. For example, one study [<xref ref-type="bibr" rid="ref33">33</xref>] reported good internal calibration, whereas independent external validation [<xref ref-type="bibr" rid="ref19">19</xref>] revealed significant miscalibration. This suggests that calibration must be independently evaluated, as its issues are often exposed during external validation. Furthermore, its absence in most studies casts doubt on the reliability of their &#x201C;risk probability&#x201D; outputs. Second, incomplete reporting of key classification metrics hinders the judgment of model utility. Precision is crucial for assessing alert efficiency and preventing alarm fatigue, yet its reporting is severely inadequate [<xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref19">19</xref>,<xref ref-type="bibr" rid="ref21">21</xref>,<xref ref-type="bibr" rid="ref36">36</xref>]. This makes it impossible to quantify the model&#x2019;s false-positive risk. For instance, a model [<xref ref-type="bibr" rid="ref12">12</xref>] reported high sensitivity (eg, identifying most true bleeding events) but lower specificity, implying a higher number of false-positive alerts. Without reporting precision, the accuracy of these alerts cannot be quantified, making it difficult to assess whether this high-sensitivity strategy would lead to &#x201C;alert fatigue&#x201D; in practice. Conversely, the model developed by Xue et al [<xref ref-type="bibr" rid="ref30">30</xref>] achieved high accuracy (eg, most of its alerts are true), but its sensitivity might be low, potentially missing a considerable proportion of true bleeding events, which could increase the risk of clinical under-diagnosis. The systematic absence of these key metrics makes it challenging to evaluate model robustness across different clinical decision thresholds. Therefore, future research must strictly adhere to reporting guidelines, such as Transparent Reporting of a Multivariable Prediction Model for Individual Prognosis or Diagnosis (TRIPOD) [<xref ref-type="bibr" rid="ref40">40</xref>] and comprehensively present calibration and classification metrics to bridge the gap between technical development and clinical practice.</p><p>Second, model validation strategies generally lack rigor. The widespread absence of external validation, in particular, weakens the reliability of their generalizability assessment. This review found that although over half of the studies (12/23, 52% [<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref12">12</xref>,<xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref18">18</xref>,<xref ref-type="bibr" rid="ref20">20</xref>,<xref ref-type="bibr" rid="ref22">22</xref>-<xref ref-type="bibr" rid="ref27">27</xref>,<xref ref-type="bibr" rid="ref33">33</xref>]) established an independent test set, their internal validation mostly relied on simple data splitting, with only one study [<xref ref-type="bibr" rid="ref33">33</xref>] using the more robust temporal validation method. This overreliance on simple hold-out methods, coupled with limited adoption of methods such as cross-validation, may lead to optimistic performance estimates. More critically, external validation is severely lacking (only 6/23, 26% [<xref ref-type="bibr" rid="ref12">12</xref>,<xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref18">18</xref>,<xref ref-type="bibr" rid="ref19">19</xref>,<xref ref-type="bibr" rid="ref32">32</xref>,<xref ref-type="bibr" rid="ref34">34</xref>]), and performance degradation is commonly observed in implemented validations. This directly reveals the limited generalizability of models developed on homogeneous data. For example, the model by Shi et al [<xref ref-type="bibr" rid="ref13">13</xref>] experienced a decrease in AUC from 0.85 in internal validation to 0.63 during multinational, multicenter external validation [<xref ref-type="bibr" rid="ref19">19</xref>]. Models by Yang et al [<xref ref-type="bibr" rid="ref32">32</xref>] and Zheng et al [<xref ref-type="bibr" rid="ref34">34</xref>] showed similar trends in external performance decline. A notable exception is the model by Chen et al [<xref ref-type="bibr" rid="ref12">12</xref>], which was built on large-scale multicenter data and showed improved performance in external validation, suggesting that an appropriate study design can enhance generalizability. In summary, the generalizability of existing models has not been sufficiently or rigorously validated. To further confirm the effectiveness and broad applicability of models in real-world settings, future research must incorporate prospective design, temporal validation, and multicenter external validation as key components of model evaluation.</p><p>Furthermore, insufficient transparency in data preprocessing and the widespread lack of model interpretability constitute another systemic methodological defect hindering research reproducibility and clinical translation. This review found that over 40% (11/23) of studies [<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref20">20</xref>,<xref ref-type="bibr" rid="ref21">21</xref>,<xref ref-type="bibr" rid="ref23">23</xref>,<xref ref-type="bibr" rid="ref30">30</xref>-<xref ref-type="bibr" rid="ref34">34</xref>,<xref ref-type="bibr" rid="ref36">36</xref>,<xref ref-type="bibr" rid="ref37">37</xref>] did not report methods for handling missing data, and only 13% (3/23) [<xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref24">24</xref>,<xref ref-type="bibr" rid="ref33">33</xref>] addressed class imbalance. The reporting of data preprocessing steps is severely deficient and nonstandard (eg, failing to clearly describe key procedures such as handling missing values and normalization [<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref19">19</xref>-<xref ref-type="bibr" rid="ref22">22</xref>,<xref ref-type="bibr" rid="ref26">26</xref>,<xref ref-type="bibr" rid="ref27">27</xref>,<xref ref-type="bibr" rid="ref29">29</xref>-<xref ref-type="bibr" rid="ref31">31</xref>]), thereby directly compromising model robustness and reproducibility. Although a few studies adopted more rigorous methods (eg, multiple imputation [<xref ref-type="bibr" rid="ref12">12</xref>,<xref ref-type="bibr" rid="ref18">18</xref>], SMOTE [<xref ref-type="bibr" rid="ref33">33</xref>], or adaptive synthetic sampling [<xref ref-type="bibr" rid="ref24">24</xref>]), simpler strategies that may introduce bias (eg, direct case deletion [<xref ref-type="bibr" rid="ref17">17</xref>,<xref ref-type="bibr" rid="ref25">25</xref>,<xref ref-type="bibr" rid="ref28">28</xref>]) remain common. This lack of transparency makes interstudy comparison and independent replication exceptionally difficult and may partly explain the performance decline observed for some models during external validation [<xref ref-type="bibr" rid="ref19">19</xref>]. Concurrently, model interpretability analysis is far from standard practice. The vast majority of studies lack any explanatory analysis (eg, SHAP values and feature importance), rendering them &#x201C;black boxes&#x201D; that clinical decision-makers find difficult to trust. Although a few studies have attempted to apply interpretability techniques, such as SHAP values or feature importance rankings [<xref ref-type="bibr" rid="ref19">19</xref>,<xref ref-type="bibr" rid="ref22">22</xref>], to identify key risk features and enhance transparency, this has not become routine. Therefore, future research must be committed to promoting the standardized reporting of data preprocessing workflows and deeply integrating interpretability analysis throughout the entire model development and validation process, which is a key prerequisite for building trustworthy and clinically usable prediction tools.</p></sec><sec id="s4-2"><title>Future Research Directions</title><p>Based on the findings of this review, to promote the transition of prediction models from &#x201C;technically feasible&#x201D; to &#x201C;clinically applicable,&#x201D; future research should focus on four core directions. First, promote rigorous validation and generalizability assessment. Model development must move beyond retrospective single-center designs, collect data through multicenter prospective studies, and use temporal validation and independent external validation as cornerstones of evaluation to rigorously test their robustness. Second, improve performance reporting and clinical utility evaluation. Research must strictly adhere to reporting guidelines, such as TRIPOD, and fully present performance metrics. Furthermore, methods such as decision curve analysis should be actively adopted to quantify the clinical net benefit of models across different decision thresholds, aligning evaluation with real-world decision-making scenarios. Third, standardize data processing and enhance model interpretability. Detailed reporting of data preprocessing workflows, along with the adoption of advanced methods for handling missing values and class imbalance, should become standard practice. Simultaneously, interpretability techniques, such as SHAP, should be integrated into the development pipeline as essential components to elucidate risk mechanisms and build clinical trust. Finally, explore clinical integration pathways and evaluate real-world impact. Current research in the field mostly remains at the stage of model development and technical validation, and its potential clinical value has not yet been substantiated. Specifically, building on preliminary evidence, future research should be dedicated to deepening and validating the following key translational aspects. First, promote the prospective application and effect evaluation of prediction models to guide preoperative blood preparation. Although existing models show potential to optimize blood preparation strategies [<xref ref-type="bibr" rid="ref41">41</xref>,<xref ref-type="bibr" rid="ref42">42</xref>], their impact on resource conservation and team response efficiency after integration into actual workflows remains to be confirmed by prospective studies. Second, expand the generalizability and clinical integration of real-time alert models. Although some studies have successfully developed real-time prediction models for intraoperative massive transfusion and demonstrated excellent performance [<xref ref-type="bibr" rid="ref43">43</xref>], their generalizability across different surgical types and medical centers, as well as their actual alert efficacy and clinical acceptance after integration into anesthesia monitoring systems, requires further validation. Finally, and most challengingly, evaluate the improvement effect of model-based clinical decisions on patient hard endpoints through prospective interventional trials. Existing observational studies suggest that transfusion is associated with worse outcomes and higher costs [<xref ref-type="bibr" rid="ref44">44</xref>]. Future well-designed studies are needed to confirm whether effective prediction-intervention strategies can ultimately achieve comprehensive benefits&#x2014;such as reducing unnecessary transfusions and timely management of major bleeding&#x2014;thereby lowering complications, improving patient prognosis, and saving medical costs.</p></sec><sec id="s4-3"><title>Limitations</title><p>The limitations of this review primarily stem from the methodological quality of the included original studies. First, the search strategy may not have captured all relevant literature, posing a risk of omission. More critically, the widespread retrospective design and high risk of bias in the current field necessitate cautious interpretation regarding the true performance and generalizability of the evaluated models.</p></sec><sec id="s4-4"><title>Conclusion</title><p>This scoping review indicates that research on ML for predicting intraoperative bleeding is growing rapidly in quantity, but the quality of studies has not improved correspondingly, constituting the main obstacle to clinical translation. Existing models are generally built on retrospective data and suffer from core methodological flaws, including a high risk of bias, a severe lack of external validation, and incomplete reporting of key performance metrics. Therefore, the clinical applicability and reliability of current models are far from established. To achieve the leap from methodological exploration to clinical utility, future research must meet higher standards&#x2014;prioritize prospective design, enforce independent and multicenter external validation, strictly adhere to standardized reporting guidelines such as TRIPOD, and strive to explore effective pathways for integrating models into perioperative workflows.</p></sec></sec></body><back><ack><p>No generative AI tools were used at any stage in the preparation of this manuscript. All content, including text, data, analyses, references, and citations, was generated and reviewed entirely by the authors. We remain fully responsible for the accuracy, originality, and integrity of the manuscript. SY and PZ are co-first authors.</p></ack><notes><sec><title>Funding</title><p>No external financial support or grants were received from any public, commercial, or not-for-profit entities for the research, authorship, or publication of this article.</p></sec><sec><title>Data Availability</title><p>This study is a scoping review and does not involve the generation or analysis of new data. All data used in this review were extracted from publicly available papers indexed in PubMed, Web of Science, Embase, CINAHL, CNKI, Wanfang, and VIP. No new datasets were created or analyzed in the course of this research. The studies included in this review can be accessed through their respective journals and databases.</p></sec></notes><fn-group><fn fn-type="con"><p>SY contributed to conceptualization, methodology, investigation, and writing&#x2014;original draft.</p><p>PZ contributed to methodology, formal analysis, data curation, and writing&#x2014;original draft.</p><p>LX and JJ contributed to conceptualization, supervision, and project administration.</p><p>SX and WQ contributed to investigation.</p><p>HH and YG contributed to formal analysis and data curation.</p><p>All authors participated in writing&#x2014;review &#x0026; editing and approved the final manuscript.</p></fn><fn fn-type="conflict"><p>None declared.</p></fn></fn-group><glossary><title>Abbreviations</title><def-list><def-item><term id="abb1">AUC</term><def><p>area under the curve</p></def></def-item><def-item><term id="abb2">CHARMS</term><def><p>Critical Appraisal and Data Extraction for Systematic Reviews of Prediction Modeling studies</p></def></def-item><def-item><term id="abb3">CNKI</term><def><p>China National Knowledge Infrastructure</p></def></def-item><def-item><term id="abb4">EHR</term><def><p>electronic health record</p></def></def-item><def-item><term id="abb5">ML</term><def><p>machine learning</p></def></def-item><def-item><term id="abb6">MRI</term><def><p>magnetic resonance imaging</p></def></def-item><def-item><term id="abb7">PICOS</term><def><p>Population, Intervention, Comparator, Outcome, and Study design</p></def></def-item><def-item><term id="abb8">PRISMA-ScR</term><def><p>Preferred Reporting Items for Systematic Reviews and Meta-Analyses extension for Scoping Reviews</p></def></def-item><def-item><term id="abb9">PROBAST</term><def><p>Prediction model Risk of Bias Assessment Tool</p></def></def-item><def-item><term id="abb10">SHAP</term><def><p>Shapley Additive Explanations</p></def></def-item><def-item><term id="abb11">SMOTE</term><def><p>synthetic minority over-sampling technique</p></def></def-item><def-item><term id="abb12">TRIPOD</term><def><p>Transparent Reporting of a Multivariable Prediction Model for Individual Prognosis or Diagnosis</p></def></def-item><def-item><term id="abb13">VIP</term><def><p>China Science and Technology Journal Database</p></def></def-item></def-list></glossary><ref-list><title>References</title><ref id="ref1"><label>1</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Shah</surname><given-names>A</given-names> </name><name name-style="western"><surname>Palmer</surname><given-names>AJR</given-names> </name><name name-style="western"><surname>Klein</surname><given-names>AA</given-names> </name></person-group><article-title>Strategies to minimize intraoperative blood loss during major surgery</article-title><source>Br J Surg</source><year>2020</year><month>01</month><volume>107</volume><issue>2</issue><fpage>e26</fpage><lpage>e38</lpage><pub-id pub-id-type="doi">10.1002/bjs.11393</pub-id><pub-id pub-id-type="medline">31903592</pub-id></nlm-citation></ref><ref id="ref2"><label>2</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lin</surname><given-names>YM</given-names> </name><name name-style="western"><surname>Yu</surname><given-names>C</given-names> </name><name name-style="western"><surname>Xian</surname><given-names>GZ</given-names> </name></person-group><article-title>Calculation methods for intraoperative blood loss: a literature review</article-title><source>BMC Surg</source><year>2024</year><month>12</month><day>20</day><volume>24</volume><issue>1</issue><fpage>394</fpage><pub-id pub-id-type="doi">10.1186/s12893-024-02699-3</pub-id><pub-id pub-id-type="medline">39707278</pub-id></nlm-citation></ref><ref id="ref3"><label>3</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Sie&#x015B;kiewicz</surname><given-names>A</given-names> </name><name name-style="western"><surname>Resze&#x0107;</surname><given-names>J</given-names> </name><name name-style="western"><surname>Piszczatowski</surname><given-names>B</given-names> </name><etal/></person-group><article-title>Intraoperative bleeding during endoscopic sinus surgery and microvascular density of the nasal mucosa</article-title><source>Adv Med Sci</source><year>2014</year><month>03</month><volume>59</volume><issue>1</issue><fpage>132</fpage><lpage>135</lpage><pub-id pub-id-type="doi">10.1016/j.advms.2013.10.001</pub-id><pub-id pub-id-type="medline">24797989</pub-id></nlm-citation></ref><ref id="ref4"><label>4</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Park</surname><given-names>J</given-names> </name><name name-style="western"><surname>Kwon</surname><given-names>J hye</given-names> </name><name name-style="western"><surname>Lee</surname><given-names>SH</given-names> </name><etal/></person-group><article-title>Intraoperative blood loss may be associated with myocardial injury after non-cardiac surgery</article-title><source>PLOS ONE</source><year>2021</year><volume>16</volume><issue>2</issue><fpage>e0241114</fpage><pub-id pub-id-type="doi">10.1371/journal.pone.0241114</pub-id></nlm-citation></ref><ref id="ref5"><label>5</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Shander</surname><given-names>A</given-names> </name><name name-style="western"><surname>Hardy</surname><given-names>JF</given-names> </name><name name-style="western"><surname>Ozawa</surname><given-names>S</given-names> </name><etal/></person-group><article-title>A global definition of patient blood management</article-title><source>Anesth Analg</source><year>2022</year><month>09</month><day>1</day><volume>135</volume><issue>3</issue><fpage>476</fpage><lpage>488</lpage><pub-id pub-id-type="doi">10.1213/ANE.0000000000005873</pub-id><pub-id pub-id-type="medline">35147598</pub-id></nlm-citation></ref><ref id="ref6"><label>6</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Yoon</surname><given-names>D</given-names> </name><name name-style="western"><surname>Yoo</surname><given-names>M</given-names> </name><name name-style="western"><surname>Kim</surname><given-names>BS</given-names> </name><etal/></person-group><article-title>Automated deep learning model for estimating intraoperative blood loss using gauze images</article-title><source>Sci Rep</source><year>2024</year><month>01</month><day>31</day><volume>14</volume><issue>1</issue><fpage>2597</fpage><pub-id pub-id-type="doi">10.1038/s41598-024-52524-3</pub-id><pub-id pub-id-type="medline">38297011</pub-id></nlm-citation></ref><ref id="ref7"><label>7</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kirchhoff</surname><given-names>P</given-names> </name><name name-style="western"><surname>Clavien</surname><given-names>PA</given-names> </name><name name-style="western"><surname>Hahnloser</surname><given-names>D</given-names> </name></person-group><article-title>Complications in colorectal surgery: risk factors and preventive strategies</article-title><source>Patient Saf Surg</source><year>2010</year><month>03</month><day>25</day><volume>4</volume><issue>1</issue><fpage>5</fpage><pub-id pub-id-type="doi">10.1186/1754-9493-4-5</pub-id><pub-id pub-id-type="medline">20338045</pub-id></nlm-citation></ref><ref id="ref8"><label>8</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Mahmood</surname><given-names>E</given-names> </name><name name-style="western"><surname>Matyal</surname><given-names>R</given-names> </name><name name-style="western"><surname>Mueller</surname><given-names>A</given-names> </name><etal/></person-group><article-title>Multifactorial risk index for prediction of intraoperative blood transfusion in endovascular aneurysm repair</article-title><source>J Vasc Surg</source><year>2018</year><month>03</month><volume>67</volume><issue>3</issue><fpage>778</fpage><lpage>784</lpage><pub-id pub-id-type="doi">10.1016/j.jvs.2017.06.106</pub-id><pub-id pub-id-type="medline">28965799</pub-id></nlm-citation></ref><ref id="ref9"><label>9</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Alali</surname><given-names>AA</given-names> </name><name name-style="western"><surname>Boustany</surname><given-names>A</given-names> </name><name name-style="western"><surname>Martel</surname><given-names>M</given-names> </name><name name-style="western"><surname>Barkun</surname><given-names>AN</given-names> </name></person-group><article-title>Strengths and limitations of risk stratification tools for patients with upper gastrointestinal bleeding: a narrative review</article-title><source>Expert Rev Gastroenterol Hepatol</source><year>2023</year><volume>17</volume><issue>8</issue><fpage>795</fpage><lpage>803</lpage><pub-id pub-id-type="doi">10.1080/17474124.2023.2242252</pub-id><pub-id pub-id-type="medline">37496492</pub-id></nlm-citation></ref><ref id="ref10"><label>10</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Akazawa</surname><given-names>M</given-names> </name><name name-style="western"><surname>Hashimoto</surname><given-names>K</given-names> </name></person-group><article-title>A multimodal deep learning model for predicting severe hemorrhage in placenta previa</article-title><source>Sci Rep</source><year>2023</year><month>10</month><day>13</day><volume>13</volume><issue>1</issue><fpage>17320</fpage><pub-id pub-id-type="doi">10.1038/s41598-023-44634-1</pub-id><pub-id pub-id-type="medline">37833537</pub-id></nlm-citation></ref><ref id="ref11"><label>11</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Eckhardt</surname><given-names>CM</given-names> </name><name name-style="western"><surname>Madjarova</surname><given-names>SJ</given-names> </name><name name-style="western"><surname>Williams</surname><given-names>RJ</given-names> </name><etal/></person-group><article-title>Unsupervised machine learning methods and emerging applications in healthcare</article-title><source>Knee Surg Sports Traumatol Arthrosc</source><year>2023</year><month>02</month><volume>31</volume><issue>2</issue><fpage>376</fpage><lpage>381</lpage><pub-id pub-id-type="doi">10.1007/s00167-022-07233-7</pub-id><pub-id pub-id-type="medline">36378293</pub-id></nlm-citation></ref><ref id="ref12"><label>12</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Chen</surname><given-names>X</given-names> </name><name name-style="western"><surname>Zhang</surname><given-names>H</given-names> </name><name name-style="western"><surname>Guo</surname><given-names>D</given-names> </name><etal/></person-group><article-title>Risk of intraoperative hemorrhage during cesarean scar ectopic pregnancy surgery: development and validation of an interpretable machine learning prediction model</article-title><source>EClinicalMedicine</source><year>2024</year><month>12</month><volume>78</volume><fpage>102969</fpage><pub-id pub-id-type="doi">10.1016/j.eclinm.2024.102969</pub-id><pub-id pub-id-type="medline">39687425</pub-id></nlm-citation></ref><ref id="ref13"><label>13</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Shi</surname><given-names>X</given-names> </name><name name-style="western"><surname>Cui</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Wang</surname><given-names>S</given-names> </name><name name-style="western"><surname>Pan</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Wang</surname><given-names>B</given-names> </name><name name-style="western"><surname>Lei</surname><given-names>M</given-names> </name></person-group><article-title>Development and validation of a web-based artificial intelligence prediction model to assess massive intraoperative blood loss for metastatic spinal disease using machine learning techniques</article-title><source>Spine J</source><year>2024</year><month>01</month><volume>24</volume><issue>1</issue><fpage>146</fpage><lpage>160</lpage><pub-id pub-id-type="doi">10.1016/j.spinee.2023.09.001</pub-id><pub-id pub-id-type="medline">37704048</pub-id></nlm-citation></ref><ref id="ref14"><label>14</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Tricco</surname><given-names>AC</given-names> </name><name name-style="western"><surname>Lillie</surname><given-names>E</given-names> </name><name name-style="western"><surname>Zarin</surname><given-names>W</given-names> </name><etal/></person-group><article-title>PRISMA Extension for Scoping Reviews (PRISMA-ScR): checklist and explanation</article-title><source>Ann Intern Med</source><year>2018</year><month>10</month><day>2</day><volume>169</volume><issue>7</issue><fpage>467</fpage><lpage>473</lpage><pub-id pub-id-type="doi">10.7326/M18-0850</pub-id><pub-id pub-id-type="medline">30178033</pub-id></nlm-citation></ref><ref id="ref15"><label>15</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Arksey</surname><given-names>H</given-names> </name><name name-style="western"><surname>O&#x2019;Malley</surname><given-names>L</given-names> </name></person-group><article-title>Scoping studies: towards a methodological framework</article-title><source>Int J Soc Res Methodol</source><year>2005</year><month>02</month><volume>8</volume><issue>1</issue><fpage>19</fpage><lpage>32</lpage><pub-id pub-id-type="doi">10.1080/1364557032000119616</pub-id></nlm-citation></ref><ref id="ref16"><label>16</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Moons</surname><given-names>KGM</given-names> </name><name name-style="western"><surname>de Groot</surname><given-names>JAH</given-names> </name><name name-style="western"><surname>Bouwmeester</surname><given-names>W</given-names> </name><etal/></person-group><article-title>Critical appraisal and data extraction for systematic reviews of prediction modelling studies: the CHARMS checklist</article-title><source>PLOS Med</source><year>2014</year><month>10</month><volume>11</volume><issue>10</issue><fpage>e1001744</fpage><pub-id pub-id-type="doi">10.1371/journal.pmed.1001744</pub-id><pub-id pub-id-type="medline">25314315</pub-id></nlm-citation></ref><ref id="ref17"><label>17</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kaul</surname><given-names>T</given-names> </name><name name-style="western"><surname>Damen</surname><given-names>JAA</given-names> </name><name name-style="western"><surname>Wynants</surname><given-names>L</given-names> </name><etal/></person-group><article-title>Assessing the quality of prediction models in health care using the Prediction model Risk Of Bias ASsessment Tool (PROBAST): an evaluation of its use and practical application</article-title><source>J Clin Epidemiol</source><year>2025</year><month>05</month><volume>181</volume><fpage>111732</fpage><pub-id pub-id-type="doi">10.1016/j.jclinepi.2025.111732</pub-id><pub-id pub-id-type="medline">40010583</pub-id></nlm-citation></ref><ref id="ref18"><label>18</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Akazawa</surname><given-names>M</given-names> </name><name name-style="western"><surname>Hashimoto</surname><given-names>K</given-names> </name></person-group><article-title>Prediction of hemorrhage in placenta previa: radiomics analysis of pelvic MRI images</article-title><source>Eur J Obstet Gynecol Reprod Biol</source><year>2024</year><month>08</month><volume>299</volume><fpage>37</fpage><lpage>42</lpage><pub-id pub-id-type="doi">10.1016/j.ejogrb.2024.05.033</pub-id><pub-id pub-id-type="medline">38830301</pub-id></nlm-citation></ref><ref id="ref19"><label>19</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>de Reus</surname><given-names>DC</given-names> </name><name name-style="western"><surname>Kuijten</surname><given-names>RH</given-names> </name><name name-style="western"><surname>Saha</surname><given-names>P</given-names> </name><etal/></person-group><article-title>External validation of a machine learning prediction model for massive blood loss during surgery for spinal metastases: a multi-institutional study using 880 patients</article-title><source>Spine J</source><year>2025</year><month>07</month><volume>25</volume><issue>7</issue><fpage>1386</fpage><lpage>1399</lpage><pub-id pub-id-type="doi">10.1016/j.spinee.2025.03.018</pub-id><pub-id pub-id-type="medline">40157430</pub-id></nlm-citation></ref><ref id="ref20"><label>20</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Li</surname><given-names>J</given-names> </name><name name-style="western"><surname>Jia</surname><given-names>YM</given-names> </name><name name-style="western"><surname>Zhang</surname><given-names>ZL</given-names> </name><etal/></person-group><article-title>Development and validation of a machine learning-based early prediction model for massive intraoperative bleeding in patients with primary hepatic malignancies</article-title><source>World J Gastrointest Oncol</source><year>2024</year><month>01</month><day>15</day><volume>16</volume><issue>1</issue><fpage>90</fpage><lpage>101</lpage><pub-id pub-id-type="doi">10.4251/wjgo.v16.i1.90</pub-id><pub-id pub-id-type="medline">38292843</pub-id></nlm-citation></ref><ref id="ref21"><label>21</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Liu</surname><given-names>J</given-names> </name><name name-style="western"><surname>Wu</surname><given-names>T</given-names> </name><name name-style="western"><surname>Peng</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Luo</surname><given-names>R</given-names> </name></person-group><article-title>Grade prediction of bleeding volume in cesarean section of patients with pernicious placenta previa based on deep learning</article-title><source>Front Bioeng Biotechnol</source><year>2020</year><volume>8</volume><fpage>343</fpage><pub-id pub-id-type="doi">10.3389/fbioe.2020.00343</pub-id></nlm-citation></ref><ref id="ref22"><label>22</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Mo</surname><given-names>J</given-names> </name><name name-style="western"><surname>Huang</surname><given-names>JY</given-names> </name><name name-style="western"><surname>Liu</surname><given-names>H</given-names> </name><etal/></person-group><article-title>Based on the deep neural network principle, construct prediction model for massive bleeding risk during hysteroscopic removal of scar gestation</article-title><source>Chin J Fam Plann Gynecol</source><year>2023</year><volume>15</volume><issue>3</issue><fpage>72</fpage><lpage>77</lpage><pub-id pub-id-type="doi">10.3969/j.issn.1674-4020.2023.03.17</pub-id></nlm-citation></ref><ref id="ref23"><label>23</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Park</surname><given-names>S</given-names> </name><name name-style="western"><surname>Park</surname><given-names>K</given-names> </name><name name-style="western"><surname>Lee</surname><given-names>JG</given-names> </name><etal/></person-group><article-title>Development of machine learning models predicting estimated blood loss during liver transplant surgery</article-title><source>J Pers Med</source><year>2022</year><month>06</month><day>23</day><volume>12</volume><issue>7</issue><fpage>1028</fpage><pub-id pub-id-type="doi">10.3390/jpm12071028</pub-id><pub-id pub-id-type="medline">35887525</pub-id></nlm-citation></ref><ref id="ref24"><label>24</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Shi</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Zhang</surname><given-names>G</given-names> </name><name name-style="western"><surname>Ma</surname><given-names>C</given-names> </name><etal/></person-group><article-title>Machine learning algorithms to predict intraoperative hemorrhage in surgical patients: a modeling study of real-world data in Shanghai, China</article-title><source>BMC Med Inform Decis Mak</source><year>2023</year><month>08</month><day>10</day><volume>23</volume><issue>1</issue><fpage>156</fpage><pub-id pub-id-type="doi">10.1186/s12911-023-02253-w</pub-id><pub-id pub-id-type="medline">37563676</pub-id></nlm-citation></ref><ref id="ref25"><label>25</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Stehrer</surname><given-names>R</given-names> </name><name name-style="western"><surname>Hingsammer</surname><given-names>L</given-names> </name><name name-style="western"><surname>Staudigl</surname><given-names>C</given-names> </name><etal/></person-group><article-title>Machine learning based prediction of perioperative blood loss in orthognathic surgery</article-title><source>J Craniomaxillofac Surg</source><year>2019</year><month>11</month><volume>47</volume><issue>11</issue><fpage>1676</fpage><lpage>1681</lpage><pub-id pub-id-type="doi">10.1016/j.jcms.2019.08.005</pub-id><pub-id pub-id-type="medline">31711996</pub-id></nlm-citation></ref><ref id="ref26"><label>26</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Sun</surname><given-names>Z</given-names> </name><name name-style="western"><surname>Yang</surname><given-names>N</given-names> </name><name name-style="western"><surname>Wang</surname><given-names>L</given-names> </name><name name-style="western"><surname>Zhou</surname><given-names>J</given-names> </name><name name-style="western"><surname>Zhang</surname><given-names>H</given-names> </name><name name-style="western"><surname>Wang</surname><given-names>J</given-names> </name></person-group><article-title>Constructing a predictive model for high intraoperative excessive bleeding in patients undergoing posterior lumbar decompression and fusion internal fixation surgery during outpatient visits</article-title><source>Clin Biochem</source><year>2025</year><month>01</month><volume>135</volume><fpage>110856</fpage><pub-id pub-id-type="doi">10.1016/j.clinbiochem.2024.110856</pub-id><pub-id pub-id-type="medline">39626837</pub-id></nlm-citation></ref><ref id="ref27"><label>27</label><nlm-citation citation-type="book"><person-group person-group-type="author"><name name-style="western"><surname>Wang</surname><given-names>YC</given-names> </name></person-group><source>Value of MRI-Based Radiomics in Diagnosing Placenta Accreta Spectrum Disorders and Predicting Blood Loss during Cesarean Section</source><year>2023</year><access-date>2026-04-22</access-date><publisher-name>Gansu University of Chinese Medicine</publisher-name><pub-id pub-id-type="doi">10.27026/d.cnki.ggszc.2023.000255</pub-id></nlm-citation></ref><ref id="ref28"><label>28</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Wakiya</surname><given-names>T</given-names> </name><name name-style="western"><surname>Ishido</surname><given-names>K</given-names> </name><name name-style="western"><surname>Kimura</surname><given-names>N</given-names> </name><etal/></person-group><article-title>Prediction of massive bleeding in pancreatic surgery based on preoperative patient characteristics using a decision tree</article-title><source>PLOS ONE</source><year>2021</year><volume>16</volume><issue>11</issue><fpage>e0259682</fpage><pub-id pub-id-type="doi">10.1371/journal.pone.0259682</pub-id><pub-id pub-id-type="medline">34752505</pub-id></nlm-citation></ref><ref id="ref29"><label>29</label><nlm-citation citation-type="thesis"><person-group person-group-type="author"><name name-style="western"><surname>Xu</surname><given-names>XY</given-names> </name></person-group><article-title>Value of T2WI-based deep learning and radiomics models in predicting blood loss risk during cesarean section for placenta accreta spectrum disorders</article-title><year>2024</year><access-date>2026-04-22</access-date><publisher-name>Guangdong Medical University</publisher-name><comment><ext-link ext-link-type="uri" xlink:href="https://d.wanfangdata.com.cn/thesis/Ch1UaGVzaXNOZXdTb2xyOVMyMDI2MDQxNTE0Mjg1MRIJRDAzNDg1NDIzGghla3o0bGZoaA%3D%3D">https://d.wanfangdata.com.cn/thesis/Ch1UaGVzaXNOZXdTb2xyOVMyMDI2MDQxNTE0Mjg1MRIJRDAzNDg1NDIzGghla3o0bGZoaA%3D%3D</ext-link></comment></nlm-citation></ref><ref id="ref30"><label>30</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Xue</surname><given-names>Q</given-names> </name><name name-style="western"><surname>Zhu</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Yang</surname><given-names>L</given-names> </name><etal/></person-group><article-title>Predicting intraoperative bleeding in patients undergoing a hepatectomy using multiple machine learning and deep learning techniques</article-title><source>J Clin Anesth</source><year>2021</year><month>11</month><volume>74</volume><fpage>110444</fpage><pub-id pub-id-type="doi">10.1016/j.jclinane.2021.110444</pub-id><pub-id pub-id-type="medline">34217119</pub-id></nlm-citation></ref><ref id="ref31"><label>31</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Yang</surname><given-names>B</given-names> </name><name name-style="western"><surname>Gao</surname><given-names>L</given-names> </name><name name-style="western"><surname>Wang</surname><given-names>X</given-names> </name><etal/></person-group><article-title>Application of supervised machine learning algorithms to predict the risk of hidden blood loss during the perioperative period in thoracolumbar burst fracture patients complicated with neurological compromise</article-title><source>Front Public Health</source><year>2022</year><volume>10</volume><fpage>969919</fpage><pub-id pub-id-type="doi">10.3389/fpubh.2022.969919</pub-id><pub-id pub-id-type="medline">36225767</pub-id></nlm-citation></ref><ref id="ref32"><label>32</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Yang</surname><given-names>H</given-names> </name><name name-style="western"><surname>Wu</surname><given-names>X</given-names> </name><name name-style="western"><surname>Liu</surname><given-names>W</given-names> </name><etal/></person-group><article-title>A quantitative analysis framework of placenta accreta spectrum: placenta subtype, intraoperative bleeding, and hysterectomy risk evaluation based on magnetic resonance imaging-anatomical-clinical features</article-title><source>Quant Imaging Med Surg</source><year>2023</year><month>10</month><day>1</day><volume>13</volume><issue>10</issue><fpage>7105</fpage><lpage>7116</lpage><pub-id pub-id-type="doi">10.21037/qims-23-142</pub-id><pub-id pub-id-type="medline">37869322</pub-id></nlm-citation></ref><ref id="ref33"><label>33</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Yin</surname><given-names>P</given-names> </name><name name-style="western"><surname>Sun</surname><given-names>C</given-names> </name><name name-style="western"><surname>Wang</surname><given-names>S</given-names> </name><name name-style="western"><surname>Chen</surname><given-names>L</given-names> </name><name name-style="western"><surname>Hong</surname><given-names>N</given-names> </name></person-group><article-title>Clinical-deep neural network and clinical-radiomics nomograms for predicting the intraoperative massive blood loss of pelvic and sacral tumors</article-title><source>Front Oncol</source><year>2021</year><volume>11</volume><fpage>752672</fpage><pub-id pub-id-type="doi">10.3389/fonc.2021.752672</pub-id><pub-id pub-id-type="medline">34760700</pub-id></nlm-citation></ref><ref id="ref34"><label>34</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Zheng</surname><given-names>C</given-names> </name><name name-style="western"><surname>Yue</surname><given-names>P</given-names> </name><name name-style="western"><surname>Cao</surname><given-names>K</given-names> </name><etal/></person-group><article-title>Predicting intraoperative blood loss during cesarean sections based on multi-modal information: a two-center study</article-title><source>Abdom Radiol (NY)</source><year>2024</year><month>07</month><volume>49</volume><issue>7</issue><fpage>2325</fpage><lpage>2339</lpage><pub-id pub-id-type="doi">10.1007/s00261-024-04419-0</pub-id><pub-id pub-id-type="medline">38896245</pub-id></nlm-citation></ref><ref id="ref35"><label>35</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Zheng</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Wu</surname><given-names>CX</given-names> </name><name name-style="western"><surname>Yao</surname><given-names>ZX</given-names> </name></person-group><article-title>Development of a hemorrhage prediction model for hepatectomy based on machine learning and preoperative data</article-title><source>Fujian Med Univ J</source><year>2022</year><access-date>2026-04-22</access-date><volume>56</volume><issue>6</issue><fpage>552</fpage><lpage>560</lpage><comment><ext-link ext-link-type="uri" xlink:href="http://kns--cnki--net--https.cnki.scrm.scsycy.vip:2222/kcms2/article/abstract?v=9sxxlkkbz5M8EE0nVpwqU-q3rja4vJevci2btiIU5sY8j8KErSyAfQCankDdkEL869MGzKbdF5MTYxkMF1NMbha1qC-G_Y_dJLGe03VDKwenUTgMP-T3x_vNC6pCOeiGLgA8Phc-aU2bzCqyE8dbObWAR7g5fXstcqkzzR5jlGg-B9EcIqGbp6qXjF9nkoIl&#x0026;uniplatform=NZKPT&#x0026;language=CHS">http://kns--cnki--net--https.cnki.scrm.scsycy.vip:2222/kcms2/article/abstract?v=9sxxlkkbz5M8EE0nVpwqU-q3rja4vJevci2btiIU5sY8j8KErSyAfQCankDdkEL869MGzKbdF5MTYxkMF1NMbha1qC-G_Y_dJLGe03VDKwenUTgMP-T3x_vNC6pCOeiGLgA8Phc-aU2bzCqyE8dbObWAR7g5fXstcqkzzR5jlGg-B9EcIqGbp6qXjF9nkoIl&#x0026;uniplatform=NZKPT&#x0026;language=CHS</ext-link></comment></nlm-citation></ref><ref id="ref36"><label>36</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Zong</surname><given-names>M</given-names> </name><name name-style="western"><surname>Pei</surname><given-names>X</given-names> </name><name name-style="western"><surname>Yan</surname><given-names>K</given-names> </name><etal/></person-group><article-title>Deep learning model based on multisequence MRI images for assessing adverse pregnancy outcome in placenta accreta</article-title><source>J Magn Reson Imaging</source><year>2024</year><month>02</month><volume>59</volume><issue>2</issue><fpage>510</fpage><lpage>521</lpage><pub-id pub-id-type="doi">10.1002/jmri.29023</pub-id><pub-id pub-id-type="medline">37851581</pub-id></nlm-citation></ref><ref id="ref37"><label>37</label><nlm-citation citation-type="book"><person-group person-group-type="author"><name name-style="western"><surname>Li</surname><given-names>H</given-names> </name></person-group><source>Analysis of Risk Factors and Development of a Predictive Model for Massive Hemorrhage during Cesarean Section in Women with Placenta Percreta</source><year>2024</year><publisher-name>Jilin University</publisher-name><pub-id pub-id-type="doi">10.27162/d.cnki.gjlin.2024.006375</pub-id></nlm-citation></ref><ref id="ref38"><label>38</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Chen</surname><given-names>S</given-names> </name><name name-style="western"><surname>Guo</surname><given-names>X</given-names> </name></person-group><article-title>A review of multimodal large models in the field of major diseases [Chinese]</article-title><source>Journal of Harbin Institute of Technology</source><year>2025</year><month>12</month><day>15</day><access-date>2026-04-06</access-date><volume>57</volume><issue>12</issue><fpage>156</fpage><lpage>164</lpage><comment><ext-link ext-link-type="uri" xlink:href="https://scholar.hit.edu.cn/en/publications/%E5%A4%9A%E6%A8%A1%E6%80%81%E5%A4%A7%E6%A8%A1%E5%9E%8B%E5%9C%A8%E9%87%8D%E5%A4%A7%E7%96%BE%E7%97%85%E9%A2%86%E5%9F%9F%E7%9A%84%E7%A0%94%E7%A9%B6%E7%BB%BC%E8%BF%B0/">https://scholar.hit.edu.cn/en/publications/%E5%A4%9A%E6%A8%A1%E6%80%81%E5%A4%A7%E6%A8%A1%E5%9E%8B%E5%9C%A8%E9%87%8D%E5%A4%A7%E7%96%BE%E7%97%85%E9%A2%86%E5%9F%9F%E7%9A%84%E7%A0%94%E7%A9%B6%E7%BB%BC%E8%BF%B0/</ext-link></comment></nlm-citation></ref><ref id="ref39"><label>39</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Alba</surname><given-names>AC</given-names> </name><name name-style="western"><surname>Agoritsas</surname><given-names>T</given-names> </name><name name-style="western"><surname>Walsh</surname><given-names>M</given-names> </name><etal/></person-group><article-title>Discrimination and calibration of clinical prediction models: users&#x2019; guides to the medical literature</article-title><source>JAMA</source><year>2017</year><month>10</month><day>10</day><volume>318</volume><issue>14</issue><fpage>1377</fpage><lpage>1384</lpage><pub-id pub-id-type="doi">10.1001/jama.2017.12126</pub-id><pub-id pub-id-type="medline">29049590</pub-id></nlm-citation></ref><ref id="ref40"><label>40</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Moons</surname><given-names>KGM</given-names> </name><name name-style="western"><surname>Damen</surname><given-names>JAA</given-names> </name><name name-style="western"><surname>Kaul</surname><given-names>T</given-names> </name><etal/></person-group><article-title>PROBAST+AI: an updated quality, risk of bias, and applicability assessment tool for prediction models using regression or artificial intelligence methods</article-title><source>BMJ</source><year>2025</year><month>03</month><day>24</day><volume>388</volume><fpage>e082505</fpage><pub-id pub-id-type="doi">10.1136/bmj-2024-082505</pub-id><pub-id pub-id-type="medline">40127903</pub-id></nlm-citation></ref><ref id="ref41"><label>41</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lou</surname><given-names>SS</given-names> </name><name name-style="western"><surname>Liu</surname><given-names>H</given-names> </name><name name-style="western"><surname>Lu</surname><given-names>C</given-names> </name><name name-style="western"><surname>Wildes</surname><given-names>TS</given-names> </name><name name-style="western"><surname>Hall</surname><given-names>BL</given-names> </name><name name-style="western"><surname>Kannampallil</surname><given-names>T</given-names> </name></person-group><article-title>Personalized surgical transfusion risk prediction using machine learning to guide preoperative type and screen orders</article-title><source>Anesthesiology</source><year>2022</year><month>07</month><day>1</day><volume>137</volume><issue>1</issue><fpage>55</fpage><lpage>66</lpage><pub-id pub-id-type="doi">10.1097/ALN.0000000000004139</pub-id><pub-id pub-id-type="medline">35147666</pub-id></nlm-citation></ref><ref id="ref42"><label>42</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Zapf</surname><given-names>MAC</given-names> </name><name name-style="western"><surname>Fabbri</surname><given-names>DV</given-names> </name><name name-style="western"><surname>Andrews</surname><given-names>J</given-names> </name><etal/></person-group><article-title>Development of a machine learning model to predict intraoperative transfusion and guide type and screen ordering</article-title><source>J Clin Anesth</source><year>2023</year><month>12</month><volume>91</volume><fpage>111272</fpage><pub-id pub-id-type="doi">10.1016/j.jclinane.2023.111272</pub-id><pub-id pub-id-type="medline">37774648</pub-id></nlm-citation></ref><ref id="ref43"><label>43</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lee</surname><given-names>SM</given-names> </name><name name-style="western"><surname>Lee</surname><given-names>G</given-names> </name><name name-style="western"><surname>Kim</surname><given-names>TK</given-names> </name><etal/></person-group><article-title>Development and validation of a prediction model for need for massive transfusion during surgery using intraoperative hemodynamic monitoring data</article-title><source>JAMA Netw Open</source><year>2022</year><month>12</month><day>1</day><volume>5</volume><issue>12</issue><fpage>e2246637</fpage><pub-id pub-id-type="doi">10.1001/jamanetworkopen.2022.46637</pub-id><pub-id pub-id-type="medline">36515949</pub-id></nlm-citation></ref><ref id="ref44"><label>44</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lang</surname><given-names>FF</given-names> </name><name name-style="western"><surname>Liu</surname><given-names>LY</given-names> </name><name name-style="western"><surname>Wang</surname><given-names>SW</given-names> </name></person-group><article-title>Predictive modeling of perioperative blood transfusion in lumbar posterior interbody fusion using machine learning</article-title><source>Front Physiol</source><year>2023</year><volume>14</volume><fpage>1306453</fpage><pub-id pub-id-type="doi">10.3389/fphys.2023.1306453</pub-id><pub-id pub-id-type="medline">38187137</pub-id></nlm-citation></ref></ref-list><app-group><supplementary-material id="app1"><label>Checklist 1</label><p>PRISMA checklist.</p><media xlink:href="medinform_v14i1e80930_app1.pdf" xlink:title="PDF File, 562 KB"/></supplementary-material></app-group></back></article>