<?xml version="1.0" encoding="UTF-8"?><!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "journalpublishing.dtd"><article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" dtd-version="2.0" xml:lang="en" article-type="research-article"><front><journal-meta><journal-id journal-id-type="nlm-ta">JMIR Med Inform</journal-id><journal-id journal-id-type="publisher-id">medinform</journal-id><journal-id journal-id-type="index">7</journal-id><journal-title>JMIR Medical Informatics</journal-title><abbrev-journal-title>JMIR Med Inform</abbrev-journal-title><issn pub-type="epub">2291-9694</issn><publisher><publisher-name>JMIR Publications</publisher-name><publisher-loc>Toronto, Canada</publisher-loc></publisher></journal-meta><article-meta><article-id pub-id-type="publisher-id">v13i1e70857</article-id><article-id pub-id-type="doi">10.2196/70857</article-id><article-categories><subj-group subj-group-type="heading"><subject>Original Paper</subject></subj-group></article-categories><title-group><article-title>Using Machine Learning to Predict-Then-Optimize Elective Orthopedic Surgery Scheduling to Improve Operating Room Utilization: Retrospective Study</article-title></title-group><contrib-group><contrib contrib-type="author" equal-contrib="yes"><name name-style="western"><surname>Lex</surname><given-names>Johnathan R</given-names></name><degrees>MBChB, MASc</degrees><xref ref-type="aff" rid="aff1">1</xref><xref ref-type="aff" rid="aff2">2</xref><xref ref-type="aff" rid="aff3">3</xref><xref ref-type="fn" rid="equal-contrib1">*</xref></contrib><contrib contrib-type="author" corresp="yes" equal-contrib="yes"><name name-style="western"><surname>Abbas</surname><given-names>Aazad</given-names></name><degrees>MD</degrees><xref ref-type="aff" rid="aff1">1</xref><xref ref-type="aff" rid="aff2">2</xref><xref ref-type="aff" rid="aff3">3</xref><xref ref-type="fn" rid="equal-contrib1">*</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Mosseri</surname><given-names>Jacob</given-names></name><degrees>MASc</degrees><xref ref-type="aff" rid="aff1">1</xref><xref ref-type="aff" rid="aff4">4</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Singh Toor</surname><given-names>Jay</given-names></name><degrees>MD, MBA</degrees><xref ref-type="aff" rid="aff5">5</xref><xref ref-type="aff" rid="aff6">6</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Simone</surname><given-names>Michael</given-names></name><degrees>BASc</degrees><xref ref-type="aff" rid="aff1">1</xref><xref ref-type="aff" rid="aff4">4</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Ravi</surname><given-names>Bheeshma</given-names></name><degrees>MD, PhD</degrees><xref ref-type="aff" rid="aff3">3</xref><xref ref-type="aff" rid="aff7">7</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Whyne</surname><given-names>Cari</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff1">1</xref><xref ref-type="aff" rid="aff2">2</xref><xref ref-type="aff" rid="aff3">3</xref><xref ref-type="aff" rid="aff7">7</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Khalil</surname><given-names>Elias B</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff4">4</xref></contrib></contrib-group><aff id="aff1"><institution>Orthopaedic Biomechanics Lab, Sunnybrook Research Institute</institution><addr-line>2075 Bayview Avenue, Suite S620</addr-line><addr-line>Toronto</addr-line><addr-line>ON</addr-line><country>Canada</country></aff><aff id="aff2"><institution>Institute of Biomedical Engineering, University of Toronto</institution><addr-line>Toronto</addr-line><addr-line>ON</addr-line><country>Canada</country></aff><aff id="aff3"><institution>Department of Surgery, Division of Orthopedic Surgery, University of Toronto</institution><addr-line>149 College St</addr-line><addr-line>Toronto</addr-line><addr-line>ON</addr-line><country>Canada</country></aff><aff id="aff4"><institution>Department of Mechanical and Industrial Engineering, Faculty of Engineering, University of Toronto</institution><addr-line>Toronto</addr-line><addr-line>ON</addr-line><country>Canada</country></aff><aff id="aff5"><institution>Winnipeg Spine Program, Health Sciences Centre, Department of Surgery, University of Manitoba</institution><addr-line>Manitoba</addr-line><country>Canada</country></aff><aff id="aff6"><institution>Orthopaedic Surgery Section, Department of Surgery, University of Manitoba</institution><addr-line>Manitoba</addr-line><country>Canada</country></aff><aff id="aff7"><institution>Division of Orthopaedic Surgery, Department of Surgery, Sunnybrook Health Science Centre</institution><addr-line>Toronto</addr-line><addr-line>ON</addr-line><country>Canada</country></aff><contrib-group><contrib contrib-type="editor"><name name-style="western"><surname>Benis</surname><given-names>Arriel</given-names></name></contrib></contrib-group><contrib-group><contrib contrib-type="reviewer"><name name-style="western"><surname>Wang</surname><given-names>Chia -Hung</given-names></name></contrib><contrib contrib-type="reviewer"><name name-style="western"><surname>Subih</surname><given-names>Murad</given-names></name></contrib></contrib-group><author-notes><corresp>Correspondence to Aazad Abbas, MD, Orthopaedic Biomechanics Lab, Sunnybrook Research Institute, 2075 Bayview Avenue, Suite S620, Toronto, ON, M4N 3M5, Canada; <email>aazad.abbas@mail.utoronto.ca</email></corresp><fn fn-type="equal" id="equal-contrib1"><label>*</label><p>these authors contributed equally</p></fn></author-notes><pub-date pub-type="collection"><year>2025</year></pub-date><pub-date pub-type="epub"><day>10</day><month>9</month><year>2025</year></pub-date><volume>13</volume><elocation-id>e70857</elocation-id><history><date date-type="received"><day>03</day><month>01</month><year>2025</year></date><date date-type="rev-recd"><day>23</day><month>07</month><year>2025</year></date><date date-type="accepted"><day>28</day><month>07</month><year>2025</year></date></history><copyright-statement>&#x00A9; Johnathan R Lex, Aazad Abbas, Jacob Mosseri, Jay Singh Toor, Michael Simone, Bheeshma Ravi, Cari Whyne, Elias B Khalil. Originally published in JMIR Medical Informatics (<ext-link ext-link-type="uri" xlink:href="https://medinform.jmir.org">https://medinform.jmir.org</ext-link>), 10.9.2025. </copyright-statement><copyright-year>2025</copyright-year><license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (<ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">https://creativecommons.org/licenses/by/4.0/</ext-link>), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Medical Informatics, is properly cited. The complete bibliographic information, a link to the original publication on <ext-link ext-link-type="uri" xlink:href="https://medinform.jmir.org/">https://medinform.jmir.org/</ext-link>, as well as this copyright and license information must be included.</p></license><self-uri xlink:type="simple" xlink:href="https://medinform.jmir.org/2025/1/e70857"/><abstract><sec><title>Background</title><p>Total knee and hip arthroplasty (TKA and THA) are among the most performed elective procedures. Rising demand and the resource-intensive nature of these procedures have contributed to longer wait times despite significant health care investment. Current scheduling methods often rely on average surgical durations, overlooking patient-specific variability.</p></sec><sec><title>Objective</title><p>To determine the potential for improving elective surgery scheduling for TKA and THA, respectively, by using a 2-stage approach that incorporates machine learning (ML) prediction of the duration of surgery (DOS) with scheduling optimization.</p></sec><sec sec-type="methods"><title>Methods</title><p>In total, 2 ML models (one each for TKA and THA) were trained to predict DOS using patient factors based on 302,490 and 196,942 patients, respectively, from a large international database. In total, 3 optimization formulations based on varying surgeon flexibility were compared: Any (surgeons could operate in any operating room at any time), Split (limitation of 2 surgeons per operating room per day), and multiple subset sum problem (MSSP; limit of 1 surgeon per operating room per day). Two years of daily scheduling simulations were performed for each optimization problem using ML prediction or mean DOS over a range of schedule parameters. Constraints and resources were based on a high-volume arthroplasty hospital in Canada.</p></sec><sec sec-type="results"><title>Results</title><p>The TKA and THA prediction models achieved test accuracy (with a 30 min buffer) of 78.1% (mean squared error 0.898) and 75.4% (mean squared error 0.916), respectively. Any scheduling formulation performed significantly worse than the Split and MSSP formulations with respect to overtime and underutilization (<italic>P</italic>&#x003C;.001). The latter 2 problems performed similarly (<italic>P</italic>&#x003E;.05) over most schedule parameters. The ML prediction schedules outperformed those generated using a mean DOS for most scheduling parameters, with overtime reduced on average by 300-500 minutes per week (12&#x2010;20 min per operating room per day; <italic>P</italic>&#x003C;.001). However, there was more operating room underutilization with the ML prediction schedules, with it ranging from 70&#x2010;192 minutes more underutilization (<italic>P</italic>&#x003C;.001). Using a 15-minute schedule granularity with a waitlist pool of a minimum of 1 month generated the ML schedule that outperformed the mean schedule 97.1% of times.</p></sec><sec sec-type="conclusions"><title>Conclusions</title><p>Assuming a full waiting list, optimizing an individual surgeon&#x2019;s elective operating room time using an ML-assisted predict-then-optimize scheduling system improves overall operating room efficiency, significantly decreasing overtime. This has significant potential implications for health care systems struggling with pressures of rising costs and growing operative waitlists.</p></sec></abstract><kwd-group><kwd>machine learning</kwd><kwd>orthopedic surgery</kwd><kwd>optimization</kwd><kwd>elective surgery</kwd><kwd>scheduling</kwd><kwd>hip and knee arthroplasty</kwd></kwd-group></article-meta></front><body><sec id="s1" sec-type="intro"><title>Introduction</title><p>Total knee and hip arthroplasty (TKA and THA, respectively) are the gold-standard treatment for end-stage arthritis of the hip and knee joints. These procedures are the first and second most frequently performed in the United States, excluding maternal and neonatal procedures [<xref ref-type="bibr" rid="ref1">1</xref>]. In 2018, 1.3 million of these procedures were performed in the United States, a 21.9% increase from 2008 [<xref ref-type="bibr" rid="ref1">1</xref>]. This number will continue to increase globally due to an aging population and the ongoing obesity pandemic [<xref ref-type="bibr" rid="ref2">2</xref>,<xref ref-type="bibr" rid="ref3">3</xref>]. The ubiquity of these procedures correlates strongly with their burden on health care systems globally. In the United States, approximately 5% of the gross domestic product is to care for musculoskeletal conditions [<xref ref-type="bibr" rid="ref4">4</xref>,<xref ref-type="bibr" rid="ref5">5</xref>]. Despite this spending, wait times for elective surgical procedures in OECD countries continue to increase, conferring extended periods of time with poor quality of life for TKA and THA patients [<xref ref-type="bibr" rid="ref6">6</xref>,<xref ref-type="bibr" rid="ref7">7</xref>]. For these reasons, there is a growing interest and research into improving the efficiency and cost-effectiveness of arthritis care [<xref ref-type="bibr" rid="ref8">8</xref>,<xref ref-type="bibr" rid="ref9">9</xref>].</p><p>Most research has focused purely on the prediction of duration of surgery (DOS) or the optimization of operating room scheduling, ignoring their inherent interrelation [<xref ref-type="bibr" rid="ref10">10</xref>-<xref ref-type="bibr" rid="ref14">14</xref>]. More recently, these approaches have been combined to plan post-surgical beds and plan emergency surgeries based on predicted priority with varying results [<xref ref-type="bibr" rid="ref15">15</xref>,<xref ref-type="bibr" rid="ref16">16</xref>]. DOS prediction models typically represent a large volume of varying procedures, spanning multiple surgical specialties with limited practical applications. Classic regression modeling in orthopedics has identified age, BMI, surgical procedure, primary or revision, and gender as important variables affecting DOS predictions [<xref ref-type="bibr" rid="ref17">17</xref>,<xref ref-type="bibr" rid="ref18">18</xref>]. Machine learning (ML) models have been applied to predict DOS for various surgeries [<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref12">12</xref>,<xref ref-type="bibr" rid="ref19">19</xref>-<xref ref-type="bibr" rid="ref24">24</xref>]. However, in practice, mean time or surgeon-specific rolling mean time is typically used to generate schedules at the operational level.</p><p>Research evaluating the optimization of surgery scheduling has been performed using an average or a randomly sampled (typically from a lognormal distribution) DOS value prior to optimizing a schedule through integer linear programming based on either the multiple knapsack or job-shop scheduling problem [<xref ref-type="bibr" rid="ref25">25</xref>-<xref ref-type="bibr" rid="ref27">27</xref>]. Stochastic programming and distributionally robust optimization have also been attempted to mitigate the effects of an uncertain DOS, but these approaches assume a distribution of DOS rather than using specific features to aid in prediction [<xref ref-type="bibr" rid="ref28">28</xref>].</p><p>To our knowledge, no prior work has combined patient-level DOS predictions with schedule optimization to create an optimized surgical schedule at the operational level. It is known that neural networks are strong predictors of DOS; however, their realizable improvements when implemented over various surgical schedule optimization problems, while performing simulations accounting for real-world constraints, remain unclear [<xref ref-type="bibr" rid="ref23">23</xref>,<xref ref-type="bibr" rid="ref24">24</xref>]. The primary aim of this paper was to determine if a 2-stage approach using an ML model for prediction of DOS paired with schedule optimization improves operating room overutilization or underutilization compared to using the mean DOS. Secondary objectives were to determine the effect of schedule granularity and length of surgeon waitlist on scheduling accuracy.</p></sec><sec id="s2" sec-type="methods"><title>Methods</title><sec id="s2-1"><title>Ethical Considerations</title><p>This retrospective study analyzed deidentified American College of Surgeons National Surgical Quality Improvement (ACS NSQIP) data. The study was approved by the Institutional Research Ethics Board (Sunnybrook Health Sciences Center, Project REB ID #4899). Informed consent was waived due to the secondary, minimal-risk nature of the analysis. No local institutional patient data were used. Privacy and confidentiality were protected in accordance with institutional and journal policies. Data use complied with NSQIP data-use agreements. The study adhered to the Declaration of Helsinki.</p></sec><sec id="s2-2"><title>Setting</title><p>Population-level data from the ACS NSQIP database were used to generate prediction models. This database compiles patient and outcome data following surgery from over 700 hospitals in North America, capturing over 1 million surgeries per year, with a high level of accuracy [<xref ref-type="bibr" rid="ref29">29</xref>]. The database was queried for all TKA and THA surgical procedures performed between 2014 and 2019. The actual DOS times as reported in the ACS NSQIP dataset were used to inform simulated daily operating room schedules. A flowchart that helps visualize the overall 2-stage approach is shown in <xref ref-type="fig" rid="figure1">Figure 1</xref>.</p><fig position="float" id="figure1"><label>Figure 1.</label><caption><p>High-level overview of the predict-then-optimize approach. ACS NSQIP: American College of Surgeons National Surgical Quality Improvement Program; DOS: duration of surgery; MSSP: multiple subset sum problem.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="medinform_v13i1e70857_fig01.png"/></fig></sec><sec id="s2-3"><title>Duration of Surgery Prediction</title><p>Data pertaining to 302,490 TKA and 196,942 THA procedures performed during this period as identified from the ACS NSQIP database were used to train models to predict DOS. DOS predictions were done as per Abbas et al [<xref ref-type="bibr" rid="ref23">23</xref>,<xref ref-type="bibr" rid="ref24">24</xref>]. They identified a PyTorch multilayer perceptron model that outperformed 10 alternative ML models for predicting DOS for TKA and THA [<xref ref-type="bibr" rid="ref23">23</xref>,<xref ref-type="bibr" rid="ref24">24</xref>]. Both models were trained on procedures from 2014 to 2017, hyperparameters tuned with Ray on procedures from 2018, and evaluated on procedures from 2019 [<xref ref-type="bibr" rid="ref23">23</xref>,<xref ref-type="bibr" rid="ref24">24</xref>,<xref ref-type="bibr" rid="ref30">30</xref>,<xref ref-type="bibr" rid="ref31">31</xref>]. These models were generated using the Niagara supercomputer at the SciNet HPC Consortium [<xref ref-type="bibr" rid="ref32">32</xref>]. Predictions of DOS from the test subsets of data were used in the optimization model. Refer to the study by Abbas et al [<xref ref-type="bibr" rid="ref23">23</xref>,<xref ref-type="bibr" rid="ref24">24</xref>] for further details regarding the DOS prediction, model development, hyperparameter tuning, and feature importance.</p></sec><sec id="s2-4"><title>Schedule Optimization Formulations</title><sec id="s2-4-1"><title>Assumptions</title><p>The generated scheduling model considered elective case scheduling, in which surgeries are planned for in advance. The constraints and available resources for the model were generated using real-world constraints from the authors&#x2019; institution, the highest-volume elective arthroplasty hospital in Canada. This included cleaning time (30 min), number of operating rooms (n=5), number of surgeons (n=11), and days a surgeon was unavailable in a week. The planning horizon of 1 week (5 workdays) was also based on these constraints. The penalty for an individual operating room running overtime (after 5 pm), &#x03BB;, was chosen to be double the value of daytime operating room underutilization. This was due to the approximate additional costs associated with operating room staff working after hours. The following assumptions regarding scheduling were made: surgeons are available to operate any day anytime except for 0&#x2010;2 randomly selected days per week per surgeon, and once a surgery is assigned to a surgeon, they must perform it (ie, no sharing patients). These assumptions were made as the study did not have access to historical data on surgeon availability from the authors&#x2019; institution. There were no constraints placed on the schedule based on staffing or patient beds in the recovery unit or ward.</p></sec><sec id="s2-4-2"><title>Optimization Formulations</title><p>In total, 3 scheduling optimization problems were formulated. All formulations were based on an integer linear programming framework that has been used for many different scheduling problems, including but not limited to surgery scheduling [<xref ref-type="bibr" rid="ref27">27</xref>,<xref ref-type="bibr" rid="ref33">33</xref>]. The first, &#x201C;Any,&#x201D; was adapted from Marques et al [<xref ref-type="bibr" rid="ref27">27</xref>] with notable modifications including the addition of an overtime penalty and only considering 1 surgery specialty. &#x201C;Any&#x201D; allows any surgery to be scheduled at any time of day in any room subject to the constraints that no surgeries in a room overlap, and that no surgeon is operating in 2 rooms simultaneously. The second formulation, &#x201C;Split,&#x201D; is the same as &#x201C;Any&#x201D; but enforces a maximum of 2 surgeons per operating room on a given day and a maximum of 1 room per surgeon per day. This was chosen as it is common when there are rooms that may be split between 2 surgeons if 1 surgeon cannot fill the room for that particular day. Finally, the third formulation is akin to a max-sum multiple subset sum problem and is thus referred to as &#x201C;MSSP.&#x201D; It enforces 1 surgeon per operating room on a given day, simplified into multiple optimization problems for each surgeon, following a fair distribution of rooms among surgeons. This is the most common configuration used on a clinical basis, where one surgeon has one operative room dedicated to their cases per day. &#x201C;Any&#x201D; is the most flexible optimization formulation, ie, the least constrained of the 3. &#x201C;Split&#x201D; and &#x201D;Any&#x201D; impose additional constraints on feasible schedules and reflect realistic logistical restrictions that a hospital may want to impose, eg, having a surgeon use the same room on any given day. Details of these formulations are found in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>.</p></sec><sec id="s2-4-3"><title>Simulated Schedule Generation</title><p>Using the ACS NSQIP data, simulated schedules were generated using each optimization formulation, with schedule parameters as follows. Schedule granularity of 10- and 15-minute block times was considered. These sizes were chosen to ensure interpretable schedule generation. Surgery completion times were rounded up to the nearest block. The effect of surgeon waitlist size on schedule accuracy was also evaluated. Waitlist sizes representing 2 weeks (n=250), 4 weeks (n=500), 8 weeks (n=1000), and 12 weeks (n=1500) were considered. The cases within the waitlist were all given the same priority to be booked (no rank by time), unless randomly considered to be of high priority.</p><p>Three different versions of each model with the above schedule parameters were created. The first model used the ML-predicted DOS values for THA and TKA; this is the novel 2-stage approach of predicting then optimizing that we are proposing in this work. The second model used the mean DOS for each different type of surgery (THA and TKA) in order to obtain a schedule that mimics the current operating room schedule. Finally, a hindsight model was created that used the true DOS values to provide an upper bound on the best possible schedule that could be generated with perfect information (100% accurate to the minute). Each of these 3 simulations was performed 104 times (to represent 2 y) using a random sample of surgeries from the testing set.</p></sec><sec id="s2-4-4"><title>Scheduling Comparisons</title><p>To compare the 3 schedule optimization formulations (Any, Split, and MSSP), the results of the 2-stage predict-then-optimize simulation results across all schedule parameter combinations were assessed. To evaluate the efficacy of the 2-stage schedule generation technique, it was compared to the results of scheduling by 2 other techniques: the mean DOS for each surgery (the current gold standard at most institutions) and the hindsight schedule. Each of these 3 schedules was constructed for each week of the simulation, and metrics consisting of overtime, underutilization, and the objective function value were calculated for each schedule. Student&#x2019;s t-test was used to compare the effect between scheduling formulations. Overtime and underutilization for 2-stage and mean DOS schedules over the simulated weeks were compared using the paired Wilcoxon signed-rank test, as the same surgical cases were randomly selected for each generated schedule. The effect of schedule granularity and considered waitlist size was evaluated using unpaired Student&#x2019;s <italic>t</italic>-test and analysis of variance as these were grouped over multiple selections of random cases. <italic>P</italic> values of &#x003C;.05 were considered statistically significant.</p></sec></sec></sec><sec id="s3" sec-type="results"><title>Results</title><sec id="s3-1"><title>Prediction Model Accuracy</title><p>Demographic details of patients included are found in <xref ref-type="supplementary-material" rid="app2">Multimedia Appendix 2</xref>. A summary of the DOS prediction models is found in <xref ref-type="supplementary-material" rid="app3">Multimedia Appendix 3</xref>. The TKA prediction model obtained a training accuracy (with a 30 min buffer) of 76.9% and a training mean squared error (MSE) of 0.904. The validation accuracy was 77.7% with an MSE of 0.904. The test accuracy was 78.1% with an MSE of 0.898. The THA prediction model obtained a training accuracy of 74.0% and a training MSE of 0.888. The validation accuracy was 75.0% with an MSE of 0.910, and the test accuracy was 75.4% with an MSE of 0.916.</p></sec><sec id="s3-2"><title>Schedule Optimization Formulation Comparison</title><p>Overall, the Any scheduling optimization formulation exhibited the poorest performance across all different schedule parameter combinations (<xref ref-type="table" rid="table1">Table 1</xref>). There was no significant difference in overtime across all schedule parameters between the Split and MSSP formulations. For 2 combinations of schedule parameters (10 min granularity, 1500 waitlist size and 15 min granularity, 1500 waitlist size), there was significantly less operating room underutilization with the MSSP formulation; however, this was only 10.9 minutes and 15.4 minutes, respectively, on average over an entire week (<xref ref-type="table" rid="table1">Table 1</xref>). In contrast, for 15-minute granularity and a 250-waitlist size, there was significantly more operating room underutilization with MSSP compared to the Split formulation, 42.3 minutes over an entire week (<xref ref-type="table" rid="table1">Table 1</xref>). <xref ref-type="fig" rid="figure2">Figures 2</xref> and <xref ref-type="fig" rid="figure3">3</xref> display this comparison for overtime and underutilization across all 3 optimization problems, respectively.</p><table-wrap id="t1" position="float"><label>Table 1.</label><caption><p>Simulated schedule results for 2-stage (predict-then-optimize) for each schedule optimization formulation. The mean number of cases/week is not significant between any schedule optimization formulations.</p></caption><table id="table1" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Schedule parameters</td><td align="left" valign="bottom">Overtime min/week, mean (SD)</td><td align="left" valign="bottom" colspan="2"><italic>P</italic> value</td><td align="left" valign="bottom">Underutilization min/week, mean (SD)</td><td align="left" valign="bottom" colspan="2"><italic>P</italic> value</td><td align="left" valign="bottom">Mean cases/week (SD)</td></tr></thead><tbody><tr><td align="left" valign="top" colspan="8">Granularity=10 minutes, waitlist=250 patients (2 wk)</td></tr><tr><td align="left" valign="top">Any</td><td align="left" valign="top">1335.7 (322.1)</td><td align="left" valign="top">Reference</td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">669.1 (189.1)</td><td align="left" valign="top">Reference</td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">125.0 (0.2)</td></tr><tr><td align="left" valign="top">Split</td><td align="left" valign="top">1003.8 (238.1)</td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">Reference</td><td align="left" valign="top">285.2 (117.4)</td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">Reference</td><td align="left" valign="top">125.0 (0.2)</td></tr><tr><td align="left" valign="top">MSSP<sup><xref ref-type="table-fn" rid="table1fn1">a</xref></sup></td><td align="left" valign="top">1010.9 (211.3)</td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">.82</td><td align="left" valign="top">309.7 (128.7)</td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">.15</td><td align="left" valign="top">124.2 (0.9)</td></tr><tr><td align="left" valign="top" colspan="8">Granularity=10 minutes, waitlist=500 patients (4 wk)</td></tr><tr><td align="left" valign="top">Any</td><td align="left" valign="top">1410.4 (331.2)</td><td align="left" valign="top">Reference</td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">694.4 (157.0)</td><td align="left" valign="top">Reference</td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">125.0 (0.2)</td></tr><tr><td align="left" valign="top">Split</td><td align="left" valign="top">966.7 (232.9)</td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">Reference</td><td align="left" valign="top">300.8 (113.9)</td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">Reference</td><td align="left" valign="top">125.0 (0.1)</td></tr><tr><td align="left" valign="top">MSSP</td><td align="left" valign="top">988.6 (216.3)</td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">.49</td><td align="left" valign="top">298.8 (119.8)</td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">.91</td><td align="left" valign="top">124.9 (0.2)</td></tr><tr><td align="left" valign="top" colspan="8">Granularity=10 minutes, waitlist=1000 patients (8 wk)</td></tr><tr><td align="left" valign="top">Any</td><td align="left" valign="top">1368.8 (310.0)</td><td align="left" valign="top">Reference</td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">689.6 (183.7)</td><td align="left" valign="top">Reference</td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">124.9 (0.3)</td></tr><tr><td align="left" valign="top">Split</td><td align="left" valign="top">964.0 (243.9)</td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">Reference</td><td align="left" valign="top">301.6 (119.9)</td><td align="left" valign="top">&#x003C;0.001</td><td align="left" valign="top">Reference</td><td align="left" valign="top">125.0 (0.2)</td></tr><tr><td align="left" valign="top">MSSP</td><td align="left" valign="top">954.9 (225.7)</td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">.78</td><td align="left" valign="top">306.3 (112.8)</td><td align="left" valign="top">&#x003C;0.001</td><td align="left" valign="top">.78</td><td align="left" valign="top">124.7 (0.6)</td></tr><tr><td align="left" valign="top" colspan="8">Granularity=10 minutes, waitlist=1500 patients (12 wk)</td></tr><tr><td align="left" valign="top">Any</td><td align="left" valign="top">1267.9 (321.9)</td><td align="left" valign="top">Reference</td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">657.7 (165.2)</td><td align="left" valign="top">Reference</td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">124.8 (0.4)</td></tr><tr><td align="left" valign="top">Split</td><td align="left" valign="top">972.2 (225.2)</td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">Reference</td><td align="left" valign="top">325.9 (114.8)</td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">Reference</td><td align="left" valign="top">124.9 (0.3)</td></tr><tr><td align="left" valign="top">MSSP</td><td align="left" valign="top">981.3 (199.0)</td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">.34</td><td align="left" valign="top">315.0 (109.9)</td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">124.3 (0.7)</td></tr><tr><td align="left" valign="top" colspan="8">Granularity=15 minutes, waitlist=250 patients (2 wk)</td></tr><tr><td align="left" valign="top">Any</td><td align="left" valign="top">1416.2 (357.7)</td><td align="left" valign="top">Reference</td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">702.3 (185.5)</td><td align="left" valign="top">Reference</td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">123.4 (1.8)</td></tr><tr><td align="left" valign="top">Split</td><td align="left" valign="top">985.1 (235.6)</td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">Reference</td><td align="left" valign="top">307.6 (119.9)</td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">Reference</td><td align="left" valign="top">123.1 (1.9)</td></tr><tr><td align="left" valign="top">MSSP</td><td align="left" valign="top">977.9 (229.7)</td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">.82</td><td align="left" valign="top">349.9 (144.4)</td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">.02</td><td align="left" valign="top">121.6 (1.5)</td></tr><tr><td align="left" valign="top" colspan="8">Granularity=15 minutes, waitlist=500 patients (4 wk)</td></tr><tr><td align="left" valign="top">Any</td><td align="left" valign="top">1450.8 (331.3)</td><td align="left" valign="top">Reference</td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">674.4 (167.6)</td><td align="left" valign="top">Reference</td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">124.8 (0.4)</td></tr><tr><td align="left" valign="top">Split</td><td align="left" valign="top">1016.3 (240.1)</td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">Reference</td><td align="left" valign="top">273.9 (104.0)</td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">Reference</td><td align="left" valign="top">124.9 (0.3)</td></tr><tr><td align="left" valign="top">MSSP</td><td align="left" valign="top">1025.6 (235.9)</td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">.78</td><td align="left" valign="top">263.7 (111.3)</td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">.50</td><td align="left" valign="top">124.6 (0.7)</td></tr><tr><td align="left" valign="top" colspan="8">Granularity=15 minutes, waitlist=1000 patients (8 wk)</td></tr><tr><td align="left" valign="top">Any</td><td align="left" valign="top">1434.7 (324.7)</td><td align="left" valign="top">Reference</td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">669.7 (160.8)</td><td align="left" valign="top">Reference</td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">124.6 (0.7)</td></tr><tr><td align="left" valign="top">Split</td><td align="left" valign="top">1039.3 (229.5)</td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">Reference</td><td align="left" valign="top">242.0 (99.3)</td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">Reference</td><td align="left" valign="top">124.9 (0.4)</td></tr><tr><td align="left" valign="top">MSSP</td><td align="left" valign="top">1040.8 (230.6)</td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">.96</td><td align="left" valign="top">260.5 (100.1)</td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">.19</td><td align="left" valign="top">124.8 (0.5)</td></tr><tr><td align="left" valign="top" colspan="8">Granularity=15 minutes, waitlist=1500 patients (12 wk)</td></tr><tr><td align="left" valign="top">Any</td><td align="left" valign="top">1369.9 (356.1)</td><td align="left" valign="top">Reference</td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">641.3 (153.5)</td><td align="left" valign="top">Reference</td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">123.8 (1.2)</td></tr><tr><td align="left" valign="top">Split</td><td align="left" valign="top">996.2 (207.1)</td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">Reference</td><td align="left" valign="top">294.1 (108.3)</td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">Reference</td><td align="left" valign="top">124.5 (0.7)</td></tr><tr><td align="left" valign="top">MSSP</td><td align="left" valign="top">988.6 (229.9)</td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">.59</td><td align="left" valign="top">278.7 (113.1)</td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">.001</td><td align="left" valign="top">124.5 (0.7)</td></tr></tbody></table><table-wrap-foot><fn id="table1fn1"><p><sup>a</sup>MSSP: multiple subset sum problem.</p></fn></table-wrap-foot></table-wrap><fig position="float" id="figure2"><label>Figure 2.</label><caption><p>Mean overtime for each schedule optimization formulation across all schedule parameter combinations. MSSP: multiple subset sum problem.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="medinform_v13i1e70857_fig02.png"/></fig><fig position="float" id="figure3"><label>Figure 3.</label><caption><p>Mean underutilization for each schedule optimization formulation across all schedule parameter combinations. MSSP: multiple subset sum problem.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="medinform_v13i1e70857_fig03.png"/></fig></sec><sec id="s3-3"><title>Simulated Schedule Comparison</title><p>As the MSSP scheduling formulation performed best across all schedule parameters, it was used in all further analyses. The 2-stage predict-then-optimize approach performed better than using mean DOS for over 80% of weekly schedules in terms of objective optimization problem value across all schedule parameter combinations. This difference was more consistent across the schedules generated using 15-minute schedule granularity size, where 2-stage was superior to mean in over 90% of simulated schedules (<xref ref-type="table" rid="table2">Table 2</xref>). There was less overtime across all schedule parameters when using the 2-stage approach (<italic>P</italic>&#x003C;.001), equating to an average decrease in overtime of 300-500 minutes per week at the simulated hospital (or 12-20 min per operating room per day). However, there was more operating room underutilization with the 2-stage approach across all schedule parameters (<xref ref-type="table" rid="table3">Table 3</xref>; <italic>P</italic>&#x003C;.001). As expected, the hindsight schedule was nearly perfect for all generated schedules and was significantly better than the 2-stage or mean approach with respect to objective value, overtime, and underutilization (<xref ref-type="table" rid="table3">Table 3</xref>). Despite a statistically significant difference, there was no clinically realizable difference in the number of cases performed between the 2-stage and mean groups; however, the hindsight formulation scheduled less cases than both the mean and the 2-stage approach (mean of approximately 12 fewer cases per wk). Details regarding the Any and Split scheduling formulation results are found in <xref ref-type="supplementary-material" rid="app4">Multimedia Appendices 4</xref> and <xref ref-type="supplementary-material" rid="app5">5</xref>, respectively.</p><p>The changes to schedule granularity and considered waitlist size did not influence the amount of overtime. However, there was significantly less operating room underutilization with the 15-minute granularity schedules (<italic>P</italic>=.02) and with waitlist sizes greater than 500, or 1 month considered (<italic>P</italic>&#x003C;.001) (<xref ref-type="table" rid="table4">Table 4</xref>).</p><table-wrap id="t2" position="float"><label>Table 2.</label><caption><p>Percentage of simulations in which the 2-stage performed better than mean for all schedule parameters using the MSSP schedule optimization formulation.</p></caption><table id="table2" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Granularity</td><td align="left" valign="bottom">250 cases</td><td align="left" valign="bottom">500 cases</td><td align="left" valign="bottom">1000 cases</td><td align="left" valign="bottom">1500 cases</td></tr></thead><tbody><tr><td align="left" valign="top">10 minutes</td><td align="left" valign="top">86.5</td><td align="left" valign="top">90.4</td><td align="left" valign="top">80.1</td><td align="left" valign="top">81.7</td></tr><tr><td align="left" valign="top">15 minutes</td><td align="left" valign="top">95.2</td><td align="left" valign="top">91.3</td><td align="left" valign="top">97.1</td><td align="left" valign="top">93.3</td></tr></tbody></table></table-wrap><table-wrap id="t3" position="float"><label>Table 3.</label><caption><p>Comparing 2-stage mean and hindsight durations of surgery using the multiple subset sum problem (MSSP) schedule optimization formulation.</p></caption><table id="table3" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Method</td><td align="left" valign="bottom">Overtime (min/week), mean (SD)</td><td align="left" valign="bottom"><italic>P</italic> value</td><td align="left" valign="bottom">Underutilization (min/week), mean (SD)</td><td align="left" valign="bottom"><italic>P</italic> value</td><td align="left" valign="bottom">Mean cases/week (SD)</td><td align="left" valign="bottom"><italic>P</italic> value</td></tr></thead><tbody><tr><td align="left" valign="top" colspan="7">Granularity=10 minutes, waitlist=250 patients (2 wk)</td></tr><tr><td align="left" valign="top">Two-stage</td><td align="left" valign="top">1010.9 (211.3)</td><td align="left" valign="top">Reference</td><td align="left" valign="top">309.7 (128.7)</td><td align="left" valign="top">Reference</td><td align="left" valign="top">124.2 (0.9)</td><td align="left" valign="top">Reference</td></tr><tr><td align="left" valign="top">Mean</td><td align="left" valign="top">1310.9 (296.9)</td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">218.7 (99.1)</td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">124.9 (0.5)</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top">Hindsight</td><td align="left" valign="top">0.4 (3.1)</td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">13.8 (52.8)</td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">112.5 (2.8)</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top" colspan="7">Granularity=10 minutes, waitlist=500 patients (4 wk)</td></tr><tr><td align="left" valign="top">Two-stage</td><td align="left" valign="top">988.6 (216.3)</td><td align="left" valign="top">Reference</td><td align="left" valign="top">298.8 (119.8)</td><td align="left" valign="top">Reference</td><td align="left" valign="top">124.9 (0.2)</td><td align="left" valign="top">Reference</td></tr><tr><td align="left" valign="top">Mean</td><td align="left" valign="top">1305.7 (242.2)</td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">220.8 (102.0)</td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">125.0 (0)</td><td align="left" valign="top">.01</td></tr><tr><td align="left" valign="top">Hindsight</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">112.8 (2.7)</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top" colspan="7">Granularity=10 minutes, waitlist=1000 patients (8 wk)</td></tr><tr><td align="left" valign="top">Two-stage</td><td align="left" valign="top">954.9 (225.7)</td><td align="left" valign="top">Reference</td><td align="left" valign="top">306.3 (112.8)</td><td align="left" valign="top">Reference</td><td align="left" valign="top">124.7 (0.6)</td><td align="left" valign="top">Reference</td></tr><tr><td align="left" valign="top">Mean</td><td align="left" valign="top">1276.3 (310.1)</td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">220.4 (101.5)</td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">125.0 (0)</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top">Hindsight</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">120.3 (3.4)</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top" colspan="7">Granularity=10 minutes, waitlist=1500 patients (12 wk)</td></tr><tr><td align="left" valign="top">Two-stage</td><td align="left" valign="top">981.3 (199.0)</td><td align="left" valign="top">Reference</td><td align="left" valign="top">315.0 (109.9)</td><td align="left" valign="top">Reference</td><td align="left" valign="top">124.3 (0.7)</td><td align="left" valign="top">Reference</td></tr><tr><td align="left" valign="top">Mean</td><td align="left" valign="top">1267.7 (224.0)</td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">223.4 (95.1)</td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">125.0 (0)</td><td align="left" valign="top">.24</td></tr><tr><td align="left" valign="top">Hindsight</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">0.0 (0)</td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">125.4 (3.9)</td><td align="left" valign="top">.006</td></tr><tr><td align="left" valign="top" colspan="7">Granularity=15 minutes, waitlist=250 patients (2 wk)</td></tr><tr><td align="left" valign="top">Two-stage</td><td align="left" valign="top">977.9 (229.7)</td><td align="left" valign="top">Reference</td><td align="left" valign="top">349.9 (144.4)</td><td align="left" valign="top">Reference</td><td align="left" valign="top">121.6 (1.5)</td><td align="left" valign="top">Reference</td></tr><tr><td align="left" valign="top">Mean</td><td align="left" valign="top">1485.0 (274.0)</td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">158.1 (107.4)</td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">124.9 (0.5)</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top">Hindsight</td><td align="left" valign="top">0.4 (3.3)</td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">15.7 (66.2)</td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">113.8 (2.5)</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top" colspan="7">Granularity=15 minutes, waitlist=500 patients (4 wk)</td></tr><tr><td align="left" valign="top">Two-stage</td><td align="left" valign="top">1025.6 (235.9)</td><td align="left" valign="top">Reference</td><td align="left" valign="top">263.7 (111.3)</td><td align="left" valign="top">Reference</td><td align="left" valign="top">124.6 (0.7)</td><td align="left" valign="top">Reference</td></tr><tr><td align="left" valign="top">Mean</td><td align="left" valign="top">1526.7 (275.6)</td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">149.3 (81.9)</td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">125.0 (0)</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top">Hindsight</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">116.1 (2.5)</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top" colspan="7">Granularity=15 minutes, waitlist=1000 patients (8 wk)</td></tr><tr><td align="left" valign="top">Two-stage</td><td align="left" valign="top">1040.8 (239.8)</td><td align="left" valign="top">Reference</td><td align="left" valign="top">260.5 (100.1)</td><td align="left" valign="top">Reference</td><td align="left" valign="top">124.8 (0.5)</td><td align="left" valign="top">Reference</td></tr><tr><td align="left" valign="top">Mean</td><td align="left" valign="top">1562.2 (262.0)</td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">140.6 (90.7)</td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">125.0 (0)</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top">Hindsight</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">119.0 (2.1)</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top" colspan="7">Granularity=15 minutes, waitlist=1500 patients (12 wk)</td></tr><tr><td align="left" valign="top">Two-stage</td><td align="left" valign="top">988.6 (229.9)</td><td align="left" valign="top">Reference</td><td align="left" valign="top">278.7 (113.1)</td><td align="left" valign="top">Reference</td><td align="left" valign="top">124.5 (0.7)</td><td align="left" valign="top">Reference</td></tr><tr><td align="left" valign="top">Mean</td><td align="left" valign="top">1540.0 (267.0)</td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">164.6 (79.8)</td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">125.0 (0)</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top">Hindsight</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">118.8 (2.4)</td><td align="left" valign="top">&#x003C;.001</td></tr></tbody></table></table-wrap><table-wrap id="t4" position="float"><label>Table 4.</label><caption><p>Comparing the impact of schedule parameters for the 2-stage multiple subset sum problem (MSSP).</p></caption><table id="table4" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Schedule parameters</td><td align="left" valign="bottom">Overtime, min/week, mean (SD)</td><td align="left" valign="bottom"><italic>P</italic> value</td><td align="left" valign="bottom">Underutilization, min/week, mean (SD)</td><td align="left" valign="bottom"><italic>P</italic> value</td></tr></thead><tbody><tr><td align="left" valign="top">Granularity</td><td align="left" valign="top"/><td align="left" valign="top">.12</td><td align="left" valign="top"/><td align="left" valign="top">.02</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>10 min</td><td align="left" valign="top">983.9 (213.9)</td><td align="left" valign="top" rowspan="2"/><td align="left" valign="top">307.5 (117.8)</td><td align="left" valign="top" rowspan="2"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>15 min</td><td align="left" valign="top">1008.2 (231.5)</td><td align="left" valign="top">288.2 (117.2)</td></tr><tr><td align="left" valign="top">Waitlist size</td><td align="left" valign="top"/><td align="left" valign="top">.79</td><td align="left" valign="top"/><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>250 (2 weeks)</td><td align="left" valign="top">994.4 (221.9)</td><td align="left" valign="top"/><td align="left" valign="top">329.8 (138.5)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>500 (4 weeks)</td><td align="left" valign="top">1007.1 (227.6)</td><td align="left" valign="top"/><td align="left" valign="top">281.25 (117.2)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>1000 (8 weeks)</td><td align="left" valign="top">997.8 (232.8)</td><td align="left" valign="top"/><td align="left" valign="top">283.4 (109.4)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>1500 (12 weeks)</td><td align="left" valign="top">984.9 (215.5)</td><td align="left" valign="top"/><td align="left" valign="top">296.8 (113.3)</td><td align="left" valign="top"/></tr></tbody></table></table-wrap></sec></sec><sec id="s4" sec-type="discussion"><title>Discussion</title><p>This paper compared 3 different scheduling optimization problems and evaluated a novel approach to surgical scheduling for TKAs and THAs using a combined 2-stage ML DOS prediction and optimization. There was no significant difference in operating room underutilization or overtime between the MSSP (one surgeon designated to one operating room per day) or Split (maximum of 2 surgeons designated for 1 operating room per day) optimization formulations. However, both performed significantly better than the Any (no limit on surgeons per operating room per day) formulation.</p><p>We believe this is due to the limitations of the predictions: underestimating the DOS of 1 case c being performed by surgeon h in room r can have cascading effects on another room r<sup>&#x2032;</sup> in which the same surgeon h is due to perform another surgery c<sup>&#x2032;</sup> at a later time. This causes additional overtime penalties for &#x201C;Any,&#x201D; something that the more restrictive &#x201C;Split&#x201D; and &#x201C;MSSP&#x201D; do not encounter. This is why, despite optimal solutions to &#x201C;Any&#x201D; being theoretically better than those of &#x201C;Split,&#x201D; they performed worse when simulated with the actual DOS.</p><p>Overall, the combined 2-stage approach significantly outperformed the current standard for scheduling cases, which is a case-specific mean surgery duration. This performance improvement was maintained across all schedule parameter combinations, including different schedule block granularity and different patient waitlist sizes considered. Despite this improvement, the 2-stage approach performed considerably worse than the hindsight schedule, highlighting the limitations of the current predictions that are based solely on preoperative patient data. Interestingly, there was no impact on overtime by varying schedule granularity or waitlist size; however, both of these impacted the amount of underutilization. The smaller waitlist size of 2 weeks of considered cases had a greater amount of underutilization, which was likely due to surgeons not having enough cases to fill their operating room time. Once a threshold was met at a 4-week pool of cases, there was no difference between groups. Also notable was the fact that when only considering a 2-week pool of cases, the Split optimization formulation outperformed MSSP, likely due to some surgeons not having enough cases to fill their time. Therefore, as the MSSP formulation is most practically implementable, it must be ensured that either the considered case pool is large enough or surgeons are allocated time when they have enough cases to fill an entire operating room day to avoid underutilization.</p><p>Errors in procedure length estimation by clinicians occur in approximately 75% of cases, with 32%&#x2010;50% of daily operating room schedules being underbooked and 37%&#x2010;42% overbooked [<xref ref-type="bibr" rid="ref34">34</xref>,<xref ref-type="bibr" rid="ref35">35</xref>]. This is compounded by the fact that less than 50% of operating time is spent doing surgery [<xref ref-type="bibr" rid="ref34">34</xref>]. Booking based on a historical mean is more accurate than when estimated by the surgical team, though less accurate than traditional ML approaches [<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref36">36</xref>-<xref ref-type="bibr" rid="ref38">38</xref>]. Previous approaches using computing to improve surgical scheduling have included schedule optimization or ML to predict DOS in isolation [<xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref21">21</xref>,<xref ref-type="bibr" rid="ref27">27</xref>,<xref ref-type="bibr" rid="ref37">37</xref>,<xref ref-type="bibr" rid="ref39">39</xref>,<xref ref-type="bibr" rid="ref40">40</xref>]. Other approaches to scheduling operating room utilization include the use of surgeon-specific mean DOS or a surgeon case-specific rolling average time. To our knowledge, these have not been compared to an ML prediction-based approach. Due to the lack of surgeon-specific details included in the ACS NSQIP dataset, we could not assess the efficacy of these approaches in the present study.</p><p>The implementation of this predict-then-optimize scheduling approach would face several challenges in the real world. The MSSP optimization model is in line with current surgical scheduling practices at most hospitals. This formulation optimizes a specific surgeon&#x2019;s waiting list, increasing their ability to accurately plan their day while ensuring a fair distribution of time (by operating room days) for each surgeon. However, attempting to implement the other optimization formulations (Split and Any) may be faced with resistance by end-users. Particularly, using the Any formulation, surgeons may have cases at the beginning and end of the day spread out across more days in a week. ML-predicted DOS has been trialed previously in operating room planning by one group that found a reduction in wait time between cases [<xref ref-type="bibr" rid="ref41">41</xref>]. However, they generated the predicted DOS and evaluated the implications of that information over a single day, not considering other cases from the waitlist or optimizing the schedule based on the predicted DOS.</p><p>In addition to improving operating room utilization at the systems level, the present study has implications for surgeon-level daily planning. Accurate patient-specific DOS prediction and scheduling allow for more effective personal scheduling, including preoperative preparation, intraoperative workflow, and postoperative responsibilities. Accurate DOS predictions can assist surgeons in anticipating the need for ancillary support (eg, anesthesia, nursing, imaging) and have the potential to help decrease fatigue associated with unplanned overruns. When integrated into scheduling systems that allocate block time based on surgeon-specific waitlists (as in the MSSP formulation), this can enhance both surgeon efficiency and case throughput, aligning institutional resource allocation with the surgeon&#x2019;s realistic operative capacity.</p><p>The generated models and optimization formulations have the ability to transform how elective operating room scheduling is performed. By developing models specific to each operation, this increases the accuracy of each model. Most previous research evaluating the effect of ML for DOS prediction has grouped multiple different procedures [<xref ref-type="bibr" rid="ref21">21</xref>,<xref ref-type="bibr" rid="ref37">37</xref>]. Using such models, the procedure performed would generally be the most important feature, diluting the effect of other important patient factors without using appropriate ML techniques. The potential for cost savings for hospitals, related to reduction in overtime costs and valuable underused operating room time, is high, but the main limitation lies in the accuracy of the DOS prediction. The predictive models for TKA and THA included 33 individual patient features. Improving the model with the use of operational factors from a specific institution would likely have a corresponding effect on the schedule results but would reduce the generalizability of the approach. Further improvements may also be made by directly integrating the downstream scheduling optimization problem into training the predictive ML model [<xref ref-type="bibr" rid="ref42">42</xref>].</p><p>This work presents some limitations. First, the DOS prediction was restricted to preoperative patient factors, based on the availability of data elements in the ACS NSQIP database, limiting the prediction accuracy. This was evidenced by the large difference in schedule performance between the 2-stage method and the perfect, hindsight, schedule. Nevertheless, this approach to predicting DOS still yielded improved schedules as compared to using a surgery-specific mean time estimate. Second, the goal of our optimization problem was to maximize the utilization of the operating room; however, this may not be directly in line with the goals of all hospitals, as some institutions may have other priorities, such as maximizing the number of cases completed. This project only developed predictive models for primary TKA and THA procedures, which may have artificially lowered the potential effect size of using this approach, as these are relatively routine procedures with lower DOS variability. By generating more surgery-specific predictive models within orthopedic surgery or other specialties, the potential for this approach may be even larger. However, these results are more directly applicable to high-volume arthroplasty surgical centers. Additionally, this scheduling approach was a simplified proof-of-concept model that may not be applicable to more complex, real-world scheduling scenarios. For example, it did not consider downstream constraints, such as the number of recovery beds, ward beds, or available staff. This was not a concern at our local institution due to its relative efficiency as a high-volume arthroplasty center. However, this would need to be expanded upon in future work if this is to be practically implemented in less specialized centers. Finally, the Split and Any optimization problems were computationally intensive when considering a waiting list size of 2&#x2010;3 months of patients. This may be a consideration depending on institutional computational resources, which is worth noting when implementing a similar solution.</p><p>In conclusion, using ML patient-specific DOS predictions coupled with optimization was superior to elective scheduling based on a mean DOS metric over 3 different optimization problems with varying constraints and combinations of waitlist size and granularity. This generalizable approach suggests that improvements in hospital resource utilization are possible with the application of new computational methods, but the inclusion of institution-specific operational data may be considered to further improve predictions and scheduling. This has significant potential implications for health care systems struggling with pressures of rising costs and growing operative waitlists.</p></sec></body><back><ack><p>The American College of Surgeons National Surgical Quality Improvement Program (ACS NSQIP) and the hospitals participating in the ACS NSQIP are the source of the data used herein; they have not verified and are not responsible for the statistical validity of the data analysis or the conclusions derived by the authors. Computations were performed on the Mist supercomputer at the SciNet HPC Consortium. SciNet is funded by the Canada Foundation for Innovation; the Government of Ontario; Ontario Research Fund - Research Excellence; and the University of Toronto. The authors gratefully acknowledge the support for JRL through the Ontario Graduate Scholarship (Queen Elizabeth II Graduate Scholarship in Science &#x0026; Technology) and the Holland Centre Research Award.</p></ack><notes><sec><title>Data Availability</title><p>This study analyzed deidentified secondary data from the American College of Surgeons&#x2019; National Surgical Quality Improvement Program (NSQIP) accessed under existing data-use agreements. Due to third-party restrictions, the dataset cannot be publicly shared by the authors. Access to NSQIP data may be requested directly from the American College of Surgeons per their access policies.</p></sec></notes><fn-group><fn fn-type="con"><p>JRL and AA made equal contributions to the paper and as such are joint first authors; conceptualization was done by JRL (lead), AA (lead), JST (lead), BR (supporting), CW (supporting), and EBK (supporting); JRL (lead), AA (lead), JST (lead), BR (supporting), CW (supporting), and EBK (supporting) contributed to methodology; investigation was done by JRL (lead), AA (lead), and JM (supporting); formal analysis was done by JM (lead) and AA (supporting); software was arranged by JM (lead) and AA (supporting); data curation was done by JRL (lead) and JM (lead); writing &#x2013; original draft was done by JRL (lead), AA (lead), and MS (supporting); writing &#x2013; review &#x0026; editing was done by AA (lead), JRL (supporting), MS (supporting), BR (supporting), CW (supporting), and EBK (supporting); supervision was done by BR (lead), CW (lead), EBK (lead), and JST (supporting).</p></fn><fn fn-type="conflict"><p>None declared.</p></fn></fn-group><glossary><title>Abbreviations</title><def-list><def-item><term id="abb1">ACS NSQIP</term><def><p>American College of Surgeons National Surgical Quality Improvement</p></def></def-item><def-item><term id="abb2">DOS</term><def><p>duration of surgery</p></def></def-item><def-item><term id="abb3">ML</term><def><p>machine learning</p></def></def-item><def-item><term id="abb4">MSSP</term><def><p>multiple subset sum problem</p></def></def-item><def-item><term id="abb5">THA</term><def><p>total hip arthroplasty</p></def></def-item><def-item><term id="abb6">TKA</term><def><p>total knee arthroplasty</p></def></def-item></def-list></glossary><ref-list><title>References</title><ref id="ref1"><label>1</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Martinez</surname><given-names>O</given-names> </name><name name-style="western"><surname>Martinez</surname><given-names>C</given-names> </name><name name-style="western"><surname>Parra</surname><given-names>CA</given-names> </name><name name-style="western"><surname>Rugeles</surname><given-names>S</given-names> </name><name name-style="western"><surname>Suarez</surname><given-names>DR</given-names> </name></person-group><article-title>Machine learning for surgical time prediction</article-title><source>Comput Methods Programs Biomed</source><year>2021</year><month>09</month><volume>208</volume><fpage>106220</fpage><pub-id pub-id-type="doi">10.1016/j.cmpb.2021.106220</pub-id></nlm-citation></ref><ref id="ref2"><label>2</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Wang</surname><given-names>J</given-names> </name><name name-style="western"><surname>Cabrera</surname><given-names>J</given-names> </name><name name-style="western"><surname>Tsui</surname><given-names>KL</given-names> </name><name name-style="western"><surname>Guo</surname><given-names>H</given-names> </name><name name-style="western"><surname>Bakker</surname><given-names>M</given-names> </name><name name-style="western"><surname>Kostis</surname><given-names>JB</given-names> </name></person-group><article-title>Clinical and nonclinical effects on operative duration: evidence from a database on thoracic surgery</article-title><source>J Healthc Eng</source><year>2020</year><month>02</month><day>10</day><volume>2020</volume><fpage>1</fpage><lpage>8</lpage><pub-id pub-id-type="doi">10.1155/2020/3582796</pub-id></nlm-citation></ref><ref id="ref3"><label>3</label><nlm-citation citation-type="web"><article-title>Elderly population</article-title><source>OECD</source><year>2022</year><access-date>2025-09-04</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.oecd.org/en/data/indicators/elderly-population.html">https://www.oecd.org/en/data/indicators/elderly-population.html</ext-link></comment></nlm-citation></ref><ref id="ref4"><label>4</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Bartek</surname><given-names>MA</given-names> </name><name name-style="western"><surname>Saxena</surname><given-names>RC</given-names> </name><name name-style="western"><surname>Solomon</surname><given-names>S</given-names> </name><etal/></person-group><article-title>Improving operating room efficiency: machine learning approach to predict case-time duration</article-title><source>J Am Coll Surg</source><year>2019</year><month>10</month><volume>229</volume><issue>4</issue><fpage>346</fpage><lpage>354</lpage><pub-id pub-id-type="doi">10.1016/j.jamcollsurg.2019.05.029</pub-id><pub-id pub-id-type="medline">31310851</pub-id></nlm-citation></ref><ref id="ref5"><label>5</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Rothstein</surname><given-names>DH</given-names> </name><name name-style="western"><surname>Raval</surname><given-names>MV</given-names> </name></person-group><article-title>Operating room efficiency</article-title><source>Semin Pediatr Surg</source><year>2018</year><month>04</month><volume>27</volume><issue>2</issue><fpage>79</fpage><lpage>85</lpage><pub-id pub-id-type="doi">10.1053/j.sempedsurg.2018.02.004</pub-id></nlm-citation></ref><ref id="ref6"><label>6</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Harris</surname><given-names>T</given-names> </name><name name-style="western"><surname>Segovia</surname><given-names>N</given-names> </name><name name-style="western"><surname>Koltsov</surname><given-names>J</given-names> </name><name name-style="western"><surname>Gardner</surname><given-names>M</given-names> </name></person-group><article-title>Association between operative duration and adverse outcomes after hip fracture surgery: a NSQIP matched cohort study</article-title><source>Injury</source><year>2024</year><month>08</month><volume>55</volume><issue>8</issue><fpage>111635</fpage><pub-id pub-id-type="doi">10.1016/j.injury.2024.111635</pub-id></nlm-citation></ref><ref id="ref7"><label>7</label><nlm-citation citation-type="other"><person-group person-group-type="author"><name name-style="western"><surname>Wang</surname><given-names>J</given-names> </name><name name-style="western"><surname>Cabrera</surname><given-names>J</given-names> </name><name name-style="western"><surname>Tsui</surname><given-names>KL</given-names> </name><name name-style="western"><surname>Guo</surname><given-names>H</given-names> </name><name name-style="western"><surname>Bakker</surname><given-names>M</given-names> </name><name name-style="western"><surname>Kostis</surname><given-names>JB</given-names> </name></person-group><article-title>Predicting surgery duration from a new perspective: evaluation from a database on thoracic surgery</article-title><source>arXiv</source><comment>Preprint posted online on  Dec 17, 2017</comment><pub-id pub-id-type="doi">10.48550/arXiv.1712.07809</pub-id></nlm-citation></ref><ref id="ref8"><label>8</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Rozell</surname><given-names>JC</given-names> </name><name name-style="western"><surname>Ast</surname><given-names>MP</given-names> </name><name name-style="western"><surname>Jiranek</surname><given-names>WA</given-names> </name><name name-style="western"><surname>Kim</surname><given-names>RH</given-names> </name><name name-style="western"><surname>Della Valle</surname><given-names>CJ</given-names> </name></person-group><article-title>Outpatient total joint arthroplasty: the new reality</article-title><source>J Arthroplasty</source><year>2021</year><month>07</month><volume>36</volume><issue>7</issue><fpage>S33</fpage><lpage>S39</lpage><pub-id pub-id-type="doi">10.1016/j.arth.2021.02.030</pub-id></nlm-citation></ref><ref id="ref9"><label>9</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Abbas</surname><given-names>A</given-names> </name><name name-style="western"><surname>Mosseri</surname><given-names>J</given-names> </name><name name-style="western"><surname>Lex</surname><given-names>JR</given-names> </name><etal/></person-group><article-title>Machine learning using preoperative patient factors can predict duration of surgery and length of stay for total knee arthroplasty</article-title><source>Int J Med Inform</source><year>2022</year><month>02</month><volume>158</volume><fpage>104670</fpage><pub-id pub-id-type="doi">10.1016/j.ijmedinf.2021.104670</pub-id></nlm-citation></ref><ref id="ref10"><label>10</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>Ponce</surname><given-names>M</given-names> </name><name name-style="western"><surname>van Zon</surname><given-names>R</given-names> </name><name name-style="western"><surname>Northrup</surname><given-names>S</given-names> </name><etal/></person-group><article-title>Deploying a top-100 supercomputer for large parallel workloads</article-title><conf-name>PEARC &#x2019;19</conf-name><conf-date>Jul 28 to Aug 1, 2019</conf-date><conf-loc>Chicago, IL, USA</conf-loc><pub-id pub-id-type="doi">10.1145/3332186.3332195</pub-id></nlm-citation></ref><ref id="ref11"><label>11</label><nlm-citation citation-type="report"><article-title>ACS NSQIP participant use data file</article-title><year>2023</year><access-date>2023-07-01</access-date><publisher-name>ACS NSQIP</publisher-name><comment><ext-link ext-link-type="uri" xlink:href="https://www.facs.org/quality-programs/data-and-registries/acs-nsqip/participant-use-data-file/">https://www.facs.org/quality-programs/data-and-registries/acs-nsqip/participant-use-data-file/</ext-link></comment></nlm-citation></ref><ref id="ref12"><label>12</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Pandit</surname><given-names>JJ</given-names> </name></person-group><article-title>Rational planning of operating lists: a prospective comparison of &#x201C;booking to the mean&#x201D; vs. &#x201C;probabilistic case scheduling&#x201D; in urology</article-title><source>Anaesthesia</source><year>2020</year><month>05</month><volume>75</volume><issue>5</issue><fpage>642</fpage><lpage>647</lpage><pub-id pub-id-type="doi">10.1111/anae.14958</pub-id><pub-id pub-id-type="medline">31867710</pub-id></nlm-citation></ref><ref id="ref13"><label>13</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Yuniartha</surname><given-names>DR</given-names> </name><name name-style="western"><surname>Masruroh</surname><given-names>NA</given-names> </name><name name-style="western"><surname>Herliansyah</surname><given-names>MK</given-names> </name></person-group><article-title>An evaluation of a simple model for predicting surgery duration using a set of surgical procedure parameters</article-title><source>Inform Med Unlocked</source><year>2021</year><volume>25</volume><fpage>100633</fpage><pub-id pub-id-type="doi">10.1016/j.imu.2021.100633</pub-id></nlm-citation></ref><ref id="ref14"><label>14</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Marcon</surname><given-names>E</given-names> </name><name name-style="western"><surname>Kharraja</surname><given-names>S</given-names> </name><name name-style="western"><surname>Simonnet</surname><given-names>G</given-names> </name></person-group><article-title>The operating theatre planning by the follow-up of the risk of no realization</article-title><source>Int J Prod Econ</source><year>2003</year><month>07</month><volume>85</volume><issue>1</issue><fpage>83</fpage><lpage>90</lpage><pub-id pub-id-type="doi">10.1016/S0925-5273(03)00088-4</pub-id></nlm-citation></ref><ref id="ref15"><label>15</label><nlm-citation citation-type="book"><person-group person-group-type="author"><name name-style="western"><surname>Huang</surname><given-names>CC</given-names> </name><name name-style="western"><surname>Lai</surname><given-names>J</given-names> </name><name name-style="western"><surname>Cho</surname><given-names>DY</given-names> </name><name name-style="western"><surname>Yu</surname><given-names>J</given-names> </name></person-group><article-title>A machine learning study to improve surgical case duration prediction</article-title><source>Health Systems and Quality Improvement</source><year>2020</year><publisher-name>Cold Spring Harbor Laboratory Press</publisher-name><pub-id pub-id-type="doi">10.1101/2020.06.10.20127910</pub-id></nlm-citation></ref><ref id="ref16"><label>16</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Hassanzadeh</surname><given-names>H</given-names> </name><name name-style="western"><surname>Boyle</surname><given-names>J</given-names> </name><name name-style="western"><surname>Khanna</surname><given-names>S</given-names> </name><name name-style="western"><surname>Biki</surname><given-names>B</given-names> </name><name name-style="western"><surname>Syed</surname><given-names>F</given-names> </name></person-group><article-title>Daily surgery caseload prediction: towards improving operating theatre efficiency</article-title><source>BMC Med Inform Decis Mak</source><year>2022</year><month>06</month><day>7</day><volume>22</volume><issue>1</issue><fpage>151</fpage><pub-id pub-id-type="doi">10.1186/s12911-022-01893-8</pub-id><pub-id pub-id-type="medline">35672729</pub-id></nlm-citation></ref><ref id="ref17"><label>17</label><nlm-citation citation-type="book"><person-group person-group-type="author"><name name-style="western"><surname>Erdogan</surname><given-names>SA</given-names> </name><name name-style="western"><surname>Denton</surname><given-names>BT</given-names> </name></person-group><source>Surgery Planning and Scheduling</source><year>2011</year><publisher-name>John Wiley &#x0026; Sons, Ltd</publisher-name><pub-id pub-id-type="doi">10.1002/9780470400531.eorms0861</pub-id><pub-id pub-id-type="other">9780470400531</pub-id></nlm-citation></ref><ref id="ref18"><label>18</label><nlm-citation citation-type="other"><person-group person-group-type="author"><name name-style="western"><surname>Akiba</surname><given-names>T</given-names> </name><name name-style="western"><surname>Sano</surname><given-names>S</given-names> </name><name name-style="western"><surname>Yanase</surname><given-names>T</given-names> </name><name name-style="western"><surname>Ohta</surname><given-names>T</given-names> </name><name name-style="western"><surname>Koyama</surname><given-names>M</given-names> </name></person-group><article-title>Optuna: a next-generation hyperparameter optimization framework</article-title><source>arXiv</source><comment>Preprint posted online on  Jul 25, 2019</comment><pub-id pub-id-type="doi">10.48550/arXiv.1907.10902</pub-id></nlm-citation></ref><ref id="ref19"><label>19</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Shehadeh</surname><given-names>KS</given-names> </name><name name-style="western"><surname>Padman</surname><given-names>R</given-names> </name></person-group><article-title>A distributionally robust optimization approach for stochastic elective surgery scheduling with limited intensive care unit capacity</article-title><source>Eur J Oper Res</source><year>2021</year><month>05</month><volume>290</volume><issue>3</issue><fpage>901</fpage><lpage>913</lpage><pub-id pub-id-type="doi">10.1016/j.ejor.2020.09.001</pub-id></nlm-citation></ref><ref id="ref20"><label>20</label><nlm-citation citation-type="web"><article-title>Healthcare Cost and Utilization Project (HCUP)</article-title><source>AHRQ</source><year>2021</year><access-date>2025-09-04</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.ahrq.gov/data/hcup/index.html">https://www.ahrq.gov/data/hcup/index.html</ext-link></comment></nlm-citation></ref><ref id="ref21"><label>21</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Shi</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Mahdian</surname><given-names>S</given-names> </name><name name-style="western"><surname>Blanchet</surname><given-names>J</given-names> </name><name name-style="western"><surname>Glynn</surname><given-names>P</given-names> </name><name name-style="western"><surname>Shin</surname><given-names>AY</given-names> </name><name name-style="western"><surname>Scheinker</surname><given-names>D</given-names> </name></person-group><article-title>Surgical scheduling via optimization and machine learning with long-tailed data</article-title><source>Health Care Manag Sci</source><year>2023</year><month>12</month><volume>26</volume><issue>4</issue><fpage>692</fpage><lpage>718</lpage><pub-id pub-id-type="doi">10.1007/s10729-023-09649-0</pub-id></nlm-citation></ref><ref id="ref22"><label>22</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Marques</surname><given-names>I</given-names> </name><name name-style="western"><surname>Captivo</surname><given-names>ME</given-names> </name><name name-style="western"><surname>Barros</surname><given-names>N</given-names> </name></person-group><article-title>Optimizing the master surgery schedule in a private hospital</article-title><source>Oper Res Health Care</source><year>2019</year><month>03</month><volume>20</volume><fpage>11</fpage><lpage>24</lpage><pub-id pub-id-type="doi">10.1016/j.orhc.2018.11.002</pub-id></nlm-citation></ref><ref id="ref23"><label>23</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Hans</surname><given-names>E</given-names> </name><name name-style="western"><surname>Wullink</surname><given-names>G</given-names> </name><name name-style="western"><surname>van Houdenhoven</surname><given-names>M</given-names> </name><name name-style="western"><surname>Kazemier</surname><given-names>G</given-names> </name></person-group><article-title>Robust surgery loading</article-title><source>Eur J Oper Res</source><year>2008</year><month>03</month><volume>185</volume><issue>3</issue><fpage>1038</fpage><lpage>1050</lpage><pub-id pub-id-type="doi">10.1016/j.ejor.2006.08.022</pub-id></nlm-citation></ref><ref id="ref24"><label>24</label><nlm-citation citation-type="other"><person-group person-group-type="author"><name name-style="western"><surname>Abbas</surname><given-names>A</given-names> </name><name name-style="western"><surname>Lex</surname><given-names>JR</given-names> </name><name name-style="western"><surname>Toor</surname><given-names>J</given-names> </name><name name-style="western"><surname>Khalil</surname><given-names>EB</given-names> </name><name name-style="western"><surname>Ravi</surname><given-names>B</given-names> </name><name name-style="western"><surname>Whyne</surname><given-names>C</given-names> </name></person-group><article-title>Neural networks accurately predict precise metrics of hospital resource utilization for total hip arthroplasty: a retrospective database study</article-title><comment>Preprint posted online on 2025</comment><pub-id pub-id-type="doi">10.1101/2025.02.11.25322104</pub-id></nlm-citation></ref><ref id="ref25"><label>25</label><nlm-citation citation-type="web"><source>BMUS: The Burden of Musculoskeletal Diseases in the United States</source><year>2011</year><access-date>2025-09-04</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.bmus-ors.org/">https://www.bmus-ors.org/</ext-link></comment></nlm-citation></ref><ref id="ref26"><label>26</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Eijkemans</surname><given-names>MJC</given-names> </name><name name-style="western"><surname>van Houdenhoven</surname><given-names>M</given-names> </name><name name-style="western"><surname>Nguyen</surname><given-names>T</given-names> </name><name name-style="western"><surname>Boersma</surname><given-names>E</given-names> </name><name name-style="western"><surname>Steyerberg</surname><given-names>EW</given-names> </name><name name-style="western"><surname>Kazemier</surname><given-names>G</given-names> </name></person-group><article-title>Predicting the unpredictable: a new prediction model for operating room times using individual characteristics and the surgeon&#x2019;s estimate</article-title><source>Anesthesiology</source><year>2010</year><month>01</month><volume>112</volume><issue>1</issue><fpage>41</fpage><lpage>49</lpage><pub-id pub-id-type="doi">10.1097/ALN.0b013e3181c294c2</pub-id><pub-id pub-id-type="medline">19952726</pub-id></nlm-citation></ref><ref id="ref27"><label>27</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Str&#x00F6;mblad</surname><given-names>CT</given-names> </name><name name-style="western"><surname>Baxter-King</surname><given-names>RG</given-names> </name><name name-style="western"><surname>Meisami</surname><given-names>A</given-names> </name><etal/></person-group><article-title>Effect of a predictive model on planned surgical duration accuracy, patient wait time, and use of presurgical resources: a randomized clinical trial</article-title><source>JAMA Surg</source><year>2021</year><month>04</month><day>1</day><volume>156</volume><issue>4</issue><fpage>315</fpage><lpage>321</lpage><pub-id pub-id-type="doi">10.1001/jamasurg.2020.6361</pub-id><pub-id pub-id-type="medline">33502448</pub-id></nlm-citation></ref><ref id="ref28"><label>28</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Garbarino</surname><given-names>LJ</given-names> </name><name name-style="western"><surname>Gold</surname><given-names>PA</given-names> </name><name name-style="western"><surname>Sodhi</surname><given-names>N</given-names> </name><etal/></person-group><article-title>The effect of operative time on in-hospital length of stay in revision total knee arthroplasty</article-title><source>Ann Transl Med</source><year>2019</year><month>02</month><volume>7</volume><issue>4</issue><fpage>66</fpage><lpage>66</lpage><pub-id pub-id-type="doi">10.21037/atm.2019.01.54</pub-id></nlm-citation></ref><ref id="ref29"><label>29</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Mu&#x00F1;oz</surname><given-names>E</given-names> </name><name name-style="western"><surname>Mu&#x00F1;oz</surname><given-names>W</given-names> </name><name name-style="western"><surname>Wise</surname><given-names>L</given-names> </name></person-group><article-title>National and surgical health care expenditures, 2005-2025</article-title><source>Ann Surg</source><year>2010</year><month>02</month><volume>251</volume><issue>2</issue><fpage>195</fpage><lpage>200</lpage><pub-id pub-id-type="doi">10.1097/SLA.0b013e3181cbcc9a</pub-id><pub-id pub-id-type="medline">20054269</pub-id></nlm-citation></ref><ref id="ref30"><label>30</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Attarian</surname><given-names>DE</given-names> </name><name name-style="western"><surname>Wahl</surname><given-names>JE</given-names> </name><name name-style="western"><surname>Wellman</surname><given-names>SS</given-names> </name><name name-style="western"><surname>Bolognesi</surname><given-names>MP</given-names> </name></person-group><article-title>Developing a high-efficiency operating room for total joint arthroplasty in an academic setting</article-title><source>Clin Orthop Relat Res</source><year>2013</year><month>06</month><volume>471</volume><issue>6</issue><fpage>1832</fpage><lpage>1836</lpage><pub-id pub-id-type="doi">10.1007/s11999-012-2718-4</pub-id><pub-id pub-id-type="medline">23208123</pub-id></nlm-citation></ref><ref id="ref31"><label>31</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Rasmussen</surname><given-names>RV</given-names> </name><name name-style="western"><surname>Trick</surname><given-names>MA</given-names> </name></person-group><article-title>The timetable constrained distance minimization problem</article-title><source>Ann Oper Res</source><year>2009</year><month>10</month><volume>171</volume><issue>1</issue><fpage>45</fpage><lpage>59</lpage><pub-id pub-id-type="doi">10.1007/s10479-008-0384-4</pub-id></nlm-citation></ref><ref id="ref32"><label>32</label><nlm-citation citation-type="book"><person-group person-group-type="author"><name name-style="western"><surname>Lai</surname><given-names>J</given-names> </name><name name-style="western"><surname>Huang</surname><given-names>CC</given-names> </name><name name-style="western"><surname>Liu</surname><given-names>SC</given-names> </name><name name-style="western"><surname>Huang</surname><given-names>JY</given-names> </name><name name-style="western"><surname>Cho</surname><given-names>DY</given-names> </name><name name-style="western"><surname>Yu</surname><given-names>J</given-names> </name></person-group><source>Improving and Interpreting Surgical Case Duration Prediction With Machine Learning Methodology</source><year>2020</year><publisher-name>Cold Spring Harbor Laboratory Press</publisher-name><pub-id pub-id-type="doi">10.1101/2020.06.10.20127910</pub-id></nlm-citation></ref><ref id="ref33"><label>33</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Viberg</surname><given-names>N</given-names> </name><name name-style="western"><surname>Forsberg</surname><given-names>BC</given-names> </name><name name-style="western"><surname>Borowitz</surname><given-names>M</given-names> </name><name name-style="western"><surname>Molin</surname><given-names>R</given-names> </name></person-group><article-title>International comparisons of waiting times in health care &#x2013; limitations and prospects</article-title><source>Health Policy</source><year>2013</year><month>09</month><volume>112</volume><issue>1-2</issue><fpage>53</fpage><lpage>61</lpage><pub-id pub-id-type="doi">10.1016/j.healthpol.2013.06.013</pub-id></nlm-citation></ref><ref id="ref34"><label>34</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Dexter</surname><given-names>F</given-names> </name><name name-style="western"><surname>Ledolter</surname><given-names>J</given-names> </name></person-group><article-title>Bayesian prediction bounds and comparisons of operating room times even for procedures with few or no historic data</article-title><source>Anesthesiology</source><year>2005</year><volume>103</volume><issue>6</issue><fpage>1259</fpage><lpage>1167</lpage><pub-id pub-id-type="doi">10.1097/00000542-200512000-00023</pub-id></nlm-citation></ref><ref id="ref35"><label>35</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Pandit</surname><given-names>JJ</given-names> </name><name name-style="western"><surname>Tavare</surname><given-names>A</given-names> </name></person-group><article-title>Using mean duration and variation of procedure times to plan a list of surgical operations to fit into the scheduled list time</article-title><source>Eur J Anaesthesiol</source><year>2011</year><month>07</month><volume>28</volume><issue>7</issue><fpage>493</fpage><lpage>501</lpage><pub-id pub-id-type="doi">10.1097/EJA.0b013e3283446b9c</pub-id><pub-id pub-id-type="medline">21623186</pub-id></nlm-citation></ref><ref id="ref36"><label>36</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Laskin</surname><given-names>DM</given-names> </name><name name-style="western"><surname>Abubaker</surname><given-names>AO</given-names> </name><name name-style="western"><surname>Strauss</surname><given-names>RA</given-names> </name></person-group><article-title>Accuracy of predicting the duration of a surgical operation</article-title><source>J Oral Maxillofac Surg</source><year>2013</year><month>02</month><volume>71</volume><issue>2</issue><fpage>446</fpage><lpage>447</lpage><pub-id pub-id-type="doi">10.1016/j.joms.2012.10.009</pub-id></nlm-citation></ref><ref id="ref37"><label>37</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Scott</surname><given-names>CEH</given-names> </name><name name-style="western"><surname>MacDonald</surname><given-names>DJ</given-names> </name><name name-style="western"><surname>Howie</surname><given-names>CR</given-names> </name></person-group><article-title>&#x201C;Worse than death&#x201D; and waiting for a joint arthroplasty</article-title><source>Bone Joint J</source><year>2019</year><month>08</month><volume>101-B</volume><issue>8</issue><fpage>941</fpage><lpage>950</lpage><pub-id pub-id-type="doi">10.1302/0301-620X.101B8.BJJ-2019-0116.R1</pub-id><pub-id pub-id-type="medline">31362549</pub-id></nlm-citation></ref><ref id="ref38"><label>38</label><nlm-citation citation-type="other"><person-group person-group-type="author"><name name-style="western"><surname>Elmachtoub</surname><given-names>AN</given-names> </name><name name-style="western"><surname>Grigas</surname><given-names>P</given-names> </name></person-group><article-title>Smart predict, then optimize</article-title><source>arXiv</source><comment>Preprint posted online on  Oct 22, 2017</comment><pub-id pub-id-type="doi">10.48550/arXiv.1710.08005</pub-id></nlm-citation></ref><ref id="ref39"><label>39</label><nlm-citation citation-type="other"><person-group person-group-type="author"><name name-style="western"><surname>Liaw</surname><given-names>R</given-names> </name><name name-style="western"><surname>Liang</surname><given-names>E</given-names> </name><name name-style="western"><surname>Nishihara</surname><given-names>R</given-names> </name><name name-style="western"><surname>Moritz</surname><given-names>P</given-names> </name><name name-style="western"><surname>Gonzalez</surname><given-names>JE</given-names> </name><name name-style="western"><surname>Stoica</surname><given-names>I</given-names> </name></person-group><article-title>Tune: a research platform for distributed model selection and training</article-title><source>arXiv</source><comment>Preprint posted online on  Jul 13, 2018</comment><pub-id pub-id-type="doi">10.48550/arXiv.1807.05118</pub-id></nlm-citation></ref><ref id="ref40"><label>40</label><nlm-citation citation-type="journal"><article-title>Obesity: another ongoing pandemic</article-title><source>Lancet Gastroenterol Hepatol</source><year>2021</year><month>06</month><volume>6</volume><issue>6</issue><fpage>411</fpage><pub-id pub-id-type="doi">10.1016/S2468-1253(21)00143-6</pub-id></nlm-citation></ref><ref id="ref41"><label>41</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Marques</surname><given-names>I</given-names> </name><name name-style="western"><surname>Captivo</surname><given-names>ME</given-names> </name><name name-style="western"><surname>Vaz Pato</surname><given-names>M</given-names> </name></person-group><article-title>An integer programming approach to elective surgery scheduling</article-title><source>OR Spectr</source><year>2012</year><month>04</month><volume>34</volume><issue>2</issue><fpage>407</fpage><lpage>427</lpage><pub-id pub-id-type="doi">10.1007/s00291-011-0279-7</pub-id></nlm-citation></ref><ref id="ref42"><label>42</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Ahmed</surname><given-names>A</given-names> </name><name name-style="western"><surname>He</surname><given-names>L</given-names> </name><name name-style="western"><surname>Chou</surname><given-names>C an</given-names> </name><name name-style="western"><surname>Hamasha</surname><given-names>MM</given-names> </name></person-group><article-title>A prediction-optimization approach to surgery prioritization in operating room scheduling</article-title><source>J Ind Product Eng</source><year>2022</year><month>07</month><day>4</day><volume>39</volume><issue>5</issue><fpage>399</fpage><lpage>413</lpage><pub-id pub-id-type="doi">10.1080/21681015.2021.2017362</pub-id></nlm-citation></ref></ref-list><app-group><supplementary-material id="app1"><label>Multimedia Appendix 1</label><p>Optimization formulations.</p><media xlink:href="medinform_v13i1e70857_app1.docx" xlink:title="DOCX File, 5640 KB"/></supplementary-material><supplementary-material id="app2"><label>Multimedia Appendix 2</label><p>Select preoperative continuous, categorical, and ordinal feature distributions of total knee and hip arthroplasty patients.</p><media xlink:href="medinform_v13i1e70857_app2.docx" xlink:title="DOCX File, 5407 KB"/></supplementary-material><supplementary-material id="app3"><label>Multimedia Appendix 3</label><p>Results of the training, validation, and testing set for the duration of surgery (DOS) predictions for total knee and hip arthroplasty (TKA and THA) models, respectively. Accuracies are presented in percentages.</p><media xlink:href="medinform_v13i1e70857_app3.docx" xlink:title="DOCX File, 5404 KB"/></supplementary-material><supplementary-material id="app4"><label>Multimedia Appendix 4</label><p>Comparing 2-stage, mean, and hindsight duration of surgery using the &#x201C;Any&#x201D; schedule optimization formulation.</p><media xlink:href="medinform_v13i1e70857_app4.docx" xlink:title="DOCX File, 5407 KB"/></supplementary-material><supplementary-material id="app5"><label>Multimedia Appendix 5</label><p>Comparing 2-stage, mean, and hindsight duration of surgery using the &#x201C;Split&#x201D; schedule optimization formulation.</p><media xlink:href="medinform_v13i1e70857_app5.docx" xlink:title="DOCX File, 5407 KB"/></supplementary-material></app-group></back></article>