<?xml version="1.0" encoding="UTF-8"?><!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "journalpublishing.dtd"><article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" dtd-version="2.0" xml:lang="en" article-type="research-article"><front><journal-meta><journal-id journal-id-type="nlm-ta">JMIR Med Inform</journal-id><journal-id journal-id-type="publisher-id">medinform</journal-id><journal-id journal-id-type="index">7</journal-id><journal-title>JMIR Medical Informatics</journal-title><abbrev-journal-title>JMIR Med Inform</abbrev-journal-title><issn pub-type="epub">2291-9694</issn><publisher><publisher-name>JMIR Publications</publisher-name><publisher-loc>Toronto, Canada</publisher-loc></publisher></journal-meta><article-meta><article-id pub-id-type="publisher-id">v14i1e80574</article-id><article-id pub-id-type="doi">10.2196/80574</article-id><article-categories><subj-group subj-group-type="heading"><subject>Original Paper</subject></subj-group></article-categories><title-group><article-title>Predicting 5-Year Mortality in Non&#x2013;Small-Cell Lung Cancer Using the Korean Central Cancer Registry: Model Development and Validation Study</article-title></title-group><contrib-group><contrib contrib-type="author"><name name-style="western"><surname>Lee</surname><given-names>Jong Hyuk</given-names></name><degrees>MD</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Kim</surname><given-names>Ho Cheol</given-names></name><degrees>MD, PhD</degrees><xref ref-type="aff" rid="aff2">2</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Jung</surname><given-names>Kyu-Won</given-names></name><degrees>MS</degrees><xref ref-type="aff" rid="aff3">3</xref></contrib><contrib contrib-type="author" corresp="yes"><name name-style="western"><surname>Choi</surname><given-names>Chang Min</given-names></name><degrees>MD, PhD</degrees><xref ref-type="aff" rid="aff1">1</xref><xref ref-type="aff" rid="aff2">2</xref></contrib></contrib-group><aff id="aff1"><institution>Department of Oncology, College of Medicine, Asan Medical Center, University of Ulsan</institution><addr-line>Seoul</addr-line><country>Republic of Korea</country></aff><aff id="aff2"><institution>Department of Pulmonary and Critical Care Medicine, College of Medicine, Asan Medical Center, University of Ulsan</institution><addr-line>88, Olympic-ro 43-gil, Songpa-gu</addr-line><addr-line>Seoul</addr-line><country>Republic of Korea</country></aff><aff id="aff3"><institution>Division of Cancer Registration and Surveillance, National Cancer Control Institute, National Cancer Center</institution><addr-line>Goyang</addr-line><country>Republic of Korea</country></aff><contrib-group><contrib contrib-type="editor"><name name-style="western"><surname>Coristine</surname><given-names>Andrew</given-names></name></contrib><contrib contrib-type="editor"><name name-style="western"><surname>Benis</surname><given-names>Arriel</given-names></name></contrib></contrib-group><contrib-group><contrib contrib-type="reviewer"><name name-style="western"><surname>Xu</surname><given-names>Hao</given-names></name></contrib><contrib contrib-type="reviewer"><name name-style="western"><surname>Guo</surname><given-names>Jinyu</given-names></name></contrib><contrib contrib-type="reviewer"><name name-style="western"><surname>Su</surname><given-names>Po-Lan</given-names></name></contrib></contrib-group><author-notes><corresp>Correspondence to Chang Min Choi, MD, PhD, Department of Pulmonary and Critical Care Medicine, College of Medicine, Asan Medical Center, University of Ulsan, 88, Olympic-ro 43-gil, Songpa-gu, Seoul, 05505, Republic of Korea, +82-10-9792-9607; <email>ccm@amc.seoul.kr</email></corresp></author-notes><pub-date pub-type="collection"><year>2026</year></pub-date><pub-date pub-type="epub"><day>8</day><month>6</month><year>2026</year></pub-date><volume>14</volume><elocation-id>e80574</elocation-id><history><date date-type="received"><day>13</day><month>07</month><year>2025</year></date><date date-type="rev-recd"><day>03</day><month>03</month><year>2026</year></date><date date-type="accepted"><day>06</day><month>03</month><year>2026</year></date></history><copyright-statement>&#x00A9; Jong Hyuk Lee, Ho Cheol Kim, Kyu-Won Jung, Chang Min Choi. Originally published in JMIR Medical Informatics (<ext-link ext-link-type="uri" xlink:href="https://medinform.jmir.org">https://medinform.jmir.org</ext-link>), 8.6.2026. </copyright-statement><copyright-year>2026</copyright-year><license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (<ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">https://creativecommons.org/licenses/by/4.0/</ext-link>), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Medical Informatics, is properly cited. The complete bibliographic information, a link to the original publication on <ext-link ext-link-type="uri" xlink:href="https://medinform.jmir.org/">https://medinform.jmir.org/</ext-link>, as well as this copyright and license information must be included.</p></license><self-uri xlink:type="simple" xlink:href="https://medinform.jmir.org/2026/1/e80574"/><abstract><sec><title>Background</title><p>Non&#x2013;small-cell lung cancer (NSCLC) is one of the most common cancers and a leading cause of cancer-related mortality, making prognostic prediction clinically essential. Machine learning models are increasingly used to assess prognosis; however, developing systems that combine high discrimination with clear, clinically interpretable reasoning remains challenging.</p></sec><sec><title>Objective</title><p>This study aimed to develop deep learning models that predict 5-year mortality in NSCLC using data from the Korea Central Cancer Registry and quantify feature importance through permutation testing.</p></sec><sec sec-type="methods"><title>Methods</title><p>We identified 3144 patients diagnosed between 2014 and 2017 who had complete clinical data, pulmonary function test results, histological information, genomic data, and staging details. After preprocessing, the cohort was divided into stratified training, validation, and test sets in a 70%-15%-15% ratio. Five models were tuned using Hyperband across 10 predefined feature groups. The primary evaluation metric was the area under the receiver operating characteristic curve (AUC); additional metrics included accuracy, <italic>F</italic><sub>1</sub>-score, precision, and recall. Groupwise permutation importance was calculated for each model, and the concordance of importance rankings was assessed using the Friedman test.</p></sec><sec sec-type="results"><title>Results</title><p>All 5 models yielded comparable discrimination values on the test set (AUC=0.875&#x2010;0.879). Model A was selected as the primary model and achieved an AUC of 0.879, an accuracy of 0.806, an <italic>F</italic><sub>1</sub>-score of 0.824, and a Brier score of 0.142. Permuting the stage resulted in the largest decrease in AUC (0.217), followed by the pulmonary function test (0.016). Gene mutation had a modest overall impact but became more influential within the adenocarcinoma subset. The Friedman test showed no statistically significant differences in importance rankings across the models (<italic>P</italic>=.93).</p></sec><sec sec-type="conclusions"><title>Conclusions</title><p>A grouped-input deep learning framework achieved discrimination comparable to a conventional Cox proportional hazards model using the same routine clinical variables for 5-year mortality prediction in NSCLC. Group-level permutation importance provided stable and reproducible insights into the clinical factors influencing risk, which may guide future model refinement and clinical decision-making.</p></sec></abstract><kwd-group><kwd>non&#x2013;small-cell lung cancer</kwd><kwd>deep learning</kwd><kwd>machine learning</kwd><kwd>prognosis</kwd><kwd>Korean Central Cancer Registry</kwd><kwd>KCCR</kwd><kwd>permutation tests</kwd></kwd-group></article-meta></front><body><sec id="s1" sec-type="intro"><title>Introduction</title><p>Non&#x2013;small-cell lung cancer (NSCLC) is one of the most prevalent cancers worldwide and, despite advancements in prognosis, remains a leading cause of cancer-related mortality [<xref ref-type="bibr" rid="ref1">1</xref>-<xref ref-type="bibr" rid="ref3">3</xref>]. The prognosis of NSCLC is influenced by various factors, including the stage at diagnosis and molecular biomarkers such as alterations in the epidermal growth factor receptor (EGFR) and anaplastic lymphoma kinase (ALK). Therefore, predicting an individual patient&#x2019;s clinical course is crucial for tailoring treatment strategies [<xref ref-type="bibr" rid="ref2">2</xref>,<xref ref-type="bibr" rid="ref4">4</xref>,<xref ref-type="bibr" rid="ref5">5</xref>].</p><p>Machine learning has gained significant traction in oncology due to its ability to capture complex, nonlinear relationships and integrate heterogeneous data modalities [<xref ref-type="bibr" rid="ref6">6</xref>,<xref ref-type="bibr" rid="ref7">7</xref>]. Among the various approaches, deep learning stands out for its strong predictive performance and capacity to automatically learn features [<xref ref-type="bibr" rid="ref8">8</xref>]. However, its limited interpretability and reliance on large, well-curated datasets hinder broad adoption in medical research [<xref ref-type="bibr" rid="ref9">9</xref>,<xref ref-type="bibr" rid="ref10">10</xref>]. Despite these challenges, many researchers continue to explore deep learning solutions, and growing evidence indicates that this approach enhances decision-making and supports tasks ranging from screening and diagnosis to prognostic prediction in lung cancer and other malignancies [<xref ref-type="bibr" rid="ref11">11</xref>-<xref ref-type="bibr" rid="ref14">14</xref>]. Nevertheless, many previous studies have relied on small, single-institution cohorts, increasing the risk of overfitting, and often inadequately reported data preprocessing or hyperparameter tuning procedures, thereby limiting reproducibility [<xref ref-type="bibr" rid="ref5">5</xref>,<xref ref-type="bibr" rid="ref11">11</xref>]. Assembling a sufficiently large, well-curated dataset and developing a clinically practical model remain significant challenges for clinicians.</p><p>The Korea Central Cancer Registry (KCCR) is a national population-based registry that systematically collects data on all patients with cancer diagnosed in South Korea. For lung cancer, the KCCR enhanced the staging survey, which samples 10% of all incident lung cancer cases each year. This survey includes demographic variables and clinical details such as symptoms; tumor, node, metastasis (TNM) stage; histologic subtype; and biomarker profiles [<xref ref-type="bibr" rid="ref15">15</xref>]. By aggregating deidentified records from over 50 medical centers, the KCCR offers a large, multicenter cohort suitable for robust deep learning analyses. This dataset is particularly suitable for deep learning analyses because it captures complex interactions among heterogeneous clinical variables.</p><p>Accordingly, we developed and validated a deep learning model for 5-year mortality prediction in NSCLC using nationwide registry data from the KCCR and routinely collected clinical features. We implemented a grouped-input architecture that mirrors clinically coherent feature domains and incorporated permutation-based, group-level importance to provide a transparent and reproducible assessment of feature contributions across model configurations [<xref ref-type="bibr" rid="ref16">16</xref>]. Collectively, this design targets clinically applicable use with limited routine variables while maintaining interpretability and clear reporting of preprocessing and hyperparameter tuning.</p></sec><sec id="s2" sec-type="methods"><title>Methods</title><sec id="s2-1"><title>Data Selection, Preprocessing, and Stratified Splitting</title><p>We obtained data from the KCCR nationwide lung cancer staging survey, which includes patients with NSCLC from 52 hospitals across South Korea. Records from patients diagnosed between 2014 and 2017 were used, excluding those with missing or uncertain information regarding TNM stage, gene mutations (EGFR or ALK), or diagnosis date. Patients with logically inconsistent smoking cessation dates (eg, a missing cessation date despite being recorded as a former smoker, a cessation date earlier than the smoking start date, or a cessation date later than the date of death) were also excluded. An Eastern Cooperative Oncology Group (ECOG) performance status recorded as &#x201C;unknown&#x201D; was recoded as 0. For records with &#x201C;unknown&#x201D; smoking history, the smoking amount and duration fields were also missing; therefore, these cases were recoded as never smokers. We used a complete-case approach for the core variables to avoid unverifiable imputation assumptions and ensure consistency across clinical feature domains. Because this approach may introduce selection bias, we compared baseline characteristics between included and excluded patients using absolute standardized mean differences (SMDs).</p><p>A comprehensive set of demographic and clinical variables was extracted from the original records, including age, sex, BMI (calculated from weight and height), smoking history, symptoms, ECOG performance status, pulmonary function test (PFT) results, clinical stage, and pathological features. For PFT variables, we included one-hot availability indicators derived from the PFT status field along with scaled continuous measurements. Unmeasured values (ie, when the test was not performed) were coded using a sentinel value to indicate nonavailability rather than physiologic zero. Smoking status was one-hot encoded, and quit duration was modeled as a continuous variable only for former smokers. We used a sentinel value for never smokers to denote &#x201C;not applicable,&#x201D; whereas quit duration was set to 0 for current smokers. To assess the potential impact of recoding missing clinical information to the healthiest baseline, we additionally trained an &#x201C;unknown-aware&#x201D; version of our primary model in which &#x201C;unknown&#x201D; ECOG performance status and smoking history were retained as distinct categories. The same data splits, model architecture, and evaluation procedures were used for direct comparison.</p><p>Five-year mortality and survival were defined as an interval of at least 60 months between diagnosis and death or last follow-up. Patients who met this threshold were classified as 5-year survivors, whereas the others were categorized as nonsurvivors. Detailed preprocessing steps are summarized in Table S1 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>.</p><p>The resulting data were stratified by sex, age, smoking history, PFT status (performed or not), gene mutation status, and 5-year mortality. Accordingly, 70% of patients were allocated to the training dataset, 15% were allocated to the validation set, and 15% were allocated to the test set. Immediately before model training, all continuous variables were scaled to the range of 0 to 1 using min-max normalization, with parameters estimated solely from the training subset. The same transformation was then applied unchanged to the validation and test subsets. Categorical variables were one-hot encoded in a similar manner: the encoder was fitted on the training set and reused for the other sets. Symptoms and histology were recorded as binary indicators (0=absent; 1=present). Instead of encoding each variable separately, we combined the symptom and histology indicators into a single composite vector and applied one-hot encoding. EGFR and ALK mutation indicators were handled similarly, being merged into 1 vector prior to one-hot encoding.</p></sec><sec id="s2-2"><title>Model Construction and Hyperparameter Tuning</title><p>A multilayer perceptron (MLP) was developed to predict 5-year mortality (<xref ref-type="fig" rid="figure1">Figure 1</xref>). The model consists of 2 primary layers preceding the output layer. Age, sex, BMI, ECOG score, and symptoms were directly input into the first main layer, whereas other features (eg, smoking status, PFT, stage, histology, and gene mutation) were grouped into dedicated sublayers. This grouped-input design mirrors clinically coherent feature domains, improving interpretability and enabling domain-level regularization (eg, group-specific widths and dropout) in the presence of correlated predictors; it also stabilizes training under sparsity and collinearity. The outputs from these sublayers were then concatenated and fed into the first primary layer. All sublayers and primary layers used rectified linear unit activation functions, whereas the output layer used a sigmoid function for binary classification. Dropout and L2 regularization techniques were applied throughout these layers to reduce the risk of overfitting.</p><p>Our model was implemented in Python (version 3.12.5; Python Software Foundation) using TensorFlow (version 2.18; Google Brain Team) and scikit-learn (version 1.6.1; Google Summer of Code project). We used the Adam optimizer and binary cross-entropy loss for training. Hyperparameters were tuned using the Keras Hyperband tuner. We selected Hyperband because it efficiently explores large search spaces by allocating more epochs to promising configurations and aggressively pruning unpromising ones (successive halving with early stopping), thereby reducing computational cost and overfitting risk. The hyperparameters were evaluated across the following ranges: sublayer units (4, 8, or 16 for most features and 8, 16, or 32 for stage), main layer units (32, 64, or 128), dropout rates (0.30&#x2010;0.50 in increments of 0.05), L2 regularization strength (&#x03BB; in 10<sup>&#x2013;6</sup> to 10<sup>&#x2013;3</sup>; log scale), and learning rate (10<sup>&#x2013;4</sup> to 10<sup>&#x2013;2</sup>; log scale).</p><fig position="float" id="figure1"><label>Figure 1.</label><caption><p>Grouped-input multilayer perceptron architecture for 5-year mortality prediction in non&#x2013;small-cell lung cancer (NSCLC). Input variables were organized into clinically defined feature domains (demographics; symptoms; smoking variables; pulmonary function test [PFT] measurements; histology; gene mutation; and tumor, node, metastasis stage), processed through domain-specific input layers, and merged into shared hidden layers to generate the final prediction. ALK: anaplastic lymphoma kinase; DLCO: diffusion capacity of the lungs for carbon monoxide; ECOG: Eastern Cooperative Oncology Group performance status; EGFR: epidermal growth factor receptor; FEV<sub>1</sub>: forced expiratory volume in 1 second; FVC: forced vital capacity; NOS: not otherwise specified.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="medinform_v14i1e80574_fig01.png"/></fig><p>Each candidate architecture was trained for up to 100 epochs, with successive Hyperband rounds retaining approximately the top one-third of models and granting them progressively larger training budgets. The optimization target was the area under the receiver operating characteristic curve (AUC), evaluated on the held-out validation cohort. During each trial, an early-stopping callback monitored the same metric and restored the best weights after 5 epochs without improvement. This approach helped prevent overfitting and reduced runtime. The batch size was fixed at 32. This configuration facilitated efficient evaluation of numerous hyperparameter combinations, allowing for the identification of a set that delivered robust performance with minimal overfitting.</p></sec><sec id="s2-3"><title>Performance Evaluation</title><p>AUC was prespecified as the primary metric given outcome imbalance and its threshold-free nature; accuracy, precision, recall, <italic>F</italic><sub>1</sub>-score, and the area under the precision-recall curve (AUPRC) were reported for completeness. Each metric was calculated for the training, validation, and test datasets. We estimated the 95% CIs through bootstrapping with 1000 resamples. Because our primary objective was to determine whether a patient survived for 5 years, AUC was regarded as the main criterion for performance evaluation and for detecting overfitting. The target for the test set was an AUC exceeding 0.800, with the difference in AUC between the training and test sets remaining below 0.05.</p><p>Cox proportional hazards (CPH) models were established as baselines for comparison using the same predictors. First, a full CPH model was fitted using the same set of predictors as the MLP models. In addition, a TNM-only CPH benchmark model was constructed using only the tumor, node, and metastasis variables to quantify the incremental predictive value of nonstaging clinical features beyond TNM staging. Predicted 5-year mortality probabilities were evaluated using the same set of discrimination and classification metrics across models, enabling direct performance comparisons between the CPH and MLP models.</p></sec><sec id="s2-4"><title>Permutation-Based Feature Importance</title><p>A permutation-based approach was used to assess the importance of each feature (<xref ref-type="fig" rid="figure2">Figure 2</xref>). First, a baseline model was trained using the original test dataset to establish a reference AUC. Then, for each individual feature or feature group, we randomly permuted its variables 100 times while keeping the other features intact and retrained the model on each permuted dataset. The resulting AUC values were compared with the baseline AUC, and the average reductions across permutations were calculated to obtain a mean reduction. A greater reduction indicates a higher contribution of that feature group to the predictive performance of the model.</p><fig position="float" id="figure2"><label>Figure 2.</label><caption><p>Schematic overview of the grouped-feature permutation importance procedure. For each clinically defined feature group, values were permuted, whereas the features in all other groups were held fixed, generating 100 permuted datasets. The trained model was evaluated on each dataset, and feature group importance was quantified as the decrease in area under the receiver operating characteristic curve (AUC) relative to the baseline (mean AUC drop across iterations).</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="medinform_v14i1e80574_fig02.png"/></fig><p>The Friedman test using R (version 4.4.0; R Foundation for Statistical Computing) was conducted on the mean AUC reductions to assess consistency across multiple model configurations. This statistical test evaluates the rank order of feature group importance among models to determine whether significant differences in feature rankings exist. A <italic>P</italic> value below .05 was considered statistically significant.</p></sec><sec id="s2-5"><title>Ethical Considerations</title><p>The institutional review board of Asan Medical Center approved this retrospective study (2025-0572; approval date: May 13, 2025). The requirement for written informed consent was waived by the institutional review board because this study involved secondary analysis of routinely collected registry data and posed minimal risk to participants. The investigators received a deidentified dataset from the KCCR and had no access to directly identifiable personal information. Data were analyzed in accordance with institutional policies on data security and confidentiality. No compensation was provided, as participants were not prospectively recruited and there was no direct contact with patients. The manuscript and supplementary materials do not include any images or information that could identify individual participants.</p></sec></sec><sec id="s3" sec-type="results"><title>Results</title><sec id="s3-1"><title>Baseline Demographics of the Patients</title><p>A total of 8664 patients diagnosed with NSCLC from 2014 to 2017 were identified in the KCCR. Of these 8664 patients, 3144 (36.3%) had complete data suitable for analysis. Stratified sampling was conducted to assign patients to the training (2215/3144, 70.5%), validation (464/3144, 14.8%), or test (465/3144, 14.8%; <xref ref-type="fig" rid="figure3">Figure 3</xref>) groups. Additionally, 50 patients who lacked matching counterparts during stratification were included in the training set.</p><fig position="float" id="figure3"><label>Figure 3.</label><caption><p>Flowchart of cohort selection and dataset splitting for a retrospective registry-based study of non&#x2013;small-cell lung cancer (NSCLC) in South Korea using the Korea Central Cancer Registry (2014&#x2010;2017). Of 8664 registered patients, 5520 (63.7%) were excluded due to missing tumor, node, metastasis (TNM) stage information; missing gene mutation data; uncertain smoking cessation year; or missing diagnosis date. The final analytic cohort included 3144 patients and was split using stratified sampling into training, validation, and test sets.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="medinform_v14i1e80574_fig03.png"/></fig><p>Patients&#x2019; baseline characteristics are summarized in <xref ref-type="table" rid="table1">Table 1</xref>. Among the total cohort, 60.7% (1908/3144) of the participants were male. The median age at diagnosis was 66 (IQR 58&#x2010;74) years. Most patients had an ECOG performance status of 0 (1902/3144, 60.5%), followed by a score of 1 (1023/3144, 32.5%). <xref ref-type="table" rid="table2">Table 2</xref> presents details of the cancer-related characteristics. Most patients (2490/3144, 79.2%) were diagnosed with adenocarcinoma. Regarding stage, 35.4% (1113/3144) of the patients were diagnosed at stage 1, whereas the largest subgroup was those diagnosed at stage 4 (1282/3144, 40.8%). EGFR mutations were detected in 36.0% (1131/3144) of the patients, whereas ALK mutations were less common, occurring in 6.6% (209/3144) of the patients. A total of 42.9% (1350/3144) of the patients survived at least 5 years after diagnosis. There were no statistically significant differences in baseline characteristics among the training, validation, and test cohorts.</p><table-wrap id="t1" position="float"><label>Table 1.</label><caption><p>Baseline demographic and clinical characteristics of the included patients (N=3144).</p></caption><table id="table1" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom"/><td align="left" valign="bottom">Overall</td><td align="left" valign="bottom">Training set (n=2215)</td><td align="left" valign="bottom">Validation set (n=464)</td><td align="left" valign="bottom">Test set (n=465)</td><td align="left" valign="bottom"><italic>P</italic> value</td></tr></thead><tbody><tr><td align="left" valign="top" colspan="5">Sex, n (%)</td><td align="left" valign="top">.89</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Male</td><td align="left" valign="top">1908 (60.7)</td><td align="left" valign="top">1340 (60.5)</td><td align="left" valign="top">281 (60.6)</td><td align="left" valign="top">287 (61.7)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Female</td><td align="left" valign="top">1236 (39.3)</td><td align="left" valign="top">875 (39.5)</td><td align="left" valign="top">183 (39.4)</td><td align="left" valign="top">178 (38.3)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top">Age (y), median (IQR)</td><td align="left" valign="top">66 (58&#x2010;74)</td><td align="left" valign="top">66 (58&#x2010;74)</td><td align="left" valign="top">66 (58&#x2010;74)</td><td align="left" valign="top">66 (58&#x2010;74)</td><td align="left" valign="top">.89</td></tr><tr><td align="left" valign="top">BMI (kg/m<sup>2</sup>), median (IQR)</td><td align="left" valign="top">23.2 (21.0&#x2010;25.4)</td><td align="left" valign="top">23.3 (21.0&#x2010;25.4)</td><td align="left" valign="top">23.0 (21.1&#x2010;25.4)</td><td align="left" valign="top">23.0 (20.8&#x2010;25.4)</td><td align="left" valign="top">.96</td></tr><tr><td align="left" valign="top" colspan="5">ECOG<sup><xref ref-type="table-fn" rid="table1fn1">a</xref></sup> performance status, n (%)</td><td align="left" valign="top">.77</td></tr><tr><td align="char" char="." valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>0</td><td align="left" valign="top">1902 (60.5)</td><td align="left" valign="top">1330 (60.0)</td><td align="left" valign="top">282 (60.8)</td><td align="left" valign="top">290 (62.4)</td><td align="left" valign="top"/></tr><tr><td align="char" char="." valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>1</td><td align="left" valign="top">1023 (32.5)</td><td align="left" valign="top">726 (32.8)</td><td align="left" valign="top">150 (32.3)</td><td align="left" valign="top">147 (31.6)</td><td align="left" valign="top"/></tr><tr><td align="char" char="." valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>2</td><td align="left" valign="top">160 (5.1)</td><td align="left" valign="top">114 (5.1)</td><td align="left" valign="top">23 (5.0)</td><td align="left" valign="top">23 (4.9)</td><td align="left" valign="top"/></tr><tr><td align="char" char="." valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>3</td><td align="left" valign="top">45 (1.4)</td><td align="left" valign="top">32 (1.4)</td><td align="left" valign="top">8 (1.7)</td><td align="left" valign="top">5 (1.1)</td><td align="left" valign="top"/></tr><tr><td align="char" char="." valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>4</td><td align="left" valign="top">14 (0.4)</td><td align="left" valign="top">13 (0.6)</td><td align="left" valign="top">1 (0.2)</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top" colspan="5">Smoking status, n (%)</td><td align="left" valign="top">&#x003E;.99</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Never smoked</td><td align="left" valign="top">1420 (45.2)</td><td align="left" valign="top">1000 (45.1)</td><td align="left" valign="top">210 (45.3)</td><td align="left" valign="top">210 (45.2)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Current smoker</td><td align="left" valign="top">927 (29.5)</td><td align="left" valign="top">654 (29.5)</td><td align="left" valign="top">136 (29.3)</td><td align="left" valign="top">137 (29.5)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Ex-smoker</td><td align="left" valign="top">797 (25.3)</td><td align="left" valign="top">561 (25.3)</td><td align="left" valign="top">118 (25.4)</td><td align="left" valign="top">118 (25.4)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top" colspan="6">PFT<sup><xref ref-type="table-fn" rid="table1fn2">b</xref></sup>, median (IQR)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>FVC<sup><xref ref-type="table-fn" rid="table1fn3">c</xref></sup> (L)</td><td align="left" valign="top">3.1 (2.6&#x2010;3.7)</td><td align="left" valign="top">3.1 (2.6&#x2010;3.7)</td><td align="left" valign="top">3.1 (2.6&#x2010;3.8)</td><td align="left" valign="top">3.1 (2.5&#x2010;3.7)</td><td align="left" valign="top">.76</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>FEV<sub>1</sub><sup><xref ref-type="table-fn" rid="table1fn4">d</xref></sup> (L)</td><td align="left" valign="top">2.3 (1.8&#x2010;2.7)</td><td align="left" valign="top">2.3 (1.8&#x2010;2.7)</td><td align="left" valign="top">2.3 (1.9&#x2010;2.8)</td><td align="left" valign="top">2.2 (1.8&#x2010;2.7)</td><td align="left" valign="top">.66</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>DLCO<sup><xref ref-type="table-fn" rid="table1fn5">e</xref></sup> (%)</td><td align="left" valign="top">85.0 (71.0&#x2010;99.0)</td><td align="left" valign="top">85.0 (71.0&#x2010;99.0)</td><td align="left" valign="top">86.5 (72.0&#x2010;100.0)</td><td align="left" valign="top">83.0 (71.0&#x2010;97.0)</td><td align="left" valign="top">.58</td></tr></tbody></table><table-wrap-foot><fn id="table1fn1"><p><sup>a</sup>ECOG: Eastern Cooperative Oncology Group.</p></fn><fn id="table1fn2"><p><sup>b</sup>PFT: pulmonary function test.</p></fn><fn id="table1fn3"><p><sup>c</sup>FVC: forced vital capacity.</p></fn><fn id="table1fn4"><p><sup>d</sup>FEV<sub>1</sub>: forced expiratory volume in 1 second.</p></fn><fn id="table1fn5"><p><sup>e</sup>DLCO: diffusion capacity of the lungs for carbon monoxide.</p></fn></table-wrap-foot></table-wrap><table-wrap id="t2" position="float"><label>Table 2.</label><caption><p>Cancer-related characteristics of the included patients (N=3144).</p></caption><table id="table2" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom"/><td align="left" valign="bottom">Overall, n (%)</td><td align="left" valign="bottom">Training set (n=2215), n (%)</td><td align="left" valign="bottom">Validation set (n=464), n (%)</td><td align="left" valign="bottom">Test set (n=465), n (%)</td><td align="left" valign="bottom"><italic>P</italic> value</td></tr></thead><tbody><tr><td align="left" valign="top" colspan="5">Symptoms</td><td align="left" valign="top">&#x003E;.99</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Asymptomatic</td><td align="left" valign="top">1528 (48.6)</td><td align="left" valign="top">1067 (48.2)</td><td align="left" valign="top">235 (50.6)</td><td align="left" valign="top">226 (48.6)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Cough</td><td align="left" valign="top">890 (28.3)</td><td align="left" valign="top">624 (28.2)</td><td align="left" valign="top">138 (29.7)</td><td align="left" valign="top">128 (27.5)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Sputum</td><td align="left" valign="top">494 (15.7)</td><td align="left" valign="top">345 (15.6)</td><td align="left" valign="top">76 (16.4)</td><td align="left" valign="top">73 (15.7)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Dyspnea</td><td align="left" valign="top">431 (13.7)</td><td align="left" valign="top">301 (13.6)</td><td align="left" valign="top">62 (13.4)</td><td align="left" valign="top">68 (14.6)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Hoarseness</td><td align="left" valign="top">34 (1.1)</td><td align="left" valign="top">22 (1.0)</td><td align="left" valign="top">7 (1.5)</td><td align="left" valign="top">5 (1.1)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Hemoptysis</td><td align="left" valign="top">147 (4.7)</td><td align="left" valign="top">102 (4.6)</td><td align="left" valign="top">21 (4.5)</td><td align="left" valign="top">24 (5.2)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Weight loss</td><td align="left" valign="top">185 (5.9)</td><td align="left" valign="top">133 (6.0)</td><td align="left" valign="top">27 (5.8)</td><td align="left" valign="top">25 (5.4)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Pain</td><td align="left" valign="top">493 (15.7)</td><td align="left" valign="top">352 (15.9)</td><td align="left" valign="top">77 (16.6)</td><td align="left" valign="top">66 (14.2)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top" colspan="5">Histology</td><td align="left" valign="top">.51</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Squamous cell carcinoma</td><td align="left" valign="top">519 (16.5)</td><td align="left" valign="top">358 (16.2)</td><td align="left" valign="top">71 (15.3)</td><td align="left" valign="top">90 (19.4)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Adenocarcinoma</td><td align="left" valign="top">2490 (79.2)</td><td align="left" valign="top">1765 (79.7)</td><td align="left" valign="top">369 (79.5)</td><td align="left" valign="top">356 (76.6)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Large-cell carcinoma</td><td align="left" valign="top">16 (0.5)</td><td align="left" valign="top">10 (0.5)</td><td align="left" valign="top">3 (0.6)</td><td align="left" valign="top">3 (0.6)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>NSCLC NOS<sup><xref ref-type="table-fn" rid="table2fn1">a</xref></sup></td><td align="left" valign="top">234 (7.4)</td><td align="left" valign="top">164 (7.4)</td><td align="left" valign="top">40 (8.6)</td><td align="left" valign="top">30 (6.5)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top" colspan="5">Stage<sup><xref ref-type="table-fn" rid="table2fn2">b</xref></sup></td><td align="left" valign="top">.83</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>1</td><td align="left" valign="top">1113 (35.4)</td><td align="left" valign="top">802 (36.2)</td><td align="left" valign="top">161 (34.7)</td><td align="left" valign="top">168 (36.1)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>2</td><td align="left" valign="top">276 (8.8)</td><td align="left" valign="top">190 (8.6)</td><td align="left" valign="top">40 (8.6)</td><td align="left" valign="top">46 (9.9)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>3</td><td align="left" valign="top">455 (14.5)</td><td align="left" valign="top">328 (14.8)</td><td align="left" valign="top">61 (13.1)</td><td align="left" valign="top">66 (14.2)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>4</td><td align="left" valign="top">1282 (40.8)</td><td align="left" valign="top">895 (40.4)</td><td align="left" valign="top">202 (43.5)</td><td align="left" valign="top">185 (39.8)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top" colspan="6">Gene mutation</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>EGFR<sup><xref ref-type="table-fn" rid="table2fn3">c</xref></sup></td><td align="left" valign="top">1131 (36.0)</td><td align="left" valign="top">799 (36.1)</td><td align="left" valign="top">166 (35.8)</td><td align="left" valign="top">166 (35.7)</td><td align="left" valign="top">.98</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>ALK<sup><xref ref-type="table-fn" rid="table2fn4">d</xref></sup></td><td align="left" valign="top">209 (6.6)</td><td align="left" valign="top">159 (7.2)</td><td align="left" valign="top">27 (5.8)</td><td align="left" valign="top">23 (4.9)</td><td align="left" valign="top">.16</td></tr></tbody></table><table-wrap-foot><fn id="table2fn1"><p><sup>a</sup>NSCLC NOS: non&#x2013;small-cell lung cancer not otherwise specified.</p></fn><fn id="table2fn2"><p><sup>b</sup>Stage was classified according to the eighth edition of the American Joint Committee on Cancer staging system.</p></fn><fn id="table2fn3"><p><sup>c</sup>EGFR: epidermal growth factor receptor.</p></fn><fn id="table2fn4"><p><sup>d</sup>ALK: anaplastic lymphoma kinase.</p></fn></table-wrap-foot></table-wrap><p>Absolute SMD values for baseline characteristics between included and excluded patients are shown in Table S2 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>. Excluded patients had higher 5-year mortality than included patients (3793/5520, 68.7% vs 1794/3144, 57.1%; SMD 0.241) and were older (mean 68.4, SD 10.7 vs 65.5, SD 10.7 years; SMD 0.278).</p></sec><sec id="s3-2"><title>Training Models and Performance Evaluation</title><p>We selected 5 distinct hyperparameter configurations from the Hyperband optimization (Table S3 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). For each configuration, we rebuilt the network using the corresponding tuned settings, retrained it on the training cohort, and evaluated its performance on both the training and test sets. During this process, we recorded a comprehensive set of performance metrics to facilitate direct comparisons across models. Each final model was serialized into a Keras file to ensure reproducibility and enable downstream inference. Each file contained the complete network architecture, learned weights, and optimizer state, allowing the model to be reloaded and applied with a single command in any compatible Python environment.</p><p>Of the 5 models, we designated model A as the primary model for reporting. On the held-out test set, model A achieved an AUC of 0.879 (95% CI 0.848&#x2010;0.908), with an accuracy of 0.806 (95% CI 0.774&#x2010;0.841) and an <italic>F</italic><sub>1</sub>-score of 0.824 (95% CI 0.788&#x2010;0.858). The AUC and AUPRC of model A are shown in <xref ref-type="fig" rid="figure4">Figure 4</xref>. Model A also demonstrated reasonable calibration on the test set (<xref ref-type="fig" rid="figure5">Figure 5</xref>), with a Brier score of 0.142. Model U (unknown-aware encoding) achieved a test AUC of 0.865 (95% CI 0.830&#x2010;0.897), corresponding to a small decrease compared with model A (&#x0394;AUC=&#x2212;0.014, 95% CI &#x2212;0.025 to &#x2212;0.003). Other discrimination and classification metrics showed similarly small differences (Table S4 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>).</p><fig position="float" id="figure4"><label>Figure 4.</label><caption><p>Discrimination performance of model A on the test set: (A) receiver operating characteristic curve and (B) precision-recall curve. AUPRC: area under the precision-recall curve; AUROC: area under the receiver operating characteristic curve.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="medinform_v14i1e80574_fig04.png"/></fig><p>Figures S1 and S2 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref> show the discrimination performance and calibration curves of the 5 models on the test set. Across models A to E, performance was highly consistent, with AUC ranging from 0.875 to 0.879 and AUPRC ranging from 0.894 to 0.903. The CPH model exhibited similar performance, with an AUC of 0.878 (95% CI 0.844&#x2010;0.908). The TNM-only CPH benchmark model yielded a lower test AUC of 0.845 (95% CI 0.806&#x2010;0.880). Table S5 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref> provides the complete set of discrimination and classification metrics for all models, including both CPH baselines (full and TNM only). Brier scores for models A to E were also similar (approximately 0.140; Table S6 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>), indicating comparable calibration across model variants.</p><p>We evaluated within-stage discrimination for the primary model (model A). Within-stage performance was generally clinically meaningful in stages 1, 3, and 4 (AUC of 0.753, 95% CI 0.653&#x2010;0.844 in stage 1; 0.722, 95% CI 0.569&#x2010;0.855 in stage 3; and 0.725, 95% CI 0.625&#x2010;0.825 in stage 4). Stage 2 exhibited the lowest AUC and a wide 95% CI (0.642, 95% CI 0.471&#x2010;0.796). Detailed within-stage performance metrics for models A to E are summarized in Table S7 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>.</p><fig position="float" id="figure5"><label>Figure 5.</label><caption><p>Calibration plot of model A on the test set. The dashed diagonal line indicates perfect calibration.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="medinform_v14i1e80574_fig05.png"/></fig></sec><sec id="s3-3"><title>Feature Permutation and Changes in AUC</title><p>We conducted grouped-feature permutation analyses to assess feature importance. Stage yielded the largest decrease in AUC (0.217, 95% CI 0.212&#x2010;0.221), indicating this feature&#x2019;s predominant contribution. PFT ranked second (0.016, 95% CI 0.015&#x2010;0.017), followed by age (0.009, 95% CI 0.009&#x2010;0.010) and symptoms (0.008, 95% CI 0.007&#x2010;0.008). The permutation-based importance hierarchy was highly consistent across the 5 model variants (<xref ref-type="fig" rid="figure6">Figure 6</xref> and Table S8 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). A Friedman test showed no statistically significant differences in importance rankings across models (<italic>P</italic>=.93).</p><p>Feature importance was analyzed separately by histologic subtype (Table S9 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). Discrimination was higher in the adenocarcinoma cohort than in the squamous cell carcinoma cohort. Within adenocarcinoma, gene mutation showed a larger decrease in AUC than in the overall analysis (0.003, 95% CI 0.003&#x2010;0.003), a pattern that was consistent across all 5 model variants. This pattern was not observed in the squamous cell carcinoma cohort.</p><fig position="float" id="figure6"><label>Figure 6.</label><caption><p>Mean decrease in test set area under the receiver operating characteristic curve (AUC) after grouped feature permutation across the 5 model variants (models A-E). Stage produced the largest decrease in AUC, followed by pulmonary function test (PFT), symptoms, and age, with consistent rankings across model variants (Friedman test: <italic>P</italic>=.93).</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="medinform_v14i1e80574_fig06.png"/></fig></sec></sec><sec id="s4" sec-type="discussion"><title>Discussion</title><sec id="s4-1"><title>Overall Findings</title><p>Using the nationwide KCCR lung cancer cohort, we developed and validated a grouped-input deep learning model to predict 5-year mortality in NSCLC. We ensured reproducibility and minimized data leakage by implementing stratified training, validation, and test splits, with all preprocessing confined to the training set. On the test set, model A demonstrated strong discrimination and reasonable calibration. Across the 5 Hyperband-tuned model variants, test set performance (AUC=0.875&#x2010;0.879) and grouped-feature permutation profiles were highly consistent, supporting the robustness of the proposed framework.</p></sec><sec id="s4-2"><title>Model Performance</title><p>The grouped-input deep learning model demonstrated statistically comparable discrimination to that of a conventional CPH model built on the same routine clinical variables. This finding suggests that, for low-dimensional tabular clinical data without multimodal integration, complex neural network architectures may offer limited incremental benefit over interpretable regression-based approaches [<xref ref-type="bibr" rid="ref17">17</xref>,<xref ref-type="bibr" rid="ref18">18</xref>]. Taken together, these results reinforce that model complexity should be guided by data structure rather than architectural novelty. In this context, our findings are best interpreted as a methodological comparison rather than evidence that deep learning is inherently superior for 5-year mortality prediction using registry-based clinical features alone. Nevertheless, deep learning architectures can model nonlinear interactions and readily integrate radiological or molecular data. Consistency across the 5 Hyperband-tuned model variants supports the robustness of the preprocessing pipeline, suggesting that the proposed framework provides a stable foundation for future multimodal extensions.</p><p>Importantly, our model is a baseline prognostic model and does not explicitly incorporate treatment exposures, which can substantially modify survival. Thus, predicted risk represents an average prognosis across heterogeneous treatment pathways in the cohort and should not be interpreted as a treatment-conditional estimate.</p><p>Although the TNM-only benchmark yielded lower overall discrimination (AUC=0.845, 95% CI 0.806&#x2010;0.880), we further assessed model performance within each stage to evaluate whether nonstaging variables retained discriminatory value when staging information was held constant. Our within-stage analysis indicates that the model provides prognostic discrimination beyond TNM staging alone. Within-stage performance was favorable in stages 1, 3, and 4 (AUCs generally of &#x003E;0.700). In contrast, discrimination in stage 2 was lower and imprecise, with wide CIs that in some cases crossed 0.50, likely reflecting the small sample size in this subgroup. This may also partly reflect unmeasured heterogeneity in treatment pathways within stage 2, which could not be explicitly modeled due to incomplete treatment data. Prior validations of the TNM system have shown that revisions from the seventh to the eighth and ninth editions of the American Joint Committee on Cancer staging system yielded only modest gains in discriminatory ability and overall prognostic separation remained limited [<xref ref-type="bibr" rid="ref19">19</xref>,<xref ref-type="bibr" rid="ref20">20</xref>]. Although the model demonstrated incremental prognostic value beyond stage in the overall cohort, discrimination within stage 2 was modest (AUC=0.642). The relatively small sample size of stage 2 patients may have contributed to wider CIs and statistical instability; however, even accounting for this uncertainty, the current performance suggests that the model is not sufficiently robust for clinical risk stratification in stage 2 NSCLC. Additional prognostic variables and external validation would likely be required to improve reliability in this subgroup.</p><p>Recent studies have used diverse machine learning techniques to predict lung cancer survival, with reported AUCs ranging from approximately 0.650 to 0.800 [<xref ref-type="bibr" rid="ref11">11</xref>,<xref ref-type="bibr" rid="ref21">21</xref>]. In many of these investigations, tree-based ensembles such as random forests and Extreme Gradient Boosting reported stronger discrimination than simple deep learning methods [<xref ref-type="bibr" rid="ref22">22</xref>-<xref ref-type="bibr" rid="ref24">24</xref>]. Nevertheless, because of their ability to integrate heterogeneous inputs, researchers continue to explore deep learning models in NSCLC. For example, Lai et al [<xref ref-type="bibr" rid="ref25">25</xref>] combined biomarker and clinical data, achieving an AUC of 0.816 with an accuracy of 0.754. Wang et al [<xref ref-type="bibr" rid="ref26">26</xref>] reported an AUC of 0.715 using a similar multimodal design. In contrast, Hindocha et al [<xref ref-type="bibr" rid="ref23">23</xref>] developed an ensemble model based solely on clinical variables, which reached an AUC of 0.717. By comparison, our models&#x2014;despite relying exclusively on routine clinical features&#x2014;produced AUCs exceeding 0.875 and accuracies of approximately 0.800. These differences may reflect a combination of factors, including the grouped-input design (which mitigates sparsity, shares weights within clinically coherent groups, and captures nonlinear relationships) [<xref ref-type="bibr" rid="ref27">27</xref>,<xref ref-type="bibr" rid="ref28">28</xref>], rigorous leakage control, and large multicenter settings. Deep learning models trained on substantially smaller cohorts frequently show weaker discrimination and greater overfitting tendencies [<xref ref-type="bibr" rid="ref11">11</xref>]. However, cross-study comparisons should be interpreted cautiously due to heterogeneity in cohorts, end points, and validation protocols.</p></sec><sec id="s4-3"><title>Permutation-Based Feature Importance</title><p>Permutation-based importance analysis showed that stage was the dominant predictor of mortality, followed by PFT, symptoms, and age, consistent with earlier studies [<xref ref-type="bibr" rid="ref29">29</xref>-<xref ref-type="bibr" rid="ref33">33</xref>]. Because permutation importance can undervalue variables that are correlated with a single dominant predictor, this dominance may have led to a relative underestimation of other clinically relevant features [<xref ref-type="bibr" rid="ref21">21</xref>,<xref ref-type="bibr" rid="ref34">34</xref>,<xref ref-type="bibr" rid="ref35">35</xref>]. To minimize such bias, variables were permuted at the group level rather than individually [<xref ref-type="bibr" rid="ref36">36</xref>]. However, interpretation requires caution. For example, PFT included not only spirometric measurements (forced vital capacity, forced expiratory volume in 1 second, and diffusion capacity of the lungs for carbon monoxide) but also indicators of test availability. Given our sentinel-based encoding for unmeasured PFTs, the apparent importance of PFT may partly capture care process information (eg, workup completeness or surgical candidacy) rather than the prognostic effect of lung function values themselves. This likely reflects a characteristic of real-world registry data, in which diagnostic testing patterns may be correlated with clinical severity and treatment eligibility. Accordingly, feature importance in this context should not be interpreted as reflecting the independent prognostic effect of spirometry alone but rather as a combination of lung function measurements and care-related factors.</p><p>Smoking-related variables and histology exhibited only modest marginal importance, which is consistent with the feature distribution imbalance of the cohort (a high prevalence of never smokers and adenocarcinoma), reducing variability in smoking metrics and limiting representation of squamous or large-cell carcinoma [<xref ref-type="bibr" rid="ref37">37</xref>,<xref ref-type="bibr" rid="ref38">38</xref>]. The relatively low importance of BMI is compatible with the reported &#x201C;obesity paradox,&#x201D; in which risk appears nonlinear and a single baseline measurement may dilute the marginal effect [<xref ref-type="bibr" rid="ref39">39</xref>,<xref ref-type="bibr" rid="ref40">40</xref>]. We also evaluated whether model-level factors could bias these rankings. The 5 models were trained using distinct hyperparameter settings, including different dropout rates and different numbers of hidden units in the feature group&#x2013;specific layers. Although such differences can influence importance estimates [<xref ref-type="bibr" rid="ref41">41</xref>], the rankings were highly concordant across models, suggesting that any bias from hyperparameter choices was negligible.</p><p>This study examined the importance of gene mutations within histological subgroups. In adenocarcinoma, gene mutation became modestly more influential than in the overall analysis, with EGFR consistently surpassing ALK across all 5 models. In contrast, neither mutation provided meaningful predictive value in squamous cell carcinoma. Although both EGFR and ALK have clear therapeutic relevance in NSCLC as targets of tyrosine kinase inhibitors, their apparent prognostic contributions can vary by histology and prevalence [<xref ref-type="bibr" rid="ref2">2</xref>,<xref ref-type="bibr" rid="ref42">42</xref>]. Our findings align with those of previous reports in which EGFR was associated with more favorable outcomes in adenocarcinoma, whereas ALK mutations were less frequent and exhibited weaker associations with survival [<xref ref-type="bibr" rid="ref42">42</xref>-<xref ref-type="bibr" rid="ref44">44</xref>]. Because squamous cell carcinoma rarely harbors either mutation and is associated with intrinsically poorer outcomes [<xref ref-type="bibr" rid="ref44">44</xref>], effect estimates in this subgroup are inherently uncertain. Moreover, residual confounding by therapy exposure cannot be excluded in the absence of treatment-level data. Different patterns may emerge in cohorts with larger proportions of squamous cell carcinoma or higher ALK mutation frequencies.</p></sec><sec id="s4-4"><title>Limitations</title><p>This study has several limitations. First, it was a retrospective analysis limited to a Korean cohort; interethnic differences in EGFR mutation prevalence, histology, and smoking patterns may affect generalizability [<xref ref-type="bibr" rid="ref45">45</xref>,<xref ref-type="bibr" rid="ref46">46</xref>]. Second, registry-based data have inherent constraints. Because our cohort was diagnosed between 2014 and 2017, key biomarkers (eg, KRAS mutation, programmed death-ligand 1, and tumor mutational burden) and detailed treatment variables were not routinely available or consistently recorded. As a result, the absolute mortality estimates generated by our model may be higher than those observed under contemporary treatment standards, and model calibration may shift in more recent patient populations. Therefore, external validation and potential recalibration in temporally distinct cohorts will be necessary before clinical implementation. Third, &#x201C;unknown&#x201D; values for ECOG status and smoking history were recoded to default categories to enable complete input vectors. If these values were not missing at random, this preprocessing step might have introduced optimistic bias in survival prediction. Fourth, although the overall sample size was large, some subgroup analyses were underpowered. Notably, the stage 2 subgroup in the test set was small (46/465, 9.9%) with wide CIs, some of which crossed 0.50. This is particularly important because stage 2 represents a key clinical decision point for adjuvant therapy. Fifth, although we compared our model with a conventional CPH model, we did not conduct extensive benchmarking against multiple strong tabular learners; therefore, comparative performance across alternative tabular modeling approaches should be interpreted cautiously. Because TNM stage dominated permutation-based importance, residual correlation-related bias cannot be excluded and may attenuate the apparent importance of correlated predictors. Finally, our evaluation relied on internal validation within a single registry split. As a result, the transportability of the model across different health care systems, patient populations, and treatment eras remains uncertain. Given these constraints, external validation in an independent cohort is required to assess both discrimination and calibration stability before clinical deployment or widespread adoption.</p></sec><sec id="s4-5"><title>Conclusions</title><p>In this study, a deep learning model based on the nationwide lung cancer staging dataset from the KCCR demonstrated performance comparable to that of a conventional CPH model and previously reported machine learning methods. By aligning inputs with clinically coherent groups and quantifying contributions through permutation-based, group-level importance, the framework provides transparent and reproducible explanations using routine clinical variables. These features position the model as a practical foundation for future clinical evaluation and integration of additional modalities such as imaging or molecular data in more complex predictive settings. Future work should include external validation in independent and temporally distinct cohorts as well as prospective evaluation of clinical utility before routine clinical implementation.</p></sec></sec></body><back><ack><p>The data used in this study were obtained from the Korea Central Cancer Registry supported by the Korean Association for Lung Cancer. During preparation of this manuscript, the authors used generative artificial intelligence tools ChatGPT (OpenAI; models GPT-4o, o3, and GPT-5.2) to assist with code revision and organize ideas. No artificial intelligence&#x2013;generated text was used verbatim in the manuscript. The authors take full responsibility for the content, analyses, interpretation, and conclusions. All references were identified and verified by the authors.</p></ack><notes><sec><title>Funding</title><p>The authors declared no financial support was received for this work.</p></sec><sec><title>Data Availability</title><p>The datasets generated or analyzed during this study are not publicly available due to privacy and data-use restrictions related to the Korean Central Cancer Registry, but may be available from the corresponding author on reasonable request under an institutional data-use agreement approved by an institutional review board. The code and a fully synthetic sample dataset are available in the GitHub repository [<xref ref-type="bibr" rid="ref47">47</xref>].</p></sec></notes><fn-group><fn fn-type="conflict"><p>None declared.</p></fn></fn-group><glossary><title>Abbreviations</title><def-list><def-item><term id="abb1">ALK</term><def><p>anaplastic lymphoma kinase</p></def></def-item><def-item><term id="abb2">AUC</term><def><p>area under the receiver operating characteristic curve</p></def></def-item><def-item><term id="abb3">AUPRC</term><def><p>area under the precision-recall curve</p></def></def-item><def-item><term id="abb4">CPH</term><def><p>Cox proportional hazards</p></def></def-item><def-item><term id="abb5">ECOG</term><def><p>Eastern Cooperative Oncology Group</p></def></def-item><def-item><term id="abb6">EGFR</term><def><p>epidermal growth factor receptor</p></def></def-item><def-item><term id="abb7">KCCR</term><def><p>Korea Central Cancer Registry</p></def></def-item><def-item><term id="abb8">MLP</term><def><p>multilayer perceptron</p></def></def-item><def-item><term id="abb9">NSCLC</term><def><p>non&#x2013;small-cell lung cancer</p></def></def-item><def-item><term id="abb10">PFT</term><def><p>pulmonary function test</p></def></def-item><def-item><term id="abb11">SMD</term><def><p>standardized mean difference</p></def></def-item><def-item><term id="abb12">TNM</term><def><p>tumor, node, metastasis</p></def></def-item></def-list></glossary><ref-list><title>References</title><ref id="ref1"><label>1</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lee</surname><given-names>JG</given-names> </name><name name-style="western"><surname>Kim</surname><given-names>HC</given-names> </name><name name-style="western"><surname>Choi</surname><given-names>CM</given-names> </name></person-group><article-title>Recent trends of lung cancer in Korea</article-title><source>Tuberc Respir Dis (Seoul)</source><year>2021</year><month>04</month><volume>84</volume><issue>2</issue><fpage>89</fpage><lpage>95</lpage><pub-id pub-id-type="doi">10.4046/trd.2020.0134</pub-id></nlm-citation></ref><ref id="ref2"><label>2</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Riely</surname><given-names>GJ</given-names> </name><name name-style="western"><surname>Wood</surname><given-names>DE</given-names> </name><name name-style="western"><surname>Ettinger</surname><given-names>DS</given-names> </name><etal/></person-group><article-title>Non-small cell lung cancer, version 4.2024, NCCN Clinical Practice Guidelines in Oncology</article-title><source>J Natl Compr Canc Netw</source><year>2024</year><volume>22</volume><issue>4</issue><fpage>249</fpage><lpage>274</lpage><pub-id pub-id-type="doi">10.6004/jnccn.2204.0023</pub-id></nlm-citation></ref><ref id="ref3"><label>3</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Ganti</surname><given-names>AK</given-names> </name><name name-style="western"><surname>Klein</surname><given-names>AB</given-names> </name><name name-style="western"><surname>Cotarla</surname><given-names>I</given-names> </name><name name-style="western"><surname>Seal</surname><given-names>B</given-names> </name><name name-style="western"><surname>Chou</surname><given-names>E</given-names> </name></person-group><article-title>Update of incidence, prevalence, survival, and initial treatment in patients with non-small cell lung cancer in the US</article-title><source>JAMA Oncol</source><year>2021</year><month>12</month><day>1</day><volume>7</volume><issue>12</issue><fpage>1824</fpage><lpage>1832</lpage><pub-id pub-id-type="doi">10.1001/jamaoncol.2021.4932</pub-id><pub-id pub-id-type="medline">34673888</pub-id></nlm-citation></ref><ref id="ref4"><label>4</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Jung</surname><given-names>HA</given-names> </name><name name-style="western"><surname>Lee</surname><given-names>DH</given-names> </name><name name-style="western"><surname>Lim</surname><given-names>SM</given-names> </name><etal/></person-group><article-title>Epidemiology and outcomes of non-small cell lung cancer in South Korea</article-title><source>JAMA Netw Open</source><year>2024</year><month>02</month><day>5</day><volume>7</volume><issue>2</issue><fpage>e2355331</fpage><pub-id pub-id-type="doi">10.1001/jamanetworkopen.2023.55331</pub-id><pub-id pub-id-type="medline">38334998</pub-id></nlm-citation></ref><ref id="ref5"><label>5</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Chi</surname><given-names>SA</given-names> </name><name name-style="western"><surname>Yu</surname><given-names>H</given-names> </name><name name-style="western"><surname>Choi</surname><given-names>YL</given-names> </name><etal/></person-group><article-title>Trends in survival rates of non-small cell lung cancer with use of molecular testing and targeted therapy in Korea, 2010-2020</article-title><source>JAMA Netw Open</source><year>2023</year><month>03</month><day>1</day><volume>6</volume><issue>3</issue><fpage>e232002</fpage><pub-id pub-id-type="doi">10.1001/jamanetworkopen.2023.2002</pub-id><pub-id pub-id-type="medline">36929402</pub-id></nlm-citation></ref><ref id="ref6"><label>6</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Ellis</surname><given-names>RJ</given-names> </name><name name-style="western"><surname>Sander</surname><given-names>RM</given-names> </name><name name-style="western"><surname>Limon</surname><given-names>A</given-names> </name></person-group><article-title>Twelve key challenges in medical machine learning and solutions</article-title><source>Intell Based Med</source><year>2022</year><volume>6</volume><fpage>100068</fpage><pub-id pub-id-type="doi">10.1016/j.ibmed.2022.100068</pub-id></nlm-citation></ref><ref id="ref7"><label>7</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Swanson</surname><given-names>K</given-names> </name><name name-style="western"><surname>Wu</surname><given-names>E</given-names> </name><name name-style="western"><surname>Zhang</surname><given-names>A</given-names> </name><name name-style="western"><surname>Alizadeh</surname><given-names>AA</given-names> </name><name name-style="western"><surname>Zou</surname><given-names>J</given-names> </name></person-group><article-title>From patterns to patients: advances in clinical machine learning for cancer diagnosis, prognosis, and treatment</article-title><source>Cell</source><year>2023</year><month>04</month><day>13</day><volume>186</volume><issue>8</issue><fpage>1772</fpage><lpage>1791</lpage><pub-id pub-id-type="doi">10.1016/j.cell.2023.01.035</pub-id><pub-id pub-id-type="medline">36905928</pub-id></nlm-citation></ref><ref id="ref8"><label>8</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Liu</surname><given-names>X</given-names> </name><name name-style="western"><surname>Faes</surname><given-names>L</given-names> </name><name name-style="western"><surname>Kale</surname><given-names>AU</given-names> </name><etal/></person-group><article-title>A comparison of deep learning performance against health-care professionals in detecting diseases from medical imaging: a systematic review and meta-analysis</article-title><source>Lancet Digit Health</source><year>2019</year><month>10</month><volume>1</volume><issue>6</issue><fpage>e271</fpage><lpage>e297</lpage><pub-id pub-id-type="doi">10.1016/S2589-7500(19)30123-2</pub-id></nlm-citation></ref><ref id="ref9"><label>9</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Choi</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Yu</surname><given-names>W</given-names> </name><name name-style="western"><surname>Nagarajan</surname><given-names>MB</given-names> </name><etal/></person-group><article-title>Translating AI to clinical practice: overcoming data shift with explainability</article-title><source>Radiographics</source><year>2023</year><month>05</month><volume>43</volume><issue>5</issue><fpage>e220105</fpage><pub-id pub-id-type="doi">10.1148/rg.220105</pub-id><pub-id pub-id-type="medline">37104124</pub-id></nlm-citation></ref><ref id="ref10"><label>10</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Esteva</surname><given-names>A</given-names> </name><name name-style="western"><surname>Chou</surname><given-names>K</given-names> </name><name name-style="western"><surname>Yeung</surname><given-names>S</given-names> </name><etal/></person-group><article-title>Deep learning-enabled medical computer vision</article-title><source>NPJ Digit Med</source><year>2021</year><month>01</month><day>8</day><volume>4</volume><issue>1</issue><fpage>5</fpage><pub-id pub-id-type="doi">10.1038/s41746-020-00376-2</pub-id><pub-id pub-id-type="medline">33420381</pub-id></nlm-citation></ref><ref id="ref11"><label>11</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Altuhaifa</surname><given-names>FA</given-names> </name><name name-style="western"><surname>Win</surname><given-names>KT</given-names> </name><name name-style="western"><surname>Su</surname><given-names>G</given-names> </name></person-group><article-title>Predicting lung cancer survival based on clinical data using machine learning: a review</article-title><source>Comput Biol Med</source><year>2023</year><month>10</month><volume>165</volume><fpage>107338</fpage><pub-id pub-id-type="doi">10.1016/j.compbiomed.2023.107338</pub-id><pub-id pub-id-type="medline">37625260</pub-id></nlm-citation></ref><ref id="ref12"><label>12</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Yeh</surname><given-names>MC</given-names> </name><name name-style="western"><surname>Wang</surname><given-names>YH</given-names> </name><name name-style="western"><surname>Yang</surname><given-names>HC</given-names> </name><name name-style="western"><surname>Bai</surname><given-names>KJ</given-names> </name><name name-style="western"><surname>Wang</surname><given-names>HH</given-names> </name><name name-style="western"><surname>Li</surname><given-names>YC</given-names> </name></person-group><article-title>Artificial intelligence-based prediction of lung cancer risk using nonimaging electronic medical records: deep learning approach</article-title><source>J Med Internet Res</source><year>2021</year><month>08</month><day>3</day><volume>23</volume><issue>8</issue><fpage>e26256</fpage><pub-id pub-id-type="doi">10.2196/26256</pub-id><pub-id pub-id-type="medline">34342588</pub-id></nlm-citation></ref><ref id="ref13"><label>13</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Zhang</surname><given-names>D</given-names> </name><name name-style="western"><surname>Lu</surname><given-names>B</given-names> </name><name name-style="western"><surname>Liang</surname><given-names>B</given-names> </name><etal/></person-group><article-title>Interpretable deep learning survival predictive tool for small cell lung cancer</article-title><source>Front Oncol</source><year>2023</year><volume>13</volume><fpage>1162181</fpage><pub-id pub-id-type="doi">10.3389/fonc.2023.1162181</pub-id></nlm-citation></ref><ref id="ref14"><label>14</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Chen</surname><given-names>S</given-names> </name><name name-style="western"><surname>Wu</surname><given-names>S</given-names> </name></person-group><article-title>Identifying lung cancer risk factors in the elderly using deep neural networks: quantitative analysis of web-based survey data</article-title><source>J Med Internet Res</source><year>2020</year><month>03</month><day>17</day><volume>22</volume><issue>3</issue><fpage>e17695</fpage><pub-id pub-id-type="doi">10.2196/17695</pub-id><pub-id pub-id-type="medline">32181751</pub-id></nlm-citation></ref><ref id="ref15"><label>15</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kim</surname><given-names>YC</given-names> </name><name name-style="western"><surname>Won</surname><given-names>YJ</given-names> </name></person-group><article-title>The development of the Korean Lung Cancer Registry (KALC-R)</article-title><source>Tuberc Respir Dis</source><year>2019</year><volume>82</volume><issue>2</issue><fpage>91</fpage><lpage>93</lpage><pub-id pub-id-type="doi">10.4046/trd.2018.0032</pub-id></nlm-citation></ref><ref id="ref16"><label>16</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Altmann</surname><given-names>A</given-names> </name><name name-style="western"><surname>Tolo&#x015F;i</surname><given-names>L</given-names> </name><name name-style="western"><surname>Sander</surname><given-names>O</given-names> </name><name name-style="western"><surname>Lengauer</surname><given-names>T</given-names> </name></person-group><article-title>Permutation importance: a corrected feature importance measure</article-title><source>Bioinformatics</source><year>2010</year><month>05</month><day>15</day><volume>26</volume><issue>10</issue><fpage>1340</fpage><lpage>1347</lpage><pub-id pub-id-type="doi">10.1093/bioinformatics/btq134</pub-id><pub-id pub-id-type="medline">20385727</pub-id></nlm-citation></ref><ref id="ref17"><label>17</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kim</surname><given-names>H</given-names> </name><name name-style="western"><surname>Park</surname><given-names>T</given-names> </name><name name-style="western"><surname>Jang</surname><given-names>J</given-names> </name><name name-style="western"><surname>Lee</surname><given-names>S</given-names> </name></person-group><article-title>Comparison of survival prediction models for pancreatic cancer: Cox model versus machine learning models</article-title><source>Genomics Inform</source><year>2022</year><month>06</month><volume>20</volume><issue>2</issue><fpage>e23</fpage><pub-id pub-id-type="doi">10.5808/gi.22036</pub-id><pub-id pub-id-type="medline">35794703</pub-id></nlm-citation></ref><ref id="ref18"><label>18</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Xia</surname><given-names>K</given-names> </name><name name-style="western"><surname>Chen</surname><given-names>D</given-names> </name><name name-style="western"><surname>Jin</surname><given-names>S</given-names> </name><name name-style="western"><surname>Yi</surname><given-names>X</given-names> </name><name name-style="western"><surname>Luo</surname><given-names>L</given-names> </name></person-group><article-title>Prediction of lung papillary adenocarcinoma-specific survival using ensemble machine learning models</article-title><source>Sci Rep</source><year>2023</year><month>09</month><day>8</day><volume>13</volume><issue>1</issue><fpage>14827</fpage><pub-id pub-id-type="doi">10.1038/s41598-023-40779-1</pub-id><pub-id pub-id-type="medline">37684259</pub-id></nlm-citation></ref><ref id="ref19"><label>19</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Jung</surname><given-names>HS</given-names> </name><name name-style="western"><surname>Lee</surname><given-names>JG</given-names> </name><name name-style="western"><surname>Lee</surname><given-names>CY</given-names> </name><name name-style="western"><surname>Kim</surname><given-names>DJ</given-names> </name><name name-style="western"><surname>Chung</surname><given-names>KY</given-names> </name></person-group><article-title>Validation of the T descriptor in the new 8th TNM classification for non-small cell lung cancer</article-title><source>J Thorac Dis</source><year>2018</year><month>01</month><volume>10</volume><issue>1</issue><fpage>162</fpage><lpage>167</lpage><pub-id pub-id-type="doi">10.21037/jtd.2017.12.20</pub-id><pub-id pub-id-type="medline">29600045</pub-id></nlm-citation></ref><ref id="ref20"><label>20</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Wu</surname><given-names>L</given-names> </name><name name-style="western"><surname>Tian</surname><given-names>JY</given-names> </name><name name-style="western"><surname>Li</surname><given-names>MJ</given-names> </name><etal/></person-group><article-title>Validation of the 9th edition of the TNM staging system for limited-stage small cell lung cancer after resection: a multicenter study</article-title><source>Lung Cancer</source><year>2025</year><month>02</month><volume>200</volume><fpage>108085</fpage><pub-id pub-id-type="doi">10.1016/j.lungcan.2025.108085</pub-id><pub-id pub-id-type="medline">40519973</pub-id></nlm-citation></ref><ref id="ref21"><label>21</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Didier</surname><given-names>AJ</given-names> </name><name name-style="western"><surname>Nigro</surname><given-names>A</given-names> </name><name name-style="western"><surname>Noori</surname><given-names>Z</given-names> </name><name name-style="western"><surname>Omballi</surname><given-names>MA</given-names> </name><name name-style="western"><surname>Pappada</surname><given-names>SM</given-names> </name><name name-style="western"><surname>Hamouda</surname><given-names>DM</given-names> </name></person-group><article-title>Application of machine learning for lung cancer survival prognostication-a systematic review and meta-analysis</article-title><source>Front Artif Intell</source><year>2024</year><volume>7</volume><fpage>1365777</fpage><pub-id pub-id-type="doi">10.3389/frai.2024.1365777</pub-id><pub-id pub-id-type="medline">38646415</pub-id></nlm-citation></ref><ref id="ref22"><label>22</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Jochems</surname><given-names>A</given-names> </name><name name-style="western"><surname>El-Naqa</surname><given-names>I</given-names> </name><name name-style="western"><surname>Kessler</surname><given-names>M</given-names> </name><etal/></person-group><article-title>A prediction model for early death in non-small cell lung cancer patients following curative-intent chemoradiotherapy</article-title><source>Acta Oncol</source><year>2018</year><month>02</month><volume>57</volume><issue>2</issue><fpage>226</fpage><lpage>230</lpage><pub-id pub-id-type="doi">10.1080/0284186X.2017.1385842</pub-id><pub-id pub-id-type="medline">29034756</pub-id></nlm-citation></ref><ref id="ref23"><label>23</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Hindocha</surname><given-names>S</given-names> </name><name name-style="western"><surname>Charlton</surname><given-names>TG</given-names> </name><name name-style="western"><surname>Linton-Reid</surname><given-names>K</given-names> </name><etal/></person-group><article-title>A comparison of machine learning methods for predicting recurrence and death after curative-intent radiotherapy for non-small cell lung cancer: development and validation of multivariable clinical prediction models</article-title><source>EBioMedicine</source><year>2022</year><month>03</month><volume>77</volume><fpage>103911</fpage><pub-id pub-id-type="doi">10.1016/j.ebiom.2022.103911</pub-id><pub-id pub-id-type="medline">35248997</pub-id></nlm-citation></ref><ref id="ref24"><label>24</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Siah</surname><given-names>KW</given-names> </name><name name-style="western"><surname>Khozin</surname><given-names>S</given-names> </name><name name-style="western"><surname>Wong</surname><given-names>CH</given-names> </name><name name-style="western"><surname>Lo</surname><given-names>AW</given-names> </name></person-group><article-title>Machine-learning and stochastic tumor growth models for predicting outcomes in patients with advanced non-small-cell lung cancer</article-title><source>JCO Clin Cancer Inform</source><year>2019</year><month>09</month><volume>3</volume><fpage>1</fpage><lpage>11</lpage><pub-id pub-id-type="doi">10.1200/CCI.19.00046</pub-id><pub-id pub-id-type="medline">31539267</pub-id></nlm-citation></ref><ref id="ref25"><label>25</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lai</surname><given-names>YH</given-names> </name><name name-style="western"><surname>Chen</surname><given-names>WN</given-names> </name><name name-style="western"><surname>Hsu</surname><given-names>TC</given-names> </name><name name-style="western"><surname>Lin</surname><given-names>C</given-names> </name><name name-style="western"><surname>Tsao</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Wu</surname><given-names>S</given-names> </name></person-group><article-title>Overall survival prediction of non-small cell lung cancer by integrating microarray and clinical data with deep learning</article-title><source>Sci Rep</source><year>2020</year><month>03</month><day>13</day><volume>10</volume><issue>1</issue><fpage>4679</fpage><pub-id pub-id-type="doi">10.1038/s41598-020-61588-w</pub-id><pub-id pub-id-type="medline">32170141</pub-id></nlm-citation></ref><ref id="ref26"><label>26</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Wang</surname><given-names>S</given-names> </name><name name-style="western"><surname>Zhang</surname><given-names>H</given-names> </name><name name-style="western"><surname>Liu</surname><given-names>Z</given-names> </name><name name-style="western"><surname>Liu</surname><given-names>Y</given-names> </name></person-group><article-title>A novel deep learning method to predict lung cancer long-term survival with biological knowledge incorporated gene expression images and clinical data</article-title><source>Front Genet</source><year>2022</year><volume>13</volume><fpage>800853</fpage><pub-id pub-id-type="doi">10.3389/fgene.2022.800853</pub-id><pub-id pub-id-type="medline">35368657</pub-id></nlm-citation></ref><ref id="ref27"><label>27</label><nlm-citation citation-type="other"><person-group person-group-type="author"><name name-style="western"><surname>Xu</surname><given-names>S</given-names> </name><name name-style="western"><surname>Bu</surname><given-names>Z</given-names> </name><name name-style="western"><surname>Chaudhari</surname><given-names>P</given-names> </name><name name-style="western"><surname>Barnett</surname><given-names>IJ</given-names> </name></person-group><article-title>Sparse neural additive model: interpretable deep learning with feature selection via group sparsity</article-title><source>arXiv</source><comment>Preprint posted online on  Feb 25, 2022</comment><pub-id pub-id-type="doi">10.48550/arXiv.2202.12482</pub-id></nlm-citation></ref><ref id="ref28"><label>28</label><nlm-citation citation-type="other"><person-group person-group-type="author"><name name-style="western"><surname>Chen</surname><given-names>J</given-names> </name><name name-style="western"><surname>Liao</surname><given-names>K</given-names> </name><name name-style="western"><surname>Wan</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Chen</surname><given-names>DZ</given-names> </name><name name-style="western"><surname>Wu</surname><given-names>J</given-names> </name></person-group><article-title>DANets: deep abstract networks for tabular data classification and regression</article-title><source>arXiv</source><comment>Preprint posted online on  Dec 6, 2021</comment><pub-id pub-id-type="doi">10.48550/arxiv.2112.02962</pub-id></nlm-citation></ref><ref id="ref29"><label>29</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Yuan</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Zhang</surname><given-names>G</given-names> </name><name name-style="western"><surname>Gu</surname><given-names>Y</given-names> </name><etal/></person-group><article-title>Artificial intelligence-assisted machine learning models for predicting lung cancer survival</article-title><source>Asia Pac J Oncol Nurs</source><year>2025</year><volume>12</volume><fpage>100680</fpage><pub-id pub-id-type="doi">10.1016/j.apjon.2025.100680</pub-id><pub-id pub-id-type="medline">40201531</pub-id></nlm-citation></ref><ref id="ref30"><label>30</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Caruso</surname><given-names>CM</given-names> </name><name name-style="western"><surname>Guarrasi</surname><given-names>V</given-names> </name><name name-style="western"><surname>Ramella</surname><given-names>S</given-names> </name><name name-style="western"><surname>Soda</surname><given-names>P</given-names> </name></person-group><article-title>A deep learning approach for overall survival prediction in lung cancer with missing values</article-title><source>Comput Methods Programs Biomed</source><year>2024</year><month>09</month><volume>254</volume><fpage>108308</fpage><pub-id pub-id-type="doi">10.1016/j.cmpb.2024.108308</pub-id><pub-id pub-id-type="medline">38968829</pub-id></nlm-citation></ref><ref id="ref31"><label>31</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kwon</surname><given-names>OB</given-names> </name><name name-style="western"><surname>Han</surname><given-names>S</given-names> </name><name name-style="western"><surname>Lee</surname><given-names>HY</given-names> </name><etal/></person-group><article-title>Prediction of postoperative lung function in lung cancer patients using machine learning models</article-title><source>Tuberc Respir Dis (Seoul)</source><year>2023</year><month>07</month><volume>86</volume><issue>3</issue><fpage>203</fpage><lpage>215</lpage><pub-id pub-id-type="doi">10.4046/trd.2022.0048</pub-id></nlm-citation></ref><ref id="ref32"><label>32</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Tas</surname><given-names>F</given-names> </name><name name-style="western"><surname>Ciftci</surname><given-names>R</given-names> </name><name name-style="western"><surname>Kilic</surname><given-names>L</given-names> </name><name name-style="western"><surname>Karabulut</surname><given-names>S</given-names> </name></person-group><article-title>Age is a prognostic factor affecting survival in lung cancer patients</article-title><source>Oncol Lett</source><year>2013</year><month>11</month><volume>6</volume><issue>5</issue><fpage>1507</fpage><lpage>1513</lpage><pub-id pub-id-type="doi">10.3892/ol.2013.1566</pub-id><pub-id pub-id-type="medline">24179550</pub-id></nlm-citation></ref><ref id="ref33"><label>33</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Shen</surname><given-names>YL</given-names> </name><name name-style="western"><surname>Shen</surname><given-names>CI</given-names> </name><name name-style="western"><surname>Chiang</surname><given-names>CL</given-names> </name><etal/></person-group><article-title>Reduced FEV<sub>1</sub> as prognostic factors in patients with advanced NSCLC receiving immune checkpoint inhibitors</article-title><source>Front Med (Lausanne)</source><year>2022</year><volume>9</volume><fpage>860733</fpage><pub-id pub-id-type="doi">10.3389/fmed.2022.860733</pub-id><pub-id pub-id-type="medline">35391883</pub-id></nlm-citation></ref><ref id="ref34"><label>34</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Strobl</surname><given-names>C</given-names> </name><name name-style="western"><surname>Boulesteix</surname><given-names>AL</given-names> </name><name name-style="western"><surname>Kneib</surname><given-names>T</given-names> </name><name name-style="western"><surname>Augustin</surname><given-names>T</given-names> </name><name name-style="western"><surname>Zeileis</surname><given-names>A</given-names> </name></person-group><article-title>Conditional variable importance for random forests</article-title><source>BMC Bioinformatics</source><year>2008</year><month>07</month><day>11</day><volume>9</volume><fpage>307</fpage><pub-id pub-id-type="doi">10.1186/1471-2105-9-307</pub-id><pub-id pub-id-type="medline">18620558</pub-id></nlm-citation></ref><ref id="ref35"><label>35</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Wallace</surname><given-names>ML</given-names> </name><name name-style="western"><surname>Mentch</surname><given-names>L</given-names> </name><name name-style="western"><surname>Wheeler</surname><given-names>BJ</given-names> </name><etal/></person-group><article-title>Use and misuse of random forest variable importance metrics in medicine: demonstrations through incident stroke prediction</article-title><source>BMC Med Res Methodol</source><year>2023</year><month>06</month><day>19</day><volume>23</volume><issue>1</issue><fpage>144</fpage><pub-id pub-id-type="doi">10.1186/s12874-023-01965-x</pub-id><pub-id pub-id-type="medline">37337173</pub-id></nlm-citation></ref><ref id="ref36"><label>36</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Au</surname><given-names>Q</given-names> </name><name name-style="western"><surname>Herbinger</surname><given-names>J</given-names> </name><name name-style="western"><surname>Stachl</surname><given-names>C</given-names> </name><name name-style="western"><surname>Bischl</surname><given-names>B</given-names> </name><name name-style="western"><surname>Casalicchio</surname><given-names>G</given-names> </name></person-group><article-title>Grouped feature importance and combined features effect plot</article-title><source>Data Min Knowl Disc</source><year>2022</year><month>07</month><volume>36</volume><fpage>1401</fpage><lpage>1450</lpage><pub-id pub-id-type="doi">10.1007/s10618-022-00840-5</pub-id></nlm-citation></ref><ref id="ref37"><label>37</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Grosu</surname><given-names>HB</given-names> </name><name name-style="western"><surname>Manzanera</surname><given-names>A</given-names> </name><name name-style="western"><surname>Shivakumar</surname><given-names>S</given-names> </name><name name-style="western"><surname>Sun</surname><given-names>S</given-names> </name><name name-style="western"><surname>Noguras Gonzalez</surname><given-names>G</given-names> </name><name name-style="western"><surname>Ost</surname><given-names>DE</given-names> </name></person-group><article-title>Survival disparities following surgery among patients with different histological types of non-small cell lung cancer</article-title><source>Lung Cancer</source><year>2020</year><month>02</month><volume>140</volume><fpage>55</fpage><lpage>58</lpage><pub-id pub-id-type="doi">10.1016/j.lungcan.2019.12.007</pub-id><pub-id pub-id-type="medline">31865279</pub-id></nlm-citation></ref><ref id="ref38"><label>38</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Hao</surname><given-names>B</given-names> </name><name name-style="western"><surname>Fan</surname><given-names>T</given-names> </name><name name-style="western"><surname>Xiong</surname><given-names>J</given-names> </name><etal/></person-group><article-title>The prognostic significance of the histological types in patients with nonsmall cell lung cancer &#x2264;2 cm</article-title><source>Front Surg</source><year>2021</year><volume>8</volume><fpage>721567</fpage><pub-id pub-id-type="doi">10.3389/fsurg.2021.721567</pub-id><pub-id pub-id-type="medline">34760914</pub-id></nlm-citation></ref><ref id="ref39"><label>39</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Shepshelovich</surname><given-names>D</given-names> </name><name name-style="western"><surname>Xu</surname><given-names>W</given-names> </name><name name-style="western"><surname>Lu</surname><given-names>L</given-names> </name><etal/></person-group><article-title>Body mass index (BMI), BMI change, and overall survival in patients with SCLC and NSCLC: a pooled analysis of the International Lung Cancer Consortium</article-title><source>J Thorac Oncol</source><year>2019</year><month>09</month><volume>14</volume><issue>9</issue><fpage>1594</fpage><lpage>1607</lpage><pub-id pub-id-type="doi">10.1016/j.jtho.2019.05.031</pub-id><pub-id pub-id-type="medline">31163278</pub-id></nlm-citation></ref><ref id="ref40"><label>40</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Rock</surname><given-names>CL</given-names> </name><name name-style="western"><surname>Thomson</surname><given-names>CA</given-names> </name><name name-style="western"><surname>Sullivan</surname><given-names>KR</given-names> </name><etal/></person-group><article-title>American Cancer Society nutrition and physical activity guideline for cancer survivors</article-title><source>CA Cancer J Clin</source><year>2022</year><month>05</month><volume>72</volume><issue>3</issue><fpage>230</fpage><lpage>262</lpage><pub-id pub-id-type="doi">10.3322/caac.21719</pub-id><pub-id pub-id-type="medline">35294043</pub-id></nlm-citation></ref><ref id="ref41"><label>41</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Teng</surname><given-names>Q</given-names> </name><name name-style="western"><surname>Liu</surname><given-names>Z</given-names> </name><name name-style="western"><surname>Song</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Han</surname><given-names>K</given-names> </name><name name-style="western"><surname>Lu</surname><given-names>Y</given-names> </name></person-group><article-title>A survey on the interpretability of deep learning in medical diagnosis</article-title><source>Multimed Syst</source><year>2022</year><volume>28</volume><issue>6</issue><fpage>2335</fpage><lpage>2355</lpage><pub-id pub-id-type="doi">10.1007/s00530-022-00960-4</pub-id><pub-id pub-id-type="medline">35789785</pub-id></nlm-citation></ref><ref id="ref42"><label>42</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Nana-Sinkam</surname><given-names>SP</given-names> </name><name name-style="western"><surname>Powell</surname><given-names>CA</given-names> </name></person-group><article-title>Molecular biology of lung cancer: diagnosis and management of lung cancer, 3rd ed: American College of Chest Physicians evidence-based clinical practice guidelines</article-title><source>Chest</source><year>2013</year><month>05</month><volume>143</volume><issue>5 Suppl</issue><fpage>e30S</fpage><lpage>e39S</lpage><pub-id pub-id-type="doi">10.1378/chest.12-2346</pub-id><pub-id pub-id-type="medline">23649444</pub-id></nlm-citation></ref><ref id="ref43"><label>43</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Wang</surname><given-names>Z</given-names> </name><name name-style="western"><surname>Yang</surname><given-names>H</given-names> </name><name name-style="western"><surname>Luo</surname><given-names>S</given-names> </name><etal/></person-group><article-title>Anaplastic lymphoma kinase gene rearrangement predicts better prognosis in NSCLC patients: a meta-analysis</article-title><source>Lung Cancer</source><year>2017</year><month>10</month><volume>112</volume><fpage>1</fpage><lpage>9</lpage><pub-id pub-id-type="doi">10.1016/j.lungcan.2017.07.029</pub-id><pub-id pub-id-type="medline">29191580</pub-id></nlm-citation></ref><ref id="ref44"><label>44</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Wang</surname><given-names>H</given-names> </name><name name-style="western"><surname>Zhang</surname><given-names>W</given-names> </name><name name-style="western"><surname>Wang</surname><given-names>K</given-names> </name><name name-style="western"><surname>Li</surname><given-names>X</given-names> </name></person-group><article-title>Correlation between EML4-ALK, EGFR and clinicopathological features based on IASLC/ATS/ERS classification of lung adenocarcinoma</article-title><source>Medicine (Baltimore)</source><year>2018</year><volume>97</volume><issue>26</issue><fpage>e11116</fpage><pub-id pub-id-type="doi">10.1097/MD.0000000000011116</pub-id></nlm-citation></ref><ref id="ref45"><label>45</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Zhang</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Vaccarella</surname><given-names>S</given-names> </name><name name-style="western"><surname>Morgan</surname><given-names>E</given-names> </name><etal/></person-group><article-title>Global variations in lung cancer incidence by histological subtype in 2020: a population-based study</article-title><source>Lancet Oncol</source><year>2023</year><month>11</month><volume>24</volume><issue>11</issue><fpage>1206</fpage><lpage>1218</lpage><pub-id pub-id-type="doi">10.1016/S1470-2045(23)00444-8</pub-id><pub-id pub-id-type="medline">37837979</pub-id></nlm-citation></ref><ref id="ref46"><label>46</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Qian</surname><given-names>J</given-names> </name><name name-style="western"><surname>Nie</surname><given-names>W</given-names> </name><name name-style="western"><surname>Lu</surname><given-names>J</given-names> </name><etal/></person-group><article-title>Racial differences in characteristics and prognoses between Asian and White patients with nonsmall cell lung cancer receiving atezolizumab: an ancillary analysis of the POPLAR and OAK studies</article-title><source>Int J Cancer</source><year>2020</year><month>06</month><day>1</day><volume>146</volume><issue>11</issue><fpage>3124</fpage><lpage>3133</lpage><pub-id pub-id-type="doi">10.1002/ijc.32717</pub-id><pub-id pub-id-type="medline">31583695</pub-id></nlm-citation></ref><ref id="ref47"><label>47</label><nlm-citation citation-type="web"><article-title>Lee91jh/nsclc_5yr_kccr</article-title><source>GitHub</source><access-date>2026-05-25</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://github.com/lee91jh/NSCLC_5yr_KCCR">https://github.com/lee91jh/NSCLC_5yr_KCCR</ext-link></comment></nlm-citation></ref></ref-list><app-group><supplementary-material id="app1"><label>Multimedia Appendix 1</label><p>Consolidated supplementary tables for this study, including cohort description, preprocessing and variable definitions, model configuration, and full evaluation outputs. These materials support the main results and are provided for transparency and reproducibility.</p><media xlink:href="medinform_v14i1e80574_app1.docx" xlink:title="DOCX File, 332 KB"/></supplementary-material></app-group></back></article>