<?xml version="1.0" encoding="UTF-8"?><!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "journalpublishing.dtd"><article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" dtd-version="2.0" xml:lang="en" article-type="research-article"><front><journal-meta><journal-id journal-id-type="nlm-ta">JMIR Cancer</journal-id><journal-id journal-id-type="publisher-id">cancer</journal-id><journal-id journal-id-type="index">21</journal-id><journal-title>JMIR Cancer</journal-title><abbrev-journal-title>JMIR Cancer</abbrev-journal-title><issn pub-type="epub">2369-1999</issn><publisher><publisher-name>JMIR Publications</publisher-name><publisher-loc>Toronto, Canada</publisher-loc></publisher></journal-meta><article-meta><article-id pub-id-type="publisher-id">v12i1e86418</article-id><article-id pub-id-type="doi">10.2196/86418</article-id><article-categories><subj-group subj-group-type="heading"><subject>Original Paper</subject></subj-group></article-categories><title-group><article-title>Machine Learning&#x2013;Based Survival Prediction Models for Young Patients With Gastric Cancer: Model Development and Validation Study</article-title></title-group><contrib-group><contrib contrib-type="author"><name name-style="western"><surname>Kang</surname><given-names>Ha Ye Jin</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Jang</surname><given-names>Wooyeong</given-names></name><degrees>MS</degrees><xref ref-type="aff" rid="aff2">2</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Ko</surname><given-names>Minsam</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff3">3</xref></contrib><contrib contrib-type="author" corresp="yes"><name name-style="western"><surname>Ryu</surname><given-names>Kwang Sun</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff4">4</xref></contrib></contrib-group><aff id="aff1"><institution>Department of Computer Science, Semyung University</institution><addr-line>Jecheon-si</addr-line><addr-line>Chungcheongbuk-do</addr-line><country>Republic of Korea</country></aff><aff id="aff2"><institution>Department of Biomedical Engineering, School of Medicine, Chungbuk National University</institution><addr-line>Seowon-gu, Cheongju-si</addr-line><addr-line>Chungcheongbuk-do</addr-line><country>Republic of Korea</country></aff><aff id="aff3"><institution>Department of Human-Computer Interaction, Hanyang University</institution><addr-line>Sangnok-gu, Ansan-si</addr-line><addr-line>Gyeonggi-do</addr-line><country>Republic of Korea</country></aff><aff id="aff4"><institution>National Cancer Data Center, National Cancer Center</institution><addr-line>323 Ilsan-ro, Ilsandong-gu</addr-line><addr-line>Goyang-si</addr-line><addr-line>Gyeonggi-do</addr-line><country>Republic of Korea</country></aff><contrib-group><contrib contrib-type="editor"><name name-style="western"><surname>Balcarras</surname><given-names>Matthew</given-names></name></contrib></contrib-group><contrib-group><contrib contrib-type="reviewer"><name name-style="western"><surname>Chen</surname><given-names>Huiling</given-names></name></contrib><contrib contrib-type="reviewer"><name name-style="western"><surname>Lai</surname><given-names>Yi-Hsiang</given-names></name></contrib></contrib-group><author-notes><corresp>Correspondence to Kwang Sun Ryu, PhD, National Cancer Data Center, National Cancer Center, 323 Ilsan-ro, Ilsandong-gu, Goyang-si, Gyeonggi-do, 10408, Republic of Korea, 82 10-5769-7272, 82 10-031-920-0654; <email>niceplay13@ncc.re.kr</email></corresp></author-notes><pub-date pub-type="collection"><year>2026</year></pub-date><pub-date pub-type="epub"><day>26</day><month>5</month><year>2026</year></pub-date><volume>12</volume><elocation-id>e86418</elocation-id><history><date date-type="received"><day>23</day><month>10</month><year>2025</year></date><date date-type="rev-recd"><day>01</day><month>04</month><year>2026</year></date><date date-type="accepted"><day>02</day><month>04</month><year>2026</year></date></history><copyright-statement>&#x00A9; Ha Ye Jin Kang, Wooyeong Jang, Minsam Ko, Kwang Sun Ryu. Originally published in JMIR Cancer (<ext-link ext-link-type="uri" xlink:href="https://cancer.jmir.org">https://cancer.jmir.org</ext-link>), 26.5.2026. </copyright-statement><copyright-year>2026</copyright-year><license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (<ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">https://creativecommons.org/licenses/by/4.0/</ext-link>), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Cancer, is properly cited. The complete bibliographic information, a link to the original publication on <ext-link ext-link-type="uri" xlink:href="https://cancer.jmir.org/">https://cancer.jmir.org/</ext-link>, as well as this copyright and license information must be included.</p></license><self-uri xlink:type="simple" xlink:href="https://cancer.jmir.org/2026/1/e86418"/><abstract><sec><title>Background</title><p>Despite a global decline in the incidence of gastric cancer (GC), the number of cases diagnosed among younger individuals continues to increase. Several studies have been conducted to develop predictive models of mortality in patients with GC.</p></sec><sec><title>Objective</title><p>We developed 3- and 5-year survival prediction models for young patients with GC based on machine learning&#x2013;based survival modeling approaches.</p></sec><sec sec-type="methods"><title>Methods</title><p>Data from 813 young patients (&#x2264;50 years) diagnosed with GC between 2013 and 2015 were retrieved from the Gastric Cancer Public Staging Database. Among these 813 patients, data from 569 (70%) and 244 (30%) were allocated to the model training and testing datasets, respectively. Random survival forest, gradient boosting survival analysis, extra survival tree, and the Cox proportional hazards model were applied to predict survival outcomes at the 3- and 5-year time horizons. Model performance was assessed and quantified using the concordance index (C-index) metric. For the machine learning prediction models, the mean C-index values and corresponding 95% CIs were estimated across 100 repeated training iterations.</p></sec><sec sec-type="results"><title>Results</title><p>For the random survival forest model, the C-index for predicting 3-year mortality was 95.89% (95% CI 95.80%&#x2010;95.97%), whereas the C-index for predicting 5-year mortality was 91.82% (95% CI 91.68%&#x2010;91.96%). In the gradient boosting survival analysis model, the C-index for predicting 3-year mortality was 95.32% (95% CI 95.31%&#x2010;95.33%), and the C-index for predicting 5-year mortality was 89.98% (95% CI 89.95%&#x2010;90.01%). For the extra survival tree model, the C-index for predicting 3-year mortality was 95.53% (95% CI 95.46%&#x2010;95.60%), whereas the C-index for predicting 5-year mortality was 94.60% (95% CI 94.50%&#x2010;94.70%). In addition, the Cox proportional hazards model showed a C-index of 94.15% for predicting 3-year mortality and 82.26% for predicting 5-year mortality. Tumor stage and tumor size were the primary predictive variables used to train the models for mortality prediction at different time points. Other variables exhibited varying levels of predictive contribution across different time points.</p></sec><sec sec-type="conclusions"><title>Conclusions</title><p>These findings may facilitate the identification of high-risk young patients with GC who may benefit from more aggressive treatment strategies by enabling the prediction of mortality risk at different time points.</p></sec></abstract><kwd-group><kwd>survival prediction model</kwd><kwd>young patients with gastric cancer</kwd><kwd>machine learning</kwd><kwd>gastric cancer</kwd><kwd>mortality risk</kwd><kwd>predictive modeling</kwd></kwd-group></article-meta></front><body><sec id="s1" sec-type="intro"><title>Introduction</title><p>Despite a consistent global decline in the incidence of gastric cancer (GC) resulting from improved understanding of the key etiological factors influencing its development, more than 1 million new cases are still diagnosed annually worldwide, and the disease remains associated with a high mortality rate [<xref ref-type="bibr" rid="ref1">1</xref>]. Recent studies have shown that the prevalence of GC among younger individuals varies substantially across geographic regions and is increasing worldwide. This trend is particularly evident in Asian countries such as South Korea, Japan, and China [<xref ref-type="bibr" rid="ref2">2</xref>-<xref ref-type="bibr" rid="ref4">4</xref>] where GC occurs at a comparatively higher rate among younger populations [<xref ref-type="bibr" rid="ref2">2</xref>]. Although the precise mechanisms underlying GC development in younger individuals remain unclear, both disease progression and prognosis are influenced by a complex interplay of factors, including pathological characteristics, molecular alterations, genomic features, dietary patterns, and lifestyle-related exposures. Consequently, several studies have been conducted to evaluate prognostic outcomes in younger patients with GC [<xref ref-type="bibr" rid="ref5">5</xref>,<xref ref-type="bibr" rid="ref6">6</xref>]. Previous studies predicting survival outcomes in young patients with GC have primarily relied on traditional statistical nomogram models. These models represent the relationships between clinical covariates and patient outcomes in an interpretable format and have demonstrated relatively stable predictive performance [<xref ref-type="bibr" rid="ref7">7</xref>].</p><p>Recently, machine learning (ML)&#x2013;based approaches have been explored as complementary tools to traditional prediction models [<xref ref-type="bibr" rid="ref8">8</xref>,<xref ref-type="bibr" rid="ref9">9</xref>], demonstrating particular strengths in capturing complex nonlinear relationships among predictor variables and analyzing large-scale, high-dimensional clinical datasets [<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref11">11</xref>]. Several studies have demonstrated that ML-based survival models can provide meaningful prognostic insights for predicting time-to-event outcomes using structured clinical data collected in real-world health care settings [<xref ref-type="bibr" rid="ref12">12</xref>-<xref ref-type="bibr" rid="ref16">16</xref>]. However, in young patients with GC, baseline prognostic factors influencing survival change over time [<xref ref-type="bibr" rid="ref17">17</xref>]. In addition, existing mortality prediction models typically provide predictions for a single time point, which may limit their ability to capture time-varying changes in prognostic factors that may occur in younger patients with GC [<xref ref-type="bibr" rid="ref15">15</xref>]. Therefore, to account for the complex nature of GC prognosis, this study developed 3- and 5-year mortality prediction ML-based models for young patients with GC and constructed 3- and 5-year mortality prediction models to capture potential time-varying risk factors. This ML-based survival prediction study aimed to identify how key prognostic factors associated with mortality vary across different prediction horizons.</p></sec><sec id="s2" sec-type="methods"><title>Methods</title><sec id="s2-1"><title>Study Design</title><p>We developed a predictive model to estimate all-cause mortality among younger patients with GC using deidentified data obtained from the Cancer Public Staging Database (CPSD) provided by the National Cancer Data Center (NCDC; <xref ref-type="fig" rid="figure1">Figure 1</xref>). To achieve this objective, we first extracted data for younger patients (&#x2264;50 years) diagnosed with GC between 2013 and 2015 from the CPSD and subsequently performed data preprocessing on the dataset. The data were randomly divided into training and testing subsets comprising 70% and 30% of the data, respectively. Using the training dataset, we developed 3- and 5-year mortality prediction models using random survival forest (RSF), gradient boosting survival analysis (GBSA), extra survival tree (EST), and Cox proportional hazards (PH).</p><fig position="float" id="figure1"><label>Figure 1.</label><caption><p>Research framework. CPSD: Cancer Public Staging Database.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="cancer_v12i1e86418_fig01.png"/></fig></sec><sec id="s2-2"><title>Ethical Considerations</title><p>This study was approved by the institutional review board of the National Cancer Center of South Korea (NCC2023-0260). The requirement for informed consent was waived because HYJK, WJ, and KSR accessed only anonymized data for the purposes of analysis. The pseudonymized dataset was analyzed within a secure research environment provided by the NCDC, ensuring that only aggregated analytical results were exported.</p></sec><sec id="s2-3"><title>Data Source</title><p>This study used the CPSD, which is provided by the NCDC. This database was constructed by linking data from the NCDC&#x2019;s Cancer Public Library Database with collaborative staging data for cancer cases established in the Korea Central Cancer Registry (KCCR) [<xref ref-type="bibr" rid="ref18">18</xref>]. The collaborative staging system was developed using probability-based sampling methods and mandatory retrospective medical record surveys of cancer cases registered in the KCCR. These surveys provide information on cancer staging, treatment modalities, and patient prognoses [<xref ref-type="bibr" rid="ref19">19</xref>]. The Cancer Public Library Database was developed by integrating linked data from 4 major population-based public databases: the Korea National Cancer Incidence Database maintained by the KCCR, cause of death records from Statistics Korea, the National Health Information Database of the National Health Insurance Service, and the National Health Insurance Research Database maintained by the Health Insurance Review and Assessment Service [<xref ref-type="bibr" rid="ref20">20</xref>]. The use of the CPSD dataset complied with the data access and use policies established by the NCDC, and all data were handled in accordance with relevant guidelines and regulations to ensure confidentiality and data security. As the dataset contained no personally identifiable information, this study was exempt from institutional review board review.</p></sec><sec id="s2-4"><title>Definitions</title><p>Comorbid conditions, including myocardial infarction, stroke, heart failure, diabetes mellitus, hypertension, dyslipidemia, chronic obstructive pulmonary disease, peripheral vascular disease, liver disease, atrial fibrillation, and chronic kidney disease, were identified and defined according to the diagnostic codes from the <italic>International Classification of Diseases, 10th Revision</italic>. Additionally, primary study end points were defined to represent short- and medium-term mortality, specifically all-cause mortality occurring within 3 and 5 years after cancer diagnosis, respectively. Information on all-cause mortality was obtained from official cause of death records provided by South Korea&#x2019;s national statistical authority. Deaths occurring within each follow-up period were treated as cumulative mortality events; therefore, events occurring within 3 years were also included in the cumulative event count for the 5-year follow-up period.</p></sec><sec id="s2-5"><title>Experimental Dataset</title><p>The dataset was randomly divided into a training set (n=569) and a test set (n=244) using a fixed random seed (42) to ensure the reproducibility of the dataset partitioning. The primary outcome was all-cause mortality measured at 3 and 5 years after cancer diagnosis, and separate survival prediction models were developed for each prediction horizon. To minimize potential bias caused by outcome imbalance, the dataset was randomly partitioned using stratified sampling, ensuring comparable proportions of mortality events between the training and testing datasets. Model performance was evaluated on the corresponding test dataset using the Harrell C-index, a widely used discrimination metric in survival analysis. For the ML-based survival models (RSF, GBSA, and EST), the training and evaluation procedures were repeated across 100 iterations, with the random seed varied in each iteration while maintaining a fixed data split to quantify stochastic variability and assess the robustness of model performance. At each iteration, the models were refitted using the same training dataset and subsequently evaluated on the identical test dataset. The resulting training and testing datasets were fixed after partitioning and were consistently used in all subsequent model development and evaluation experiments.</p></sec><sec id="s2-6"><title>Models</title><p>The RSF is an ensemble-based ML method that models complex nonlinear relationships between predictor variables and estimates variable importance to reduce generalization error. The RSF model can also estimate the cumulative hazard function for individual observations even when the PH assumption is not satisfied [<xref ref-type="bibr" rid="ref21">21</xref>,<xref ref-type="bibr" rid="ref22">22</xref>]. A gradient boosting machine framework [<xref ref-type="bibr" rid="ref23">23</xref>] was adapted for survival analysis, enabling the model to effectively handle light-censored survival data. Gradient boosting machine is an ensemble learning technique in which successive decision trees are sequentially constructed, with each tree iteratively correcting the prediction errors of the preceding model. GBSA builds on this boosting framework for survival modeling, allowing the algorithm to handle censored observations and capture complex interactions between predictor variables and survival time [<xref ref-type="bibr" rid="ref24">24</xref>,<xref ref-type="bibr" rid="ref25">25</xref>]. The EST model, an extension of the randomized trees algorithm introduced by Geurts et al [<xref ref-type="bibr" rid="ref26">26</xref>] in 2006, introduces additional randomness by selecting split points randomly during tree construction. The EST algorithm can censor survival data and does not rely on the PH assumption [<xref ref-type="bibr" rid="ref27">27</xref>]. The Cox PH model is a widely used semiparametric survival analysis method that examines the relationship between survival time and multiple predictor variables. This model does not require explicit specification of the baseline hazard function [<xref ref-type="bibr" rid="ref28">28</xref>,<xref ref-type="bibr" rid="ref29">29</xref>].</p></sec><sec id="s2-7"><title>Computational Environment Settings</title><p>Survival analysis is a statistical methodology used to analyze time-to-event outcomes such as death or disease progression [<xref ref-type="bibr" rid="ref30">30</xref>], and ML approaches are increasingly being adopted in health care research to address the analytical complexities associated with survival modeling [<xref ref-type="bibr" rid="ref31">31</xref>]. Nonparametric tree-based ensemble methods are generally considered well suited for analyzing censored time-to-event outcomes and performing dynamic survival predictions [<xref ref-type="bibr" rid="ref32">32</xref>]. The predictor variables were further ranked and stratified according to their relative feature importance within the survival prediction models. In this study, we developed a survival prediction model based on GBSA, RSF, EST, and the Cox PH. During model development, feature importance scores were computed based on the mean decrease in impurity using the scikit-learn library (version 1.0.2; Google Summer of Code project) [<xref ref-type="bibr" rid="ref33">33</xref>]. The models were implemented using the scikit-survival library (version 0.17.2) [<xref ref-type="bibr" rid="ref34">34</xref>] within a Python (version 3.7.5; Python Software Foundation) computational environment, with TensorFlow (version 1.15.5; Google Brain Team) used as the underlying ML framework.</p><p>All survival models were trained using predefined and fixed hyperparameter configurations. For the RSF, GBSA, and EST models, the number of estimators was fixed at 200, whereas all remaining hyperparameters were retained at their default library settings. For the Cox PH model, elastic net regularization was applied with an L1 ratio of 1 &#x00D7; 10<sup>&#x2013;6</sup> and predefined alpha values to enhance numerical stability during model optimization. Continuous variables were not normalized for tree-based survival models because tree-based algorithms are inherently scale invariant and do not require feature normalization. Missing values were handled through data imputation using the median value for continuous variables and the most frequent category for categorical variables followed by one-hot encoding of categorical features. Importantly, all preprocessing procedures&#x2014;including imputation and feature encoding&#x2014;were fit exclusively on the training dataset and subsequently applied to the test dataset to prevent information leakage during model evaluation. For the Cox PH model, the predictor variables were standardized prior to model training to improve numerical stability and optimization convergence.</p></sec><sec id="s2-8"><title>Model Performance Evaluation</title><p>The C-index [<xref ref-type="bibr" rid="ref35">35</xref>] is the most widely used evaluation metric for assessing the performance of survival prediction models [<xref ref-type="bibr" rid="ref36">36</xref>]. This C-index is computed by comparing the predictive risk scores and observed survival times for pairs of randomly selected patients. To determine the number of concordant and discordant patient pairs, this pairwise comparison process was repeated across all possible patient pairs within the study cohort. The predictive model assigns a numerical risk score to each individual, representing the predicted risk of mortality, whereas the C-index evaluates the model&#x2019;s ability to correctly rank the relative risk between pairs of individuals [<xref ref-type="bibr" rid="ref37">37</xref>,<xref ref-type="bibr" rid="ref38">38</xref>]. Therefore, the C-index was used to evaluate the predictive performance and discrimination ability of the survival prediction models.</p></sec></sec><sec id="s3" sec-type="results"><title>Results</title><sec id="s3-1"><title>Study Population</title><p>The CPSD contains data for 23,717 individuals diagnosed with GC at the primary anatomical sites C160 to C166, C168, and C169 between 2012 and 2019. From this dataset, we excluded patients diagnosed with GC between 2016 and 2019 for 5-year mortality prediction analysis, as well as the 2012 cohort, for which prediagnostic screening information was unavailable. The dataset subsequently underwent data cleaning procedures, during which 3103 records containing missing or unknown values were removed, including tumor size (T-size; n=1140, 36.7%), height (n=1849, 59.6%), urine protein (n=44, 1.4%), gamma-glutamyl transpeptidase (n=4, 0.1%), low-density lipoprotein cholesterol (n=17, 0.5%), and estimated glomerular filtration rate (eGFR; n=49, 1.6%). Patients aged 50 years or younger at the time of diagnosis were classified as the &#x201C;younger&#x201D; patient group, as illustrated in <xref ref-type="fig" rid="figure2">Figure 2</xref>.</p><fig position="float" id="figure2"><label>Figure 2.</label><caption><p>Generation process of the experimental datasets. K-CURE: Korea Clinical Data Utilization Network for Research Excellence.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="cancer_v12i1e86418_fig02.png"/></fig></sec><sec id="s3-2"><title>Baseline Characteristics</title><p>The study population showed differences between younger and older patients. Among younger patients, there was a higher proportion of women, whereas older patients exhibited a higher burden of comorbidities, including cardiovascular and metabolic diseases. Differences were also observed in tumor-related characteristics, including cancer stage according to the seventh edition of the American Joint Committee on Cancer (AJCC) cancer staging manual, with younger patients tending to present with more advanced stages. In addition, older patients showed higher all-cause mortality at both 3 and 5 years. Detailed baseline characteristics are provided in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>.</p></sec><sec id="s3-3"><title>Model Performance</title><p>The RSF, GBSA, EST, and Cox PH models were trained and evaluated to compare their predictive performance for survival outcomes at 2 time horizons (3 and 5 years). <xref ref-type="table" rid="table1">Table 1</xref> presents the mean C-index values with corresponding 95% CIs, reflecting the predictive accuracy of the models in estimating mortality risk among young patients with GC at different prediction time points. For the ML prediction models, we reported the mean C-index and the corresponding empirical 95% CIs across 100 repeated training iterations, whereas the Cox PH model was evaluated using a single model run; therefore, CIs for the C-index were not estimated or reported. The C-index values obtained from each of the 100 training iterations for the prediction models are provided in <xref ref-type="supplementary-material" rid="app2">Multimedia Appendix 2</xref>. For 3-year survival prediction, the RSF, GBSA, EST, and Cox PH models achieved C-index values of 95.89% (95% CI 95.80%&#x2010;95.97%), 95.32% (95% CI 95.31%&#x2010;95.33%), 95.53% (95% CI 95.46%&#x2010;95.60%), and 94.15%, respectively. For 5-year survival prediction, the corresponding C-index values were 91.82% (95% CI 91.68%&#x2010;91.96%), 89.98% (95% CI 89.95%&#x2010;90.01%), 94.60% (95% CI 94.50%&#x2010;94.70%), and 82.26%, as summarized in <xref ref-type="table" rid="table1">Table 1</xref>.</p><table-wrap id="t1" position="float"><label>Table 1.</label><caption><p>Concordance index (C-index) with 95% CIs for survival prediction models and the Cox proportional hazards (PH) model.</p></caption><table id="table1" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Model</td><td align="left" valign="bottom">3 year, C-index (%; 95% CI)</td><td align="left" valign="bottom">5 year, C-index (%; 95% CI)</td></tr></thead><tbody><tr><td align="left" valign="top">RSF<sup><xref ref-type="table-fn" rid="table1fn1">a</xref></sup></td><td align="left" valign="top">95.89 (95.80-95.97)</td><td align="left" valign="top">91.82 (91.68-91.96)</td></tr><tr><td align="left" valign="top">GBSA<sup><xref ref-type="table-fn" rid="table1fn2">b</xref></sup></td><td align="left" valign="top">95.32 (95.31-95.33)</td><td align="left" valign="top">89.98 (89.95-90.01)</td></tr><tr><td align="left" valign="top">EST<sup><xref ref-type="table-fn" rid="table1fn3">c</xref></sup></td><td align="left" valign="top">95.53 (95.46-95.60)</td><td align="left" valign="top">94.60 (94.50-94.70)</td></tr><tr><td align="left" valign="top">Cox PH</td><td align="left" valign="top">94.15<sup><xref ref-type="table-fn" rid="table1fn4">d</xref></sup></td><td align="left" valign="top">82.26</td></tr></tbody></table><table-wrap-foot><fn id="table1fn1"><p><sup>a</sup>RSF: random survival forest.</p></fn><fn id="table1fn2"><p><sup>b</sup>GBSA: gradient boosting survival analysis.</p></fn><fn id="table1fn3"><p><sup>c</sup>EST: extra survival tree.</p></fn><fn id="table1fn4"><p><sup>d</sup>The C-index values reported for the machine learning models represent the mean values and corresponding 95% CIs obtained from 100 repeated model training iterations. The Cox PH model was evaluated using a single model run; therefore, CIs for the C-index were not estimated or reported.</p></fn></table-wrap-foot></table-wrap><p>For 3-year survival prediction, the RSF model identified several important predictors, including the AJCC stage, T-size, age, serum glutamic oxaloacetic transaminase (aspartate aminotransferase), eGFR, systolic blood pressure, serum glutamic pyruvic transaminase (aspartate aminotransferase), hemoglobin level, and tumor topography codes (C162 and C160). For 5-year survival prediction, the RSF model identified AJCC stage, T-size, deep vein thrombosis, age, tumor topography code (C163), gamma-glutamyl transpeptidase, tumor grade, diastolic blood pressure, hemoglobin level, and liver disease as key prognostic predictors. For 3-year survival prediction, the GBSA model identified several important predictors, including AJCC stage, hemoglobin level, tumor topography code (C169), T-size, fasting blood glucose, total cholesterol, weekly alcohol consumption, walking activity level, systolic blood pressure, and serum glutamic oxaloacetic transaminase. For 5-year survival prediction, the GBSA model identified the following important predictors: AJCC stage, T-size, tumor topography code (C169), weekly alcohol consumption, fasting blood glucose, hemoglobin level, diastolic blood pressure, serum glutamic pyruvic transaminase, tumor grade, and total cholesterol. For 3-year survival prediction, the EST model identified several important predictors, including AJCC stage, T-size, diabetes mellitus, tumor topography codes (C169 and C162), proteinuria, waist circumference, body weight, daily alcohol consumption, and serum glutamic oxaloacetic transaminase levels. For 5-year survival prediction, the most influential predictors identified by the EST model included AJCC stage, T-size, tumor topography code (C163), deep vein thrombosis, liver disease, diabetes mellitus, tumor grade, BMI, waist circumference, and height. For 3-year mortality prediction, the Cox PH model identified AJCC stage and T-size as the most influential predictors, followed by serum glutamic oxaloacetic transaminase, eGFR, triglycerides, age, high-density lipoprotein cholesterol, hemoglobin level, total cholesterol, and gamma-glutamyl transpeptidase. For 5-year mortality prediction, AJCC stage and T-size remained the dominant predictors, together with serum glutamic oxaloacetic transaminase, eGFR, age, high-density lipoprotein cholesterol, total cholesterol, hemoglobin level, triglycerides, and weekly alcohol consumption.</p><p>Feature importance analysis showed that AJCC stage and T-size were consistently the most influential predictors across all models and prediction time points, whereas other variables demonstrated model- and time-dependent variability. Detailed feature importance results are provided in <xref ref-type="supplementary-material" rid="app3">Multimedia Appendix 3</xref>, the corresponding hazard ratio analyses are presented in <xref ref-type="supplementary-material" rid="app4">Multimedia Appendix 4</xref>, and <xref ref-type="supplementary-material" rid="app5">Multimedia Appendix 5</xref> provides the mapping between heat map feature labels and the corresponding clinical variables reported in the manuscript tables.</p></sec></sec><sec id="s4" sec-type="discussion"><title>Discussion</title><sec id="s4-1"><title>Principal Findings</title><p>In this study, we developed ML-based survival prediction models for young patients with GC to estimate 3- and 5-year mortality. Among the evaluated models, RSF and EST demonstrated superior predictive performance compared to the Cox PH model. Across all models and prediction horizons, AJCC stage and T-size consistently emerged as the most important predictors of mortality risk.</p><p>GC has traditionally been considered a disease predominantly affecting older adults; however, recent epidemiological studies have reported an increasing incidence among younger individuals [<xref ref-type="bibr" rid="ref39">39</xref>-<xref ref-type="bibr" rid="ref41">41</xref>]. These findings highlight the need for tailored prognostic models for younger patient populations. Our analysis results indicated that the older patient group exhibited a poorer prognosis than the younger patient group. Furthermore, the stage-specific survival curves demonstrated adverse poorer prognoses in the older patient cohort. However, for stage 3 and 4 disease, no statistically meaningful differences in survival prognosis were observed between the younger and older groups, as shown in <xref ref-type="supplementary-material" rid="app6">Multimedia Appendix 6</xref>. Owing to age-related physiological and biological differences, treatment responses and survival outcomes may vary, which should be considered when developing survival prediction models [<xref ref-type="bibr" rid="ref42">42</xref>,<xref ref-type="bibr" rid="ref43">43</xref>]. Previous studies have reported promising results, demonstrating the potential of predictive modeling to generate meaningful insights into survival outcomes [<xref ref-type="bibr" rid="ref5">5</xref>,<xref ref-type="bibr" rid="ref6">6</xref>,<xref ref-type="bibr" rid="ref44">44</xref>-<xref ref-type="bibr" rid="ref48">48</xref>]. However, uncertainty remains regarding the consistency of model performance across different predictive time horizons in young patients with GC. The superior performance of ML-based models compared with the Cox PH model may be attributed to their ability to capture complex nonlinear relationships and interactions among clinical variables, which are not adequately addressed by traditional statistical approaches. These findings suggest that ML-based models may provide more accurate risk stratification, potentially supporting personalized treatment strategies and clinical decision-making for young patients with GC. In particular, the use of longitudinal clinical and comorbidity data in this study may have contributed to improved model performance, which is in line with previous studies exploring the use of ML approaches for survival prediction. Furthermore, although many predictive models have been developed using the Surveillance, Epidemiology, and End Results database, which contains comprehensive cancer registry information, there remains limited availability of longitudinal data for tracking comorbidities and patient health characteristics, such as disease diagnosis codes (<italic>International Classification of Diseases, 10th Revision</italic>), medication records, and routine health examination data. Such information is not consistently available in the Healthcare Examiners and Evaluators database or the National Health Service database, which may influence the predictive performance and reliability of ML models. To address these limitations, we classified patients with GC as younger (&#x2264;50 years) based on criteria used in recent studies [<xref ref-type="bibr" rid="ref49">49</xref>] and evaluated their 3- and 5-year survival predictions using multiple survival prediction models. Using feature importance analysis, we identified clinically relevant predictors, among which 2 variables consistently influenced survival prognosis across all models and time horizons: AJCC stage and T-size. These variables demonstrated significant associations with all-cause mortality at both the 3- and 5-year follow-up intervals, as shown in <xref ref-type="supplementary-material" rid="app7">Multimedia Appendix 7</xref>. The tumor, node, metastasis (TNM) staging system represents a comprehensive framework for evaluating the anatomical extent of cancer progression and continues to serve as the fundamental basis for prognostic stratification in oncology. Although T-size contributes to the T component of the TNM classification, the continuous measurement of T-size may provide additional prognostic granularity beyond categorical stage classifications. The TNM staging system aggregates information from the tumor, nodal involvement, and metastasis categories into discrete stage groups. However, a continuous T-size variable may capture heterogeneity within the same stage group, which may not be fully represented by categorical staging alone. This may prove why both tumor stage and T-size were retained as significant predictors in the ML survival prediction models. These findings suggest that, within established staging frameworks, incorporating quantitative tumor characteristics such as continuous T-size measurements can provide additional prognostic information, particularly for long-term survival prediction. However, as illustrated by the heat map of key predictors for the 3- and 5-year models, the relative importance of variables used to predict mortality varied across prediction time points in <xref ref-type="supplementary-material" rid="app3">Multimedia Appendix 3</xref>. The proposed survival prediction models enabled the identification of high-risk subgroups among young patients with GC by accounting for temporal variations in prognostic risk factors. These findings may support the development of more targeted and potentially aggressive treatment strategies for young patients with GC. To evaluate the performance of the proposed model, a comparative analysis was conducted between the traditional TNM staging system and the ML survival model for 1-, 3-, and 5-year mortality prediction, with the Harrell C-index used to quantify model discrimination performance. The findings demonstrated that ML-based approaches exhibited superior performance for 3- and 5-year mortality, whereas at the 1-year prediction horizon, the TNM staging classification showed slightly higher discriminatory power than the ML survival model, as shown in <xref ref-type="supplementary-material" rid="app8">Multimedia Appendix 8</xref>. Consequently, the ML-based 1-year mortality prediction model was excluded from subsequent analyses. These findings suggest that short-term mortality outcomes are predominantly influenced by the initial stage of disease, a factor that is effectively captured by the conventional TNM staging classification system. Conversely, the additional predictive benefit of ML-based survival models became more pronounced in long-term predictions (3 and 5 years), where multiple complex clinical and biological factors may contribute to heterogeneity in patient outcomes. The validation of predictive model performance was strongly influenced by the data-splitting strategy used for model training and evaluation. This study compared the results obtained using a random data-splitting strategy (training: 70%; testing: 30%) applied to the entire dataset from 2013 to 2015 with those obtained using a year-based split (training: 2013&#x2010;2014; testing: 2015), as shown in <xref ref-type="supplementary-material" rid="app9">Multimedia Appendix 9</xref>. The analysis demonstrated that the random data-splitting strategy produced a higher predictive performance compared with the year-based splitting approach. This result was interpreted as reflecting the inability of the year-based split to adequately represent the characteristics of the patient cohort collected in a specific year (2015) within the training dataset, which led to larger differences in key variables&#x2014;particularly AJCC stage&#x2014;between the training and testing datasets. In summary, although the dataset in this study was longitudinal and incorporated patient-specific follow-up durations, the year-based segmentation approach functioned more as a method for separating patient cohorts collected at different time points than as a validation framework representing a true temporal prediction scenario. This heterogeneity in key predictor variables&#x2014;particularly AJCC stage&#x2014;between the training and test datasets was considered to limit the generalization of latent patterns learned by the models during training, thereby reducing the overall predictive performance.</p><p>This study has several limitations. It was conducted using data derived from a single ethnic population, which may have introduced potential population-specific bias into the developed prediction models. In addition, external validation using independent datasets was not performed, which may limit the robustness, generalizability, and clinical applicability of these predictive models. Although this study developed and validated ML models for predicting 3- and 5-year mortality in young patients with GC, several important methodological considerations, including model interpretability and robustness to complex or incomplete data, were not fully addressed.</p><p>In summary, this study developed and validated ML models for predicting 3- and 5-year mortality in young patients with GC, demonstrating their potential utility for risk stratification and clinical decision-making. Validation using larger and more diverse patient populations is necessary to ensure robustness, external validity, and generalizability. The integration of explainable artificial intelligence methodologies may enhance the interpretability and transparency of ML models, thereby making predictive outputs more clinically actionable for health care practitioners [<xref ref-type="bibr" rid="ref50">50</xref>]. Recent ML research has addressed several methodological challenges, including modeling temporal dependencies, discriminative feature selection, and improving robustness to noisy or incomplete input data. Prior studies in nonclinical ML domains have proposed advanced methodologies, including attention-based temporal models, structure-aware feature selection frameworks, and confidence-driven learning strategies [<xref ref-type="bibr" rid="ref51">51</xref>-<xref ref-type="bibr" rid="ref53">53</xref>]. Although these approaches do not directly fall within the scope of this study, they provide conceptually important insights for survival prediction problems, particularly those requiring careful handling of longitudinal data patterns, high-dimensional clinical variables, and uncertainty in medical datasets. These methodological directions may be adapted and extended to medical prognostic prediction models, particularly in survival analysis and clinical outcome prediction research. In addition to these methodological considerations, evaluation of the clinical utility of the key prognostic variables identified in this study, including cancer stage and T-size, is required through prospective or independent validation studies, whereas the use of internationally standardized and multiethnic datasets may further improve the reliability, external validity, and global generalizability of the predictive models.</p></sec><sec id="s4-2"><title>Conclusions</title><p>The number of young patients diagnosed with GC continues to increase worldwide, and nomogram-based prognostic models have been proposed to identify patients at high risk of adverse outcomes. However, relatively few studies have focused on predicting survival outcomes in young patients with GC using ML approaches. Therefore, we developed ML-based prediction models for estimating 3- and 5-year mortality in young patients with GC. These models may assist clinicians in identifying young patients with GC who may require more aggressive or personalized treatment strategies. However, because this analysis was conducted using data derived from the Korean patient population, future studies should externally validate these prediction models in diverse international populations.</p></sec></sec></body><back><ack><p>The authors attest that there was no use of generative artificial intelligence technology in the generation of text, figures, or other informational content of this manuscript.</p></ack><notes><sec><title>Funding</title><p>This study was supported by a grant (2310440-4) from the National Cancer Center of South Korea.</p></sec><sec><title>Data Availability</title><p>The datasets generated or analyzed during this study are not publicly available due to privacy protection requirements and national data governance restrictions for cancer registry&#x2013;linked health data. However, researchers may request access to the original dataset through the Korea Clinical Data Utilization Network for Research Excellence portal [<xref ref-type="bibr" rid="ref54">54</xref>], subject to registration and approval through the required data application and review process. Applicants must submit a data access application form, including a detailed research proposal describing the intended use of the dataset, which is reviewed and approved by both the Korea Clinical Data Utilization Network for Research Excellence and the National Cancer Data Center. This data access service is currently restricted to researchers based in South Korea. All source code associated with this study is publicly available through the GitHub repository [<xref ref-type="bibr" rid="ref55">55</xref>].</p></sec></notes><fn-group><fn fn-type="con"><p>Conceptualization: HYJK, MK, KSR</p><p>Data curation: HYJK, WJ, KSR</p><p>Investigation: HYJK</p><p>Methodology: HYJK, MK, KSR</p><p>Validation: HYJK, WJ, MK, KSR</p><p>Writing&#x2014;original draft: HYJK, KSR</p><p>All authors contributed to drafting and revising the manuscript.</p></fn><fn fn-type="conflict"><p>None declared.</p></fn></fn-group><glossary><title>Abbreviations</title><def-list><def-item><term id="abb1">AJCC</term><def><p>American Joint Committee on Cancer</p></def></def-item><def-item><term id="abb2">CPSD</term><def><p>Cancer Public Staging Database</p></def></def-item><def-item><term id="abb3">eGFR</term><def><p>estimated glomerular filtration rate</p></def></def-item><def-item><term id="abb4">EST</term><def><p>extra survival tree</p></def></def-item><def-item><term id="abb5">GBSA</term><def><p>gradient boosting survival analysis</p></def></def-item><def-item><term id="abb6">GC</term><def><p>gastric cancer</p></def></def-item><def-item><term id="abb7">KCCR</term><def><p>Korea Central Cancer Registry</p></def></def-item><def-item><term id="abb8">ML</term><def><p>machine learning</p></def></def-item><def-item><term id="abb9">NCDC</term><def><p>National Cancer Data Center</p></def></def-item><def-item><term id="abb10">PH</term><def><p>proportional hazards</p></def></def-item><def-item><term id="abb11">RSF</term><def><p>random survival forest</p></def></def-item><def-item><term id="abb12">TNM</term><def><p>tumor, node, metastasis</p></def></def-item></def-list></glossary><ref-list><title>References</title><ref id="ref1"><label>1</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Wong</surname><given-names>MCS</given-names> </name><name name-style="western"><surname>Huang</surname><given-names>J</given-names> </name><name name-style="western"><surname>Chan</surname><given-names>PSF</given-names> </name><etal/></person-group><article-title>Global incidence and mortality of gastric cancer, 1980-2018</article-title><source>JAMA Netw Open</source><year>2021</year><month>07</month><day>1</day><volume>4</volume><issue>7</issue><fpage>e2118457</fpage><pub-id pub-id-type="doi">10.1001/jamanetworkopen.2021.18457</pub-id><pub-id pub-id-type="medline">34309666</pub-id></nlm-citation></ref><ref id="ref2"><label>2</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Wu</surname><given-names>SL</given-names> </name><name name-style="western"><surname>Zhang</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Fu</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Li</surname><given-names>J</given-names> </name><name name-style="western"><surname>Wang</surname><given-names>JS</given-names> </name></person-group><article-title>Gastric cancer incidence, mortality and burden in adolescents and young adults: a time-trend analysis and comparison among China, South Korea, Japan and the USA</article-title><source>BMJ Open</source><year>2022</year><month>07</month><day>21</day><volume>12</volume><issue>7</issue><fpage>e061038</fpage><pub-id pub-id-type="doi">10.1136/bmjopen-2022-061038</pub-id><pub-id pub-id-type="medline">35863834</pub-id></nlm-citation></ref><ref id="ref3"><label>3</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Gao</surname><given-names>K</given-names> </name><name name-style="western"><surname>Wu</surname><given-names>J</given-names> </name></person-group><article-title>National trend of gastric cancer mortality in China (2003&#x2013;2015): a population&#x2010;based study</article-title><source>Cancer Commun</source><year>2019</year><month>12</month><volume>39</volume><issue>1</issue><fpage>1</fpage><lpage>5</lpage><pub-id pub-id-type="doi">10.1186/s40880-019-0372-x</pub-id></nlm-citation></ref><ref id="ref4"><label>4</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Yang</surname><given-names>Q</given-names> </name><name name-style="western"><surname>Xu</surname><given-names>D</given-names> </name><name name-style="western"><surname>Yang</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Lu</surname><given-names>S</given-names> </name><name name-style="western"><surname>Wang</surname><given-names>D</given-names> </name><name name-style="western"><surname>Wang</surname><given-names>L</given-names> </name></person-group><article-title>Global, regional, and national burden of gastric cancer in adolescents and young adults, 1990-2019: a systematic analysis for the Global Burden of Disease Study 2019</article-title><source>Am J Gastroenterol</source><year>2024</year><month>03</month><day>1</day><volume>119</volume><issue>3</issue><fpage>454</fpage><lpage>467</lpage><pub-id pub-id-type="doi">10.14309/ajg.0000000000002551</pub-id><pub-id pub-id-type="medline">37800697</pub-id></nlm-citation></ref><ref id="ref5"><label>5</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Wu</surname><given-names>C</given-names> </name><name name-style="western"><surname>Wang</surname><given-names>N</given-names> </name><name name-style="western"><surname>Zhou</surname><given-names>H</given-names> </name><name name-style="western"><surname>Wang</surname><given-names>T</given-names> </name><name name-style="western"><surname>Zhao</surname><given-names>D</given-names> </name></person-group><article-title>Development and validation of a nomogram to individually predict survival of young patients with nonmetastatic gastric cancer: a retrospective cohort study</article-title><source>Saudi J Gastroenterol</source><year>2019</year><volume>25</volume><issue>4</issue><fpage>236</fpage><lpage>244</lpage><pub-id pub-id-type="doi">10.4103/sjg.SJG_378_18</pub-id><pub-id pub-id-type="medline">30719999</pub-id></nlm-citation></ref><ref id="ref6"><label>6</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Chen</surname><given-names>YR</given-names> </name><name name-style="western"><surname>Tian</surname><given-names>ZY</given-names> </name><name name-style="western"><surname>Wang</surname><given-names>MQ</given-names> </name><name name-style="western"><surname>Sun</surname><given-names>ML</given-names> </name><name name-style="western"><surname>Wu</surname><given-names>JZ</given-names> </name><name name-style="western"><surname>Wang</surname><given-names>XY</given-names> </name></person-group><article-title>Development and validation of prognostic nomograms based on lymph node ratio for young patients with gastric cancer: a SEER-based study</article-title><source>Technol Cancer Res Treat</source><year>2023</year><volume>22</volume><fpage>15330338231157923</fpage><pub-id pub-id-type="doi">10.1177/15330338231157923</pub-id><pub-id pub-id-type="medline">37248609</pub-id></nlm-citation></ref><ref id="ref7"><label>7</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lee</surname><given-names>W</given-names> </name><name name-style="western"><surname>Lam</surname><given-names>SK</given-names> </name><name name-style="western"><surname>Zhang</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Yang</surname><given-names>R</given-names> </name><name name-style="western"><surname>Cai</surname><given-names>J</given-names> </name></person-group><article-title>Review of methodological workflow, interpretation and limitations of nomogram application in cancer study</article-title><source>Radiat Med Prot</source><year>2022</year><month>12</month><volume>3</volume><issue>4</issue><fpage>200</fpage><lpage>207</lpage><pub-id pub-id-type="doi">10.1016/j.radmp.2022.08.004</pub-id></nlm-citation></ref><ref id="ref8"><label>8</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Tran</surname><given-names>TT</given-names> </name><name name-style="western"><surname>Lee</surname><given-names>J</given-names> </name><name name-style="western"><surname>Gunathilake</surname><given-names>M</given-names> </name><etal/></person-group><article-title>A comparison of machine learning models and Cox proportional hazards models regarding their ability to predict the risk of gastrointestinal cancer based on metabolic syndrome and its components</article-title><source>Front Oncol</source><year>2023</year><volume>13</volume><fpage>1049787</fpage><pub-id pub-id-type="doi">10.3389/fonc.2023.1049787</pub-id><pub-id pub-id-type="medline">36937438</pub-id></nlm-citation></ref><ref id="ref9"><label>9</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kurt Omurlu</surname><given-names>I</given-names> </name><name name-style="western"><surname>Ture</surname><given-names>M</given-names> </name><name name-style="western"><surname>Tokatli</surname><given-names>F</given-names> </name></person-group><article-title>The comparisons of random survival forests and Cox regression analysis with simulation and an application related to breast cancer</article-title><source>Expert Syst Appl</source><year>2009</year><month>05</month><volume>36</volume><issue>4</issue><fpage>8582</fpage><lpage>8588</lpage><pub-id pub-id-type="doi">10.1016/j.eswa.2008.10.023</pub-id></nlm-citation></ref><ref id="ref10"><label>10</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>D&#x00ED;ez-Sanmart&#x00ED;n</surname><given-names>C</given-names> </name><name name-style="western"><surname>Sarasa Cabezuelo</surname><given-names>A</given-names> </name></person-group><article-title>Application of artificial intelligence techniques to predict survival in kidney transplantation: a review</article-title><source>J Clin Med</source><year>2020</year><month>02</month><day>19</day><volume>9</volume><issue>2</issue><fpage>572</fpage><pub-id pub-id-type="doi">10.3390/jcm9020572</pub-id><pub-id pub-id-type="medline">32093027</pub-id></nlm-citation></ref><ref id="ref11"><label>11</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Wang</surname><given-names>J</given-names> </name><name name-style="western"><surname>Chen</surname><given-names>N</given-names> </name><name name-style="western"><surname>Guo</surname><given-names>J</given-names> </name><name name-style="western"><surname>Xu</surname><given-names>X</given-names> </name><name name-style="western"><surname>Liu</surname><given-names>L</given-names> </name><name name-style="western"><surname>Yi</surname><given-names>Z</given-names> </name></person-group><article-title>SurvNet: a novel deep neural network for lung cancer survival analysis with missing values</article-title><source>Front Oncol</source><year>2021</year><volume>10</volume><fpage>588990</fpage><pub-id pub-id-type="doi">10.3389/fonc.2020.588990</pub-id></nlm-citation></ref><ref id="ref12"><label>12</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Mainali</surname><given-names>G</given-names> </name></person-group><article-title>Artificial intelligence in medical science: perspective from a medical student</article-title><source>JNMA J Nepal Med Assoc</source><year>2020</year><month>09</month><day>27</day><volume>58</volume><issue>229</issue><fpage>709</fpage><lpage>711</lpage><pub-id pub-id-type="doi">10.31729/jnma.5257</pub-id><pub-id pub-id-type="medline">33068098</pub-id></nlm-citation></ref><ref id="ref13"><label>13</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Seifert</surname><given-names>R</given-names> </name><name name-style="western"><surname>Weber</surname><given-names>M</given-names> </name><name name-style="western"><surname>Kocakavuk</surname><given-names>E</given-names> </name><name name-style="western"><surname>Rischpler</surname><given-names>C</given-names> </name><name name-style="western"><surname>Kersting</surname><given-names>D</given-names> </name></person-group><article-title>Artificial intelligence and machine learning in nuclear medicine: future perspectives</article-title><source>Semin Nucl Med</source><year>2021</year><month>03</month><volume>51</volume><issue>2</issue><fpage>170</fpage><lpage>177</lpage><pub-id pub-id-type="doi">10.1053/j.semnuclmed.2020.08.003</pub-id><pub-id pub-id-type="medline">33509373</pub-id></nlm-citation></ref><ref id="ref14"><label>14</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lu</surname><given-names>T</given-names> </name><name name-style="western"><surname>Fang</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Liu</surname><given-names>H</given-names> </name><etal/></person-group><article-title>Comparison of machine learning and logic regression algorithms for predicting lymph node metastasis in patients with gastric cancer: a two-center study</article-title><source>Technol Cancer Res Treat</source><year>2024</year><volume>23</volume><fpage>15330338231222331</fpage><pub-id pub-id-type="doi">10.1177/15330338231222331</pub-id><pub-id pub-id-type="medline">38190617</pub-id></nlm-citation></ref><ref id="ref15"><label>15</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Alabi</surname><given-names>RO</given-names> </name><name name-style="western"><surname>M&#x00E4;kitie</surname><given-names>AA</given-names> </name><name name-style="western"><surname>Pirinen</surname><given-names>M</given-names> </name><name name-style="western"><surname>Elmusrati</surname><given-names>M</given-names> </name><name name-style="western"><surname>Leivo</surname><given-names>I</given-names> </name><name name-style="western"><surname>Almangush</surname><given-names>A</given-names> </name></person-group><article-title>Comparison of nomogram with machine learning techniques for prediction of overall survival in patients with tongue cancer</article-title><source>Int J Med Inform</source><year>2021</year><month>01</month><volume>145</volume><fpage>104313</fpage><pub-id pub-id-type="doi">10.1016/j.ijmedinf.2020.104313</pub-id><pub-id pub-id-type="medline">33142259</pub-id></nlm-citation></ref><ref id="ref16"><label>16</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Huang</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Li</surname><given-names>J</given-names> </name><name name-style="western"><surname>Li</surname><given-names>M</given-names> </name><name name-style="western"><surname>Aparasu</surname><given-names>RR</given-names> </name></person-group><article-title>Application of machine learning in predicting survival outcomes involving real-world data: a scoping review</article-title><source>BMC Med Res Methodol</source><year>2023</year><month>11</month><day>13</day><volume>23</volume><issue>1</issue><fpage>268</fpage><pub-id pub-id-type="doi">10.1186/s12874-023-02078-1</pub-id><pub-id pub-id-type="medline">37957593</pub-id></nlm-citation></ref><ref id="ref17"><label>17</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Chen</surname><given-names>QY</given-names> </name><name name-style="western"><surname>Zhong</surname><given-names>Q</given-names> </name><name name-style="western"><surname>Wang</surname><given-names>W</given-names> </name><etal/></person-group><article-title>Prognosis of young survivors of gastric cancer in China and the U.S.: determining long-term outcomes based on conditional survival</article-title><source>Oncologist</source><year>2019</year><month>06</month><volume>24</volume><issue>6</issue><fpage>e260</fpage><lpage>e274</lpage><pub-id pub-id-type="doi">10.1634/theoncologist.2018-0220</pub-id><pub-id pub-id-type="medline">30470692</pub-id></nlm-citation></ref><ref id="ref18"><label>18</label><nlm-citation citation-type="web"><source>National Cancer Data Center</source><access-date>2024-05-21</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.cancerdata.re.kr/en/index">https://www.cancerdata.re.kr/en/index</ext-link></comment></nlm-citation></ref><ref id="ref19"><label>19</label><nlm-citation citation-type="web"><person-group person-group-type="author"><collab>Korea Central Cancer Registry</collab></person-group><article-title>KCCR survey</article-title><source>Korea Central Cancer Registry</source><access-date>2024-05-21</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://kccrsurvey.cancer.go.kr/index.do">https://kccrsurvey.cancer.go.kr/index.do</ext-link></comment></nlm-citation></ref><ref id="ref20"><label>20</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Choi</surname><given-names>DW</given-names> </name><name name-style="western"><surname>Guk</surname><given-names>MY</given-names> </name><name name-style="western"><surname>Kim</surname><given-names>HR</given-names> </name><etal/></person-group><article-title>Data resource profile: the Cancer Public Library Database in South Korea</article-title><source>Cancer Res Treat</source><year>2024</year><month>10</month><volume>56</volume><issue>4</issue><fpage>1014</fpage><lpage>1026</lpage><pub-id pub-id-type="doi">10.4143/crt.2024.207</pub-id><pub-id pub-id-type="medline">38697846</pub-id></nlm-citation></ref><ref id="ref21"><label>21</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Ishwaran</surname><given-names>H</given-names> </name><name name-style="western"><surname>Kogalur</surname><given-names>UB</given-names> </name><name name-style="western"><surname>Blackstone</surname><given-names>EH</given-names> </name><name name-style="western"><surname>Lauer</surname><given-names>MS</given-names> </name></person-group><article-title>Random survival forests</article-title><source>Ann Appl Stat</source><year>2008</year><volume>2</volume><issue>3</issue><fpage>841</fpage><lpage>860</lpage><pub-id pub-id-type="doi">10.1214/08-AOAS169</pub-id></nlm-citation></ref><ref id="ref22"><label>22</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Mogensen</surname><given-names>UB</given-names> </name><name name-style="western"><surname>Ishwaran</surname><given-names>H</given-names> </name><name name-style="western"><surname>Gerds</surname><given-names>TA</given-names> </name></person-group><article-title>Evaluating random forests for survival analysis using prediction error curves</article-title><source>J Stat Softw</source><year>2012</year><month>09</month><volume>50</volume><issue>11</issue><fpage>1</fpage><lpage>23</lpage><pub-id pub-id-type="doi">10.18637/jss.v050.i11</pub-id><pub-id pub-id-type="medline">25317082</pub-id></nlm-citation></ref><ref id="ref23"><label>23</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Friedman</surname><given-names>JH</given-names> </name></person-group><article-title>Greedy function approximation: a gradient boosting machine</article-title><source>Ann Statist</source><year>2001</year><volume>29</volume><issue>5</issue><fpage>1189</fpage><lpage>1232</lpage><pub-id pub-id-type="doi">10.1214/aos/1013203451</pub-id></nlm-citation></ref><ref id="ref24"><label>24</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Chen</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Jia</surname><given-names>Z</given-names> </name><name name-style="western"><surname>Mercola</surname><given-names>D</given-names> </name><name name-style="western"><surname>Xie</surname><given-names>X</given-names> </name></person-group><article-title>A gradient boosting algorithm for survival analysis via direct optimization of concordance index</article-title><source>Comput Math Methods Med</source><year>2013</year><volume>2013</volume><fpage>873595</fpage><pub-id pub-id-type="doi">10.1155/2013/873595</pub-id><pub-id pub-id-type="medline">24348746</pub-id></nlm-citation></ref><ref id="ref25"><label>25</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Bai</surname><given-names>M</given-names> </name><name name-style="western"><surname>Zheng</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Shen</surname><given-names>Y</given-names> </name></person-group><article-title>Gradient boosting survival tree with applications in credit scoring</article-title><source>J Oper Res Soc</source><year>2022</year><volume>73</volume><issue>1</issue><fpage>39</fpage><lpage>55</lpage><pub-id pub-id-type="doi">10.1080/01605682.2021.1919035</pub-id></nlm-citation></ref><ref id="ref26"><label>26</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Geurts</surname><given-names>P</given-names> </name><name name-style="western"><surname>Ernst</surname><given-names>D</given-names> </name><name name-style="western"><surname>Wehenkel</surname><given-names>L</given-names> </name></person-group><article-title>Extremely randomized trees</article-title><source>Mach Learn</source><year>2006</year><month>04</month><volume>63</volume><fpage>3</fpage><lpage>42</lpage><pub-id pub-id-type="doi">10.1007/s10994-006-6226-1</pub-id></nlm-citation></ref><ref id="ref27"><label>27</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Zaenal</surname><given-names>MS</given-names> </name><name name-style="western"><surname>Fitrianto</surname><given-names>A</given-names> </name><name name-style="western"><surname>Wijayanto</surname><given-names>H</given-names> </name></person-group><article-title>Comparison of extremely randomized survival trees and random survival forests: a simulation study</article-title><source>Sci J Inform</source><year>2024</year><volume>11</volume><issue>3</issue><fpage>635</fpage><lpage>644</lpage><pub-id pub-id-type="doi">10.15294/sji.v11i3.8464</pub-id></nlm-citation></ref><ref id="ref28"><label>28</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Cox</surname><given-names>DR</given-names> </name></person-group><article-title>Regression models and life-tables</article-title><source>J R Stat Soc Ser B Methodol</source><year>1972</year><month>01</month><volume>34</volume><issue>2</issue><fpage>187</fpage><lpage>202</lpage><pub-id pub-id-type="doi">10.1111/j.2517-6161.1972.tb00899.x</pub-id></nlm-citation></ref><ref id="ref29"><label>29</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Cygu</surname><given-names>S</given-names> </name><name name-style="western"><surname>Seow</surname><given-names>H</given-names> </name><name name-style="western"><surname>Dushoff</surname><given-names>J</given-names> </name><name name-style="western"><surname>Bolker</surname><given-names>BM</given-names> </name></person-group><article-title>Comparing machine learning approaches to incorporate time-varying covariates in predicting cancer survival time</article-title><source>Sci Rep</source><year>2023</year><month>01</month><day>25</day><volume>13</volume><issue>1</issue><fpage>1370</fpage><pub-id pub-id-type="doi">10.1038/s41598-023-28393-7</pub-id><pub-id pub-id-type="medline">36697455</pub-id></nlm-citation></ref><ref id="ref30"><label>30</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Schober</surname><given-names>P</given-names> </name><name name-style="western"><surname>Vetter</surname><given-names>TR</given-names> </name></person-group><article-title>Survival analysis and interpretation of time-to-event data: the tortoise and the hare</article-title><source>Anesth Analg</source><year>2018</year><month>09</month><volume>127</volume><issue>3</issue><fpage>792</fpage><lpage>798</lpage><pub-id pub-id-type="doi">10.1213/ANE.0000000000003653</pub-id><pub-id pub-id-type="medline">30015653</pub-id></nlm-citation></ref><ref id="ref31"><label>31</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Deng</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Qin</surname><given-names>HY</given-names> </name><name name-style="western"><surname>Zhou</surname><given-names>YY</given-names> </name><etal/></person-group><article-title>Artificial intelligence applications in pathological diagnosis of gastric cancer</article-title><source>Heliyon</source><year>2022</year><month>12</month><volume>8</volume><issue>12</issue><fpage>e12431</fpage><pub-id pub-id-type="doi">10.1016/j.heliyon.2022.e12431</pub-id><pub-id pub-id-type="medline">36619448</pub-id></nlm-citation></ref><ref id="ref32"><label>32</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Pickett</surname><given-names>KL</given-names> </name><name name-style="western"><surname>Suresh</surname><given-names>K</given-names> </name><name name-style="western"><surname>Campbell</surname><given-names>KR</given-names> </name><name name-style="western"><surname>Davis</surname><given-names>S</given-names> </name><name name-style="western"><surname>Juarez-Colunga</surname><given-names>E</given-names> </name></person-group><article-title>Random survival forests for dynamic predictions of a time-to-event outcome using a longitudinal biomarker</article-title><source>BMC Med Res Methodol</source><year>2021</year><month>10</month><day>17</day><volume>21</volume><issue>1</issue><fpage>216</fpage><pub-id pub-id-type="doi">10.1186/s12874-021-01375-x</pub-id><pub-id pub-id-type="medline">34657597</pub-id></nlm-citation></ref><ref id="ref33"><label>33</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Pedregosa</surname><given-names>F</given-names> </name><name name-style="western"><surname>Varoquaux</surname><given-names>G</given-names> </name><name name-style="western"><surname>Gramfort</surname><given-names>A</given-names> </name><etal/></person-group><article-title>Scikit-learn: machine learning in Python</article-title><source>J Mach Learn Res</source><year>2011</year><access-date>2026-05-21</access-date><volume>12</volume><fpage>2825</fpage><lpage>2830</lpage><comment><ext-link ext-link-type="uri" xlink:href="https://jmlr.org/papers/volume12/pedregosa11a/pedregosa11a.pdf">https://jmlr.org/papers/volume12/pedregosa11a/pedregosa11a.pdf</ext-link></comment></nlm-citation></ref><ref id="ref34"><label>34</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>P&#x00F6;lsterl</surname><given-names>S</given-names> </name></person-group><article-title>scikit-survival: a library for time-to-event analysis built on top of scikit-learn</article-title><source>J Mach Learn Res</source><year>2020</year><access-date>2026-05-21</access-date><volume>21</volume><issue>212</issue><fpage>1</fpage><lpage>6</lpage><comment><ext-link ext-link-type="uri" xlink:href="https://www.jmlr.org/papers/volume21/20-729/20-729.pdf">https://www.jmlr.org/papers/volume21/20-729/20-729.pdf</ext-link></comment></nlm-citation></ref><ref id="ref35"><label>35</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Harrell</surname><given-names>FE Jr</given-names> </name><name name-style="western"><surname>Califf</surname><given-names>RM</given-names> </name><name name-style="western"><surname>Pryor</surname><given-names>DB</given-names> </name><name name-style="western"><surname>Lee</surname><given-names>KL</given-names> </name><name name-style="western"><surname>Rosati</surname><given-names>RA</given-names> </name></person-group><article-title>Evaluating the yield of medical tests</article-title><source>JAMA</source><year>1982</year><month>05</month><day>14</day><volume>247</volume><issue>18</issue><fpage>2543</fpage><lpage>2546</lpage><pub-id pub-id-type="medline">7069920</pub-id></nlm-citation></ref><ref id="ref36"><label>36</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Longato</surname><given-names>E</given-names> </name><name name-style="western"><surname>Vettoretti</surname><given-names>M</given-names> </name><name name-style="western"><surname>Di Camillo</surname><given-names>B</given-names> </name></person-group><article-title>A practical perspective on the concordance index for the evaluation and selection of prognostic time-to-event models</article-title><source>J Biomed Inform</source><year>2020</year><month>08</month><volume>108</volume><fpage>103496</fpage><pub-id pub-id-type="doi">10.1016/j.jbi.2020.103496</pub-id><pub-id pub-id-type="medline">32652236</pub-id></nlm-citation></ref><ref id="ref37"><label>37</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Uno</surname><given-names>H</given-names> </name><name name-style="western"><surname>Cai</surname><given-names>T</given-names> </name><name name-style="western"><surname>Pencina</surname><given-names>MJ</given-names> </name><name name-style="western"><surname>D&#x2019;Agostino</surname><given-names>RB</given-names> </name><name name-style="western"><surname>Wei</surname><given-names>LJ</given-names> </name></person-group><article-title>On the C-statistics for evaluating overall adequacy of risk prediction procedures with censored survival data</article-title><source>Stat Med</source><year>2011</year><month>05</month><day>10</day><volume>30</volume><issue>10</issue><fpage>1105</fpage><lpage>1117</lpage><pub-id pub-id-type="doi">10.1002/sim.4154</pub-id><pub-id pub-id-type="medline">21484848</pub-id></nlm-citation></ref><ref id="ref38"><label>38</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Schmid</surname><given-names>M</given-names> </name><name name-style="western"><surname>Wright</surname><given-names>MN</given-names> </name><name name-style="western"><surname>Ziegler</surname><given-names>A</given-names> </name></person-group><article-title>On the use of Harrell&#x2019;s C for clinical risk prediction via random survival forests</article-title><source>Expert Syst Appl</source><year>2016</year><month>11</month><volume>63</volume><fpage>450</fpage><lpage>459</lpage><pub-id pub-id-type="doi">10.1016/j.eswa.2016.07.018</pub-id></nlm-citation></ref><ref id="ref39"><label>39</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Arnold</surname><given-names>M</given-names> </name><name name-style="western"><surname>Park</surname><given-names>JY</given-names> </name><name name-style="western"><surname>Camargo</surname><given-names>MC</given-names> </name><name name-style="western"><surname>Lunet</surname><given-names>N</given-names> </name><name name-style="western"><surname>Forman</surname><given-names>D</given-names> </name><name name-style="western"><surname>Soerjomataram</surname><given-names>I</given-names> </name></person-group><article-title>Is gastric cancer becoming a rare disease? A global assessment of predicted incidence trends to 2035</article-title><source>Gut</source><year>2020</year><month>05</month><volume>69</volume><issue>5</issue><fpage>823</fpage><lpage>829</lpage><pub-id pub-id-type="doi">10.1136/gutjnl-2019-320234</pub-id><pub-id pub-id-type="medline">32001553</pub-id></nlm-citation></ref><ref id="ref40"><label>40</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Li</surname><given-names>J</given-names> </name></person-group><article-title>Gastric cancer in young adults: a different clinical entity from carcinogenesis to prognosis</article-title><source>Gastroenterol Res Pract</source><year>2020</year><volume>2020</volume><fpage>9512707</fpage><pub-id pub-id-type="doi">10.1155/2020/9512707</pub-id><pub-id pub-id-type="medline">32190044</pub-id></nlm-citation></ref><ref id="ref41"><label>41</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Heer</surname><given-names>EV</given-names> </name><name name-style="western"><surname>Harper</surname><given-names>AS</given-names> </name><name name-style="western"><surname>Sung</surname><given-names>H</given-names> </name><name name-style="western"><surname>Jemal</surname><given-names>A</given-names> </name><name name-style="western"><surname>Fidler-Benaoudia</surname><given-names>MM</given-names> </name></person-group><article-title>Emerging cancer incidence trends in Canada: the growing burden of young adult cancers</article-title><source>Cancer</source><year>2020</year><month>10</month><day>15</day><volume>126</volume><issue>20</issue><fpage>4553</fpage><lpage>4562</lpage><pub-id pub-id-type="doi">10.1002/cncr.33050</pub-id><pub-id pub-id-type="medline">32770762</pub-id></nlm-citation></ref><ref id="ref42"><label>42</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Song</surname><given-names>P</given-names> </name><name name-style="western"><surname>Wu</surname><given-names>L</given-names> </name><name name-style="western"><surname>Jiang</surname><given-names>B</given-names> </name><name name-style="western"><surname>Liu</surname><given-names>Z</given-names> </name><name name-style="western"><surname>Cao</surname><given-names>K</given-names> </name><name name-style="western"><surname>Guan</surname><given-names>W</given-names> </name></person-group><article-title>Age-specific effects on the prognosis after surgery for gastric cancer: a SEER population-based analysis</article-title><source>Oncotarget</source><year>2016</year><month>07</month><day>26</day><volume>7</volume><issue>30</issue><fpage>48614</fpage><lpage>48624</lpage><pub-id pub-id-type="doi">10.18632/oncotarget.9548</pub-id><pub-id pub-id-type="medline">27224925</pub-id></nlm-citation></ref><ref id="ref43"><label>43</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Zhang</surname><given-names>H</given-names> </name><name name-style="western"><surname>Cheng</surname><given-names>X</given-names> </name><name name-style="western"><surname>Guo</surname><given-names>W</given-names> </name><etal/></person-group><article-title>Metastasis patterns and prognosis in young gastric cancer patients: a propensity score&#x2011;matched SEER database analysis</article-title><source>PLoS One</source><year>2024</year><volume>19</volume><issue>4</issue><fpage>e0301834</fpage><pub-id pub-id-type="doi">10.1371/journal.pone.0301834</pub-id></nlm-citation></ref><ref id="ref44"><label>44</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Fryan</surname><given-names>LH</given-names> </name><name name-style="western"><surname>Alazzam</surname><given-names>MB</given-names> </name></person-group><article-title>Survival analysis of oncological patients using machine learning method</article-title><source>Healthcare (Basel)</source><year>2022</year><month>12</month><day>27</day><volume>11</volume><issue>1</issue><fpage>80</fpage><pub-id pub-id-type="doi">10.3390/healthcare11010080</pub-id><pub-id pub-id-type="medline">36611540</pub-id></nlm-citation></ref><ref id="ref45"><label>45</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Tizi</surname><given-names>W</given-names> </name><name name-style="western"><surname>Berrado</surname><given-names>A</given-names> </name></person-group><article-title>Machine learning for survival analysis in cancer research: a comparative study</article-title><source>Sci Afr</source><year>2023</year><month>09</month><volume>21</volume><fpage>e01880</fpage><pub-id pub-id-type="doi">10.1016/j.sciaf.2023.e01880</pub-id></nlm-citation></ref><ref id="ref46"><label>46</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Wu</surname><given-names>M</given-names> </name><name name-style="western"><surname>Yang</surname><given-names>X</given-names> </name><name name-style="western"><surname>Liu</surname><given-names>Y</given-names> </name><etal/></person-group><article-title>Development and validation of a deep learning model for predicting postoperative survival of patients with gastric cancer</article-title><source>BMC Public Health</source><year>2024</year><month>03</month><day>6</day><volume>24</volume><issue>1</issue><fpage>723</fpage><pub-id pub-id-type="doi">10.1186/s12889-024-18221-6</pub-id><pub-id pub-id-type="medline">38448849</pub-id></nlm-citation></ref><ref id="ref47"><label>47</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Afrash</surname><given-names>MR</given-names> </name><name name-style="western"><surname>Mirbagheri</surname><given-names>E</given-names> </name><name name-style="western"><surname>Mashoufi</surname><given-names>M</given-names> </name><name name-style="western"><surname>Kazemi-Arpanahi</surname><given-names>H</given-names> </name></person-group><article-title>Optimizing prognostic factors of five-year survival in gastric cancer patients using feature selection techniques with machine learning algorithms: a comparative study</article-title><source>BMC Med Inform Decis Mak</source><year>2023</year><month>04</month><day>6</day><volume>23</volume><issue>1</issue><fpage>54</fpage><pub-id pub-id-type="doi">10.1186/s12911-023-02154-y</pub-id><pub-id pub-id-type="medline">37024885</pub-id></nlm-citation></ref><ref id="ref48"><label>48</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Zhang</surname><given-names>C</given-names> </name><name name-style="western"><surname>Zhang</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Yang</surname><given-names>YH</given-names> </name><etal/></person-group><article-title>Machine learning models for predicting one-year survival in patients with metastatic gastric cancer who experienced upfront radical gastrectomy</article-title><source>Front Mol Biosci</source><year>2022</year><volume>9</volume><fpage>937242</fpage><pub-id pub-id-type="doi">10.3389/fmolb.2022.937242</pub-id><pub-id pub-id-type="medline">36533072</pub-id></nlm-citation></ref><ref id="ref49"><label>49</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Koh</surname><given-names>B</given-names> </name><name name-style="western"><surname>Tan</surname><given-names>DJ</given-names> </name><name name-style="western"><surname>Ng</surname><given-names>CH</given-names> </name><etal/></person-group><article-title>Patterns in cancer incidence among people younger than 50 years in the US, 2010 to 2019</article-title><source>JAMA Netw Open</source><year>2023</year><month>08</month><day>1</day><volume>6</volume><issue>8</issue><fpage>e2328171</fpage><pub-id pub-id-type="doi">10.1001/jamanetworkopen.2023.28171</pub-id><pub-id pub-id-type="medline">37585204</pub-id></nlm-citation></ref><ref id="ref50"><label>50</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Sadeghi</surname><given-names>Z</given-names> </name><name name-style="western"><surname>Alizadehsani</surname><given-names>R</given-names> </name><name name-style="western"><surname>Cifci</surname><given-names>MA</given-names> </name><etal/></person-group><article-title>A review of explainable artificial intelligence in healthcare</article-title><source>Comput Electr Eng</source><year>2024</year><month>08</month><volume>118</volume><fpage>109370</fpage><pub-id pub-id-type="doi">10.1016/j.compeleceng.2024.109370</pub-id></nlm-citation></ref><ref id="ref51"><label>51</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Zhou</surname><given-names>H</given-names> </name><name name-style="western"><surname>Ren</surname><given-names>D</given-names> </name><name name-style="western"><surname>Xia</surname><given-names>H</given-names> </name><name name-style="western"><surname>Fan</surname><given-names>M</given-names> </name><name name-style="western"><surname>Yang</surname><given-names>X</given-names> </name><name name-style="western"><surname>Huang</surname><given-names>H</given-names> </name></person-group><article-title>AST-GNN: an attention-based spatio-temporal graph neural network for Interaction-aware pedestrian trajectory prediction</article-title><source>Neurocomputing</source><year>2021</year><month>07</month><volume>445</volume><fpage>298</fpage><lpage>308</lpage><pub-id pub-id-type="doi">10.1016/j.neucom.2021.03.024</pub-id></nlm-citation></ref><ref id="ref52"><label>52</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Fan</surname><given-names>M</given-names> </name><name name-style="western"><surname>Zhang</surname><given-names>X</given-names> </name><name name-style="western"><surname>Hu</surname><given-names>J</given-names> </name><name name-style="western"><surname>Gu</surname><given-names>N</given-names> </name><name name-style="western"><surname>Tao</surname><given-names>D</given-names> </name></person-group><article-title>Adaptive data structure regularized multiclass discriminative feature selection</article-title><source>IEEE Trans Neural Netw Learn Syst</source><year>2022</year><volume>33</volume><issue>10</issue><fpage>5859</fpage><lpage>5872</lpage><pub-id pub-id-type="doi">10.1109/TNNLS.2021.3071603</pub-id></nlm-citation></ref><ref id="ref53"><label>53</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Li</surname><given-names>X</given-names> </name><name name-style="western"><surname>Huang</surname><given-names>H</given-names> </name><name name-style="western"><surname>Zhao</surname><given-names>H</given-names> </name><name name-style="western"><surname>Wang</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Hu</surname><given-names>M</given-names> </name></person-group><article-title>Learning a convolutional neural network for propagation-based stereo image segmentation</article-title><source>Vis Comput</source><year>2020</year><month>01</month><volume>36</volume><fpage>39</fpage><lpage>52</lpage><pub-id pub-id-type="doi">10.1007/s00371-018-1582-y</pub-id></nlm-citation></ref><ref id="ref54"><label>54</label><nlm-citation citation-type="web"><source>Korea-Clinical data Utilization network for Research Excellence</source><access-date>2024-05-22</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://k-cure.mohw.go.kr">https://k-cure.mohw.go.kr</ext-link></comment></nlm-citation></ref><ref id="ref55"><label>55</label><nlm-citation citation-type="web"><article-title>Predicting mortality in young patients with gastric cancer</article-title><source>GitHub</source><access-date>2026-05-10</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://github.com/KwangSun-Ryu/gastric_cancer_mortality">https://github.com/KwangSun-Ryu/gastric_cancer_mortality</ext-link></comment></nlm-citation></ref></ref-list><app-group><supplementary-material id="app1"><label>Multimedia Appendix 1</label><p>Baseline characteristics of the older and younger patient groups.</p><media xlink:href="cancer_v12i1e86418_app1.docx" xlink:title="DOCX File, 31 KB"/></supplementary-material><supplementary-material id="app2"><label>Multimedia Appendix 2</label><p>C-index values of the survival prediction models.</p><media xlink:href="cancer_v12i1e86418_app2.docx" xlink:title="DOCX File, 38 KB"/></supplementary-material><supplementary-material id="app3"><label>Multimedia Appendix 3</label><p>Relative feature importance of predictors in the survival prediction model.</p><media xlink:href="cancer_v12i1e86418_app3.docx" xlink:title="DOCX File, 103 KB"/></supplementary-material><supplementary-material id="app4"><label>Multimedia Appendix 4</label><p>Univariate analysis results for all causes of death.</p><media xlink:href="cancer_v12i1e86418_app4.docx" xlink:title="DOCX File, 34 KB"/></supplementary-material><supplementary-material id="app5"><label>Multimedia Appendix 5</label><p>Mapping between heat map feature labels and clinical variables.</p><media xlink:href="cancer_v12i1e86418_app5.docx" xlink:title="DOCX File, 25 KB"/></supplementary-material><supplementary-material id="app6"><label>Multimedia Appendix 6</label><p>Survival curve for younger and older patients.</p><media xlink:href="cancer_v12i1e86418_app6.docx" xlink:title="DOCX File, 226 KB"/></supplementary-material><supplementary-material id="app7"><label>Multimedia Appendix 7</label><p>Survival curve for stage and tumor size.</p><media xlink:href="cancer_v12i1e86418_app7.docx" xlink:title="DOCX File, 175 KB"/></supplementary-material><supplementary-material id="app8"><label>Multimedia Appendix 8</label><p>Comparison of predictive performance between American Joint Committee on Cancer stage and survival machine learning models.</p><media xlink:href="cancer_v12i1e86418_app8.docx" xlink:title="DOCX File, 17 KB"/></supplementary-material><supplementary-material id="app9"><label>Multimedia Appendix 9</label><p>Comparison of year-based data splitting and the 7:3 random split.</p><media xlink:href="cancer_v12i1e86418_app9.docx" xlink:title="DOCX File, 34 KB"/></supplementary-material></app-group></back></article>