Explainable Machine Learning for Preoperative Relapse Prediction in Molecularly Stratified Endometrial Cancer: A Single-Center Finnish Cohort Study

doi:10.1101/2025.11.06.686680

Explainable Machine Learning for Preoperative Relapse Prediction in Molecularly Stratified Endometrial Cancer: A Single-Center Finnish Cohort Study

2025 · doi:10.1101/2025.11.06.686680

preprint OA: closed

📄 Open PDF Full text JSON View at publisher

Full text 85,196 characters · extracted from preprint-html · click to expand

Explainable Machine Learning for Preoperative Relapse Prediction in Molecularly Stratified Endometrial Cancer: A Single-Center Finnish Cohort Study | bioRxiv /* */ /* */ <!-- <!-- /*! * yepnope1.5.4 * (c) WTFPL, GPLv2 */ (function(a,b,c){function d(a){return"[object Function]"==o.call(a)}function e(a){return"string"==typeof a}function f(){}function g(a){return!a||"loaded"==a||"complete"==a||"uninitialized"==a}function h(){var a=p.shift();q=1,a?a.t?m(function(){("c"==a.t?B.injectCss:B.injectJs)(a.s,0,a.a,a.x,a.e,1)},0):(a(),h()):q=0}function i(a,c,d,e,f,i,j){function k(b){if(!o&&g(l.readyState)&&(u.r=o=1,!q&&h(),l.onload=l.onreadystatechange=null,b)){"img"!=a&&m(function(){t.removeChild(l)},50);for(var d in y[c])y[c].hasOwnProperty(d)&&y[c][d].onload()}}var j=j||B.errorTimeout,l=b.createElement(a),o=0,r=0,u={t:d,s:c,e:f,a:i,x:j};1===y[c]&&(r=1,y[c]=[]),"object"==a?l.data=c:(l.src=c,l.type=a),l.width=l.height="0",l.onerror=l.onload=l.onreadystatechange=function(){k.call(this,r)},p.splice(e,0,u),"img"!=a&&(r||2===y[c]?(t.insertBefore(l,s?null:n),m(k,j)):y[c].push(l))}function j(a,b,c,d,f){return q=0,b=b||"j",e(a)?i("c"==b?v:u,a,b,this.i++,c,d,f):(p.splice(this.i++,0,a),1==p.length&&h()),this}function k(){var a=B;return a.loader={load:j,i:0},a}var l=b.documentElement,m=a.setTimeout,n=b.getElementsByTagName("script")[0],o={}.toString,p=[],q=0,r="MozAppearance"in l.style,s=r&&!!b.createRange().compareNode,t=s?l:n.parentNode,l=a.opera&&"[object Opera]"==o.call(a.opera),l=!!b.attachEvent&&!l,u=r?"object":l?"script":"img",v=l?"script":u,w=Array.isArray||function(a){return"[object Array]"==o.call(a)},x=[],y={},z={timeout:function(a,b){return b.length&&(a.timeout=b[0]),a}},A,B;B=function(a){function b(a){var a=a.split("!"),b=x.length,c=a.pop(),d=a.length,c={url:c,origUrl:c,prefixes:a},e,f,g;for(f=0;f<d;f++)g=a[f].split("="),(e=z[g.shift()])&&(c=e(c,g));for(f=0;f<b;f++)c=x[f](c);return c}function g(a,e,f,g,h){var 
i=b(a),j=i.autoCallback;i.url.split(".").pop().split("?").shift(),i.bypass||(e&&(e=d(e)?e:e[a]||e[g]||e[a.split("/").pop().split("?")[0]]),i.instead?i.instead(a,e,f,g,h):(y[i.url]?i.noexec=!0:y[i.url]=1,f.load(i.url,i.forceCSS||!i.forceJS&&"css"==i.url.split(".").pop().split("?").shift()?"c":c,i.noexec,i.attrs,i.timeout),(d(e)||d(j))&&f.load(function(){k(),e&&e(i.origUrl,h,g),j&&j(i.origUrl,h,g),y[i.url]=2})))}function h(a,b){function c(a,c){if(a){if(e(a))c||(j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}),g(a,j,b,0,h);else if(Object(a)===a)for(n in m=function(){var b=0,c;for(c in a)a.hasOwnProperty(c)&&b++;return b}(),a)a.hasOwnProperty(n)&&(!c&&!--m&&(d(j)?j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}:j[n]=function(a){return function(){var b=[].slice.call(arguments);a&&a.apply(this,b),l()}}(k[n])),g(a[n],j,b,n,h))}else!c&&l()}var h=!!a.test,i=a.load||a.both,j=a.callback||f,k=j,l=a.complete||f,m,n;c(h?a.yep:a.nope,!!i),i&&c(i)}var i,j,l=this.yepnope.loader;if(e(a))g(a,0,l,0);else if(w(a))for(i=0;i (function(w,d,s,l,i){w[l]=w[l]||[];w[l].push({'gtm.start':new Date().getTime(),event:'gtm.js'});var f=d.getElementsByTagName(s)[0];var j=d.createElement(s);var dl=l!='dataLayer'?'&l='+l:'';j.src='//www.googletagmanager.com/gtm.js?id='+i+dl;j.type='text/javascript';j.async=true;f.parentNode.insertBefore(j,f);})(window,document,'script','dataLayer','GTM-M677548'); Skip to main content Home About Submit ALERTS / RSS Search for this keyword Advanced Search New Results Explainable Machine Learning for Preoperative Relapse Prediction in Molecularly Stratified Endometrial Cancer: A Single-Center Finnish Cohort Study View ORCID Profile Sergio Vela Moreno , View ORCID Profile Masuma Khatun , View ORCID Profile Annukka Pasanen , View ORCID Profile Ralf Bützow , View ORCID Profile Andres Salumets , View ORCID Profile Mikko Loukovaara , View ORCID Profile Vijayachitra Modhukur doi: https://doi.org/10.1101/2025.11.06.686680 Sergio Vela Moreno 1 
Department of Obstetrics and Gynecology, Institute of Clinical Medicine, University of Tartu , Tartu, Estonia 2 Celvia CC , Tartu, Estonia, Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Sergio Vela Moreno Masuma Khatun 3 Helsinki University Hospital and University of Helsinki, Department of Obstetrics and Gynecology , Helsinki, Finland 4 University of Helsinki, Faculty of Medicine, Helsinki University Hospital, and Research Program in Applied Tumor Genomics, Department of Pathology , Helsinki, Finland Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Masuma Khatun Annukka Pasanen 4 University of Helsinki, Faculty of Medicine, Helsinki University Hospital, and Research Program in Applied Tumor Genomics, Department of Pathology , Helsinki, Finland Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Annukka Pasanen Ralf Bützow 3 Helsinki University Hospital and University of Helsinki, Department of Obstetrics and Gynecology , Helsinki, Finland 4 University of Helsinki, Faculty of Medicine, Helsinki University Hospital, and Research Program in Applied Tumor Genomics, Department of Pathology , Helsinki, Finland Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Ralf Bützow Andres Salumets 1 Department of Obstetrics and Gynecology, Institute of Clinical Medicine, University of Tartu , Tartu, Estonia 2 Celvia CC , Tartu, Estonia, 5 Department of Clinical Science, Intervention and Technology, Karolinska Institute and Karolinska University Hospital , Stockholm, Sweden, Finland Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Andres Salumets Mikko Loukovaara 3 Helsinki University Hospital and University of Helsinki, Department of Obstetrics and 
Gynecology , Helsinki, Finland 6 Helsinki University Hospital and University of Helsinki, Comprehensive Cancer Center , Helsinki, Finland Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Mikko Loukovaara Vijayachitra Modhukur 1 Department of Obstetrics and Gynecology, Institute of Clinical Medicine, University of Tartu , Tartu, Estonia 2 Celvia CC , Tartu, Estonia, Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Vijayachitra Modhukur For correspondence: vijayachitra.modhukur{at}ut.ee Abstract Full Text Info/History Metrics Supplementary material Preview PDF Abstract Relapse risk in endometrial carcinoma (EC) is strongly influenced by molecular subtype, yet current WHO/ESGO classifications rely on postoperative data, limiting their utility for preoperative decision-making. We developed and compared interpretable machine learning (ML) models to predict relapse timing (none, ≤6 months, >6 months) using exclusively preoperative multimodal data. In a retrospective cohort of 784 EC patients, we integrated clinicopathological, molecular, immunohistochemical, and systemic biomarkers and constructed four feature strategies: (1) Traditional (clinicopathology), (2) ESGO (guideline risk groups), (3) TP53 + MMRd (high-risk biology), and (4) POLE (low-risk biology). Classifiers (Random Forest (RF), Support Vector Machine (SVM), k-Nearest Neighbors (KNN), Gradient Boosting (GBM)) were trained with leakage-safe preprocessing and in-fold resampling; performance was evaluated via area under the curve (AUC), accuracy, recall, and F1 score, and interpretability via SHapley Additive exPlanations (SHAP). The RF-based Traditional model achieved the highest overall performance (F1 = 0.895, AUC = 0.84), while the GBM-based POLE model showed superior sensitivity (F1 = 0.886, AUC = 0.842). 
SHAP identified ARID1A loss, elevated CA125, thrombocytosis, and p16 expression among key predictors of relapse, while overlapping high-risk features across models included advanced stage, deeper myometrial invasion, elevated CA125, and positive cytology. These biologically coherent, explainable predictions support individualized risk stratification and may enhance preoperative decision-making, particularly for aggressive histology and high-risk molecular subtypes. Download figure Open in new tab Graphical abstract Workflow for Machine Learning (ML)–based relapse prediction in endometrial cancer. The schematic figure outlines the study pipeline from patient inclusion to clinical application. (A) A retrospective cohort of 784 EC patients was analyzed, integrating clinical, demographic, biomarker, and molecular data into a multimodal feature set. Patients were stratified into four molecular subgroups: NSMP, p53abn, MMRd, and POLE mut. Multiple ML algorithms (Random Forest, SVM, XGBoost, k-NN) were trained to predict relapse timing. (B) Model performance was evaluated using area under the curve (AUC) and accuracy metrics, with SHapley Additive exPlanations (SHAP) analysis applied to identify key predictive features across models. (C) SHAP-based interpretation was used to support individualized relapse risk stratification, enabling potential clinical decision-making for surveillance and therapy. Highlights Pre-operative XAI models predict relapse timing in EC with an AUC of up to 0.842. The traditional model achieves a top accuracy of 0.797 using 22 features, while POLE maximizes sensitivity at 0.886. SHAP explanations identify class-specific drivers such as stage, LVSI, size, cytology, CA125, and PR. Early Relapse is associated with burden and aggressiveness, Late Relapse relates to the spread and size of EC, and No Relapse indicates an inverse profile. Transparent outputs facilitate risk-aligned surveillance and treatment planning before surgery. 1. 
Introduction Endometrial cancer (EC) is the most common gynaecologic malignancy in developed countries, with incidence and mortality projected to increase by 55% by 2030 ( Clarke et al., 2022 ; Onstad et al., 2016 ), largely driven by obesity and metabolic syndrome ( Onstad et al., 2016 ; Siegel et al., 2022 ). Despite advances in adjuvant therapies, including immunotherapy trials (RUBY, GY018, and DUO-E) ( Bogani et al., 2024 ; Yang and Wang, 2019 ), 15–20% of patients experience relapse, often in the vaginal vault, pelvis, peritoneum, or distant organs, with a poor prognosis and limited treatment options ( Beavis and Fader, 2022 ; Crosbie et al., 2022 ; Tuninetti et al., 2024 ). Endometrial carcinosarcoma, a rare but highly aggressive subtype accounting for 5-6% of ECs ( Capozzi et al., 2024 ), exhibits relapse rates of 40–60% and high mortality ( Cantrell et al., 2015 ). Traditional risk stratification relies on clinicopathological features such as age, tumor grade, FIGO (International Federation of Gynecology and Obstetrics) stage, and lymphovascular space invasion (LVSI) ( Concin et al., 2021 ; Zwahlen et al., 2016 ). However, these parameters often lack reproducibility and prognostic accuracy, particularly in high-risk or recurrent cases ( Oaknin et al., 2022 ). Molecular classifiers, including The Cancer Genome Atlas (TCGA) and its clinical surrogate, The Proactive Molecular Risk Classifier for Endometrial Cancer (ProMisE), have refined EC stratification into four distinct subtypes: POLE -ultramutated ( POLE mut, favorable, low relapse risk), mismatch repair-deficient (MMRd, higher relapse risk), p53-abnormal (p53abn, poor prognosis, higher relapse risk), and no specific molecular profile (NSMP, intermediate) ( Lee et al., 2025 ; Levine, 2013 ). These are now integrated into the 2023 FIGO staging, which recognizes POLEmut tumors as favorable and p53abn as adverse, even in early-stage disease ( Gaffney et al., 2024 ; Talhouk et al., 2017 ). 
Despite these advances, relapse prediction remains challenging, particularly in NSMP, p53abn, and carcinosarcoma subgroups ( León-Castillo et al., 2025 ; McCluggage et al., 2023 ). Existing models often fail to incorporate comprehensive molecular and clinical variables ( Urick and Bell, 2019 ), while symptom-based surveillance may miss early asymptomatic relapses that are linked to poorer outcomes ( Backes et al., 2018 ; Kommoss et al., 2018 ). Post-relapse survival varies significantly: 43 months for MMRd, 39 for NSMP, and only 10 for p53abn, underscoring the urgent need for improved predictive tools ( León-Castillo, 2023 ; Siegenthaler et al., 2022 ). Tissue biomarkers (e.g., ARID1A ( Liu et al., 2017 ), p16 ( Murali et al., 2019 ), β-catenin, and E-cadherin ( Schlosshauer et al., 2002 )) and systemic markers (e.g., CA125, platelet count) ( Njoku et al., 2022 ; Schlosshauer et al., 2002 ) show promise but lack integration into multivariable risk models. Machine learning (ML) continues to show promise in enhancing relapse prediction in EC, particularly when integrated with molecular classification. Ensemble models (e.g., AdaBoost, XGBoost, and Random Forest, RF) combined with interpretability tools like SHAP (SHapley Additive exPlanations) have boosted both predictive accuracy and clinical applicability. For instance, the TJHPEC model achieved an area under the curve (AUC) of 0.93 using routine clinical features across 1,935 patients ( Wang et al., 2022 ), while radiomics-based models leveraging preoperative CT scans reached AUCs up to 0.90 ( Coada et al., 2023 ). Molecularly informed models like im4MEC correlated strongly with 5-year relapse-free survival ( Fremond et al., 2023 ) and NU-CAT predicted progression and relapse with 75% accuracy ( Zheng et al., 2023 ). 
Additional approaches include Random Forest (RF)-based predictors of high-grade EC (AUC 0.85) ( Piedimonte et al., 2022 ), biomarker-integrated nomograms ( Cong et al., 2023 ), deep learning on haematoxylin and eosin (H&E)-stained slides ( Coudray et al., 2018 ; Fu et al., 2020 ), and the HECTOR model for distant relapse prediction ( Volinsky-Fremond et al., 2024 ). However, few models have been validated in molecularly stratified cohorts, and preoperative, multi-class prediction of relapse timing, particularly in high-risk EC and carcinosarcoma, remains underexplored. To address these gaps, we developed and compared interpretable ML models for preoperative prediction of relapse timing (No Relapse, ≤6 months, >6 months) in EC, including carcinosarcoma. Four complementary feature strategies were implemented: (1) a Traditional clinicopathological model, (2) an ESGO guideline-based model, (3) a TP53 + MMRd biology-driven high-risk model, and (4) a POLE low-risk model. By integrating multimodal preoperative data, including molecular classifiers, biomarkers, and clinicopathological features, we sought to evaluate trade-offs between accuracy, sensitivity, and clinical utility, while ensuring model interpretability through SHAP (SHapley Additive exPlanations). 2. Materials and Methods 2.1 Study Design and Patient Cohort This retrospective study included 784 patients with stage I–IV EC who underwent hysterectomy at Helsinki University Hospital between 2007 and 2013. Ethical approval was obtained from the Helsinki University Hospital Institutional Review Board (HUS/491/2021) and the Finnish Medicines Agency (FIMEA/2021/005153). Informed consent was waived for this retrospective cohort. Clinicopathological data were retrieved from institutional records. Staging followed the FIGO 2009 guidelines ( Pecorelli, 2009 ). Tumours were classified into molecular and clinicopathological risk groups using the ESGO/ESTRO/ESP 2021 guidelines ( Concin et al., 2021 ). 
Tumours were classified into low, intermediate, high-intermediate, high, and advanced-metastatic risk categories based on molecular subtype and clinicopathological factors, including histology, grade, depth of myometrial invasion, LVSI, and FIGO stage. The guidelines do not assign risk categories to stage I–IVA MMRd and NSMP clear cell carcinomas with myometrial invasion, or to stage III–IVA POLE mut tumours, due to limited supporting data. In this study, these tumors were classified as high-risk. LVSI was assessed using a three-tiered system: none, focal, or substantial ( Concin et al., 2021 ). Relapse status was obtained from hospital or referral centre records, and cytology from peritoneal washings taken during surgery. 2.2 Preoperative Clinical and Biomarker Assessment Preoperative data included American Society of Anaesthesiologists (ASA) physical status scores extracted from anaesthesia records and standardized to the 2014 classification system ( Kolehmainen et al., 2019 ). Patients who were current smokers, had a BMI of 30–40 kg/m², or had well-controlled diabetes were assigned ASA II, while those with severe obesity (BMI ≥40 kg/m²) were classified as ASA III. Hematologic parameters were obtained from pre-treatment blood count using photometry, impedance, and flow cytometry. Anaemia was defined as haemoglobin (Hb) below the reference cut-off, leukocytosis as leucocytes >8.2×10⁹/L, and thrombocytosis as platelets >360×10⁹/L ( Nordin et al., 2004 ) [editorial note: the numeric haemoglobin cut-off and the "leukocytosis" clause were lost during text extraction and are reconstructed here; verify against the publisher version]. Serum CA125 levels were measured via chemiluminescent microparticle immunoassay on the Abbott Architect 2000i system, with values >35 U/mL considered elevated ( Bast et al., 1981 ). A tumor size threshold of 25 mm was applied based on prior evidence linking it to relapse risk ( Sozzi et al., 2018 ). 2.3 Molecular Classification and Immunohistochemistry Multicore tissue microarrays (four tumor cores/case) were constructed following established protocols and scanned using the 3D Histech Pannoramic 250 Flash II. Digital images were reviewed via WebMicroscope. 
Immunohistochemical (IHC) scoring was performed by a pathologist blinded to clinical outcomes (A.P.), with equivocal cases confirmed by a second pathologist (R.B.) ( Khatun et al., 2025 ; Khatun et al., 2021 ; Pasanen et al., 2016 ). Molecular classification followed WHO guidance, assigning tumors to MMRd, p53abn, POLE mut, or NSMP. In cases with overlapping features, classification was based on the prognostically dominant alteration ( Höhn et al., 2021 ; León-Castillo et al., 2020 ; Pasanen et al., 2021 ; Pasanen et al., 2020 ). Fresh-frozen tumor samples were collected for POLE mutation analysis, with exonuclease-domain hotspot mutations confirmed by targeted sequencing (exon 9, 13, 14) ( Pasanen et al., 2019 ). IHC panels, scoring thresholds, and assay details are summarized in Supplementary Table S1. 2.4 Explainable Machine Learning Framework Supervised machine learning pipelines were implemented to predict relapse risk as a multi-class outcome: No Relapse, ≤6 months, or >6 months. Data were pre-processed by eliminating features with >30% missing values, and only pre-operative variables were retained. Missing values were imputed using median/mode substitution with the na.roughfix function in the R package randomForest . Variables were one-hot encoded, normalized, and outliers capped using interquartile range (IQR) thresholds. After this preprocessing, the final feature sets were selected for every molecular dataset (28–29 variables depending on the molecular dataset). To capture different perspectives of relapse prediction, four complementary models were developed. The Traditional model incorporated established clinicopathological features (FIGO stage, grade, histology, LVSI, tumor size, receptor status) and served as the benchmark reflecting current practice. The ESGO model applied the 2021 ESGO/ESTRO/ESP risk classification as a guideline-based comparator. 
The TP53 + MMRd model targets two molecularly defined high-risk subgroups (TP53-abnormal and MMR-deficient) with a compact, biology-driven feature set. Finally, the POLE model focused on the biologically distinct POLE mut subgroup, typically associated with excellent prognosis, to assess whether subgroup-specific modeling improved discrimination. For each strategy (traditional, ESGO, TP53 + MMRd, POLE), a dedicated data frame was generated and split into 70:20:10 train-test-validation sets. Recursive feature elimination (RFE) was performed using 10-fold cross-validation (CV), optimizing the F1 score for risk prediction, given the significant class imbalance. Feature selection was implemented manually using the tidymodels R package. Tumor size thresholds were iteratively optimized to improve accuracy ( Sozzi et al., 2018 ). 2.5 Model Development and Evaluation Four supervised classification algorithms were evaluated: Random Forest (RF), Support Vector Machines (SVM), k-Nearest Neighbors (KNN), and Gradient Boosting (GBM). Models were optimized using grid search with 10-fold stratified cross-validation. Class imbalance was addressed through SMOTE, under-sampling, and oversampling, which were applied within each fold. All models for relapse risk were optimized for AUC, a threshold-invariant metric that minimizes the effect of class imbalance. Evaluation metrics included: ● Accuracy = (TP + TN) / (TP + TN + FP + FN) ● Recall/Sensitivity = TP / (TP + FN) ● F1-score = 2TP / (2TP + FP + FN) ● AUC for each class, calculated as the integral under the ROC curve (representation of True Positive Rate (TPR) (TP / (TP + FN)) and False Positive Rate (FPR) (FP / (FP + TN))). ● Area under the Precision-Recall curve (PR-AUC) for each class, calculated as the integral under the Precision-Recall curve (representation of Precision (TP / (TP + FP)) and Recall (TP / (TP + FN))). 
TP=True Positive, FP=False Positive, TN=True Negative, FN=False Negative All models were implemented in R 4.5.0 using caret 7.0-1, randomForest 4.7-1.2, dplyr 1.1.2, gbm 2.2.2, kernelshap 0.7.0, and shapviz 0.9.7. Analyses were performed on a 64-core Intel Xeon server (256 GB RAM, Ubuntu 20.04 LTS). 2.6 XAI-Based Model Interpretability To enhance clinical trust and applicability, SHAP was employed to quantify feature contributions to predictions ( Lundberg et al., 2017 ). SHAP values were computed using kernelshap with k-means background sampling (m=50, 1,000 samples per observation). Class-specific SHAP values were visualized using shapviz, enabling identification of key predictors for each relapse category (Early, Late, No Relapse). Implementations were performed using R packages kernelshap and shapviz . A summary of the ML algorithms and parameters is shown in Table 1 . View this table: View inline View popup Download powerpoint Table 1. Summary of the Machine Learning algorithm. 3. Results 3.1 Patient Cohort and Molecular Stratification A total of 784 patients with EC were included, of whom 172 (22%) experienced relapse — 76 Early (≤6 months) and 96 Late (>6 months) relapse. The remaining 612 patients (78%) remained relapse-free. Patients were stratified into four molecular subgroups: MMRd (64.0%), NSMP (23.9%), p53abn (8.3%), and POLEmut (3.8%). Thirty-three preoperative features were integrated into a multimodal feature vector for ML analyses (Graphical abstract ). Relapsed cases were significantly enriched in advanced FIGO stages (II–IV), non-endometrioid histology (serous and carcinosarcoma), and positive LVSI. Tumors >25 mm, positive peritoneal cytology, deep myometrial invasion, and molecular alterations (p53abn, MMRd) were more frequent in relapsed patients. On the other hand, POLEmut tumors showed the lowest relapse rates. 
Additional relapse-associated features included p16 positivity, E-cadherin loss, vimentin expression, ARID1A loss, elevated CA125, and increased thrombocyte and leucocyte counts. Full demographic and clinicopathological comparisons are presented in Table 2 . View this table: View inline View popup Table 2. Demographic and clinicopathological characteristics of patients (n=784). 3.2 Feature Selection and Model Inputs Recursive Feature Elimination (RFE) identified the key preoperative features for each model, with systemic biomarkers (CA125, thrombocytes, leucocytes) and invasion-related variables (myometrial depth, LVSI, cytology) consistently ranked highest. Traditional risk modifiers (BMI, diabetes, smoking) were rarely selected. For the risk of relapse, the TP53 + MMRd model achieved a theoretical F1 score of 0.512 using 19 features, including myometrial invasion, CA125, advanced stage (II–IV), thrombocyte count, and histology. Similar performance was observed with the applied molecular classification (F1 score = 0.492, 22 features) and the ESGO molecular classification (F1 score = 0.528, 23 features), where overlapping predictors included CA125, myometrial invasion, stage, and leucocyte count. The POLE -specific model achieved the highest F1 score among single-subtype analyses (0.557 with 28 features), although feature selection was limited by the sample size of POLE mut tumours. Supplementary Table S2 provides detailed information on the F1 score, the number of features, and their respective names for each molecular classification. In summary, across all analyses, systemic biomarkers (CA125, thrombocytes, leucocytes) and invasion-related variables (myometrial depth, LVSI, cytology) consistently emerged among the top-ranked features, underscoring their value for preoperative risk stratification. 
In contrast, traditional risk modifiers such as BMI, diabetes, and smoking status were rarely selected, suggesting their limited predictive contribution in molecularly stratified cohorts. Following feature selection, the optimal subsets of covariates retained to explain relapse risk were as follows: 19 for the TP53 + MMRd model, 22 for the molecular classification model, 28 for the POLE model, and 23 for the ESGO model ( Supplementary Table S2 ). 3.3 Model Metrics Across the Predictive Model 3.4 Model Performance Comparison Four ML models (RF, SVM, KNN, GBM) were trained across the four stratification strategies (Traditional, ESGO, TP53 + MMRd, and POLE). Performance metrics for the above-mentioned ML models are summarized in Table 3 and visualized in Figure 1A . The POLE model demonstrated the highest discrimination (AUC 0.842) and sensitivity (0.886). In contrast, the Traditional model achieved the best overall accuracy (0.797) and tied with POLE for the top F1 score (0.892), while requiring fewer predictors (22 vs. 28). The TP53 + MMRd model utilized the fewest predictors (19) and delivered competitive sensitivity (0.876) and F1 score (0.872), albeit with slightly lower accuracy (0.759) and AUC (0.804). By contrast, the ESGO model underperformed, with lower discrimination (AUC 0.624) and F1 score (0.519), despite a comparable feature count (23). In summary, these findings highlight a trade-off: the Traditional model delivers a parsimonious and well-balanced solution, whereas the POLE model lays emphasis on sensitivity and discrimination. The TP53 + MMRd model offers a compact, intermediate option. Future updates will incorporate PR-AUC and balanced accuracy once harmonized per-class outputs are accessible. The detailed data for all predictive models with all four ML algorithms are outlined in Supplementary Table S3. Download figure Open in new tab Figure 1. Performance Metrics and Feature Overlap Across Predictive Models. 
(A) Heatmap showing performance metrics (Accuracy, F1 Score, Sensitivity, AUC) for four machine learning algorithms (SVM, RF, KNN, GBM) across molecular subgroups: Traditional (red), TP53 + MMRd (black), POLE (orange), and ESGO (green). Darker shades indicate higher metric values. ( B) Venn diagram illustrates the distribution of overlapping features among the four molecular subgroups. Each segment is annotated with case counts and their percentage representation. A blue gradient indicates density, highlighting both unique and shared cases across subgroup intersections. View this table: View inline View popup Download powerpoint Table 3: Performance of pre-operative predictive models optimized with the best Gradient Boosting (GBM) algorithm. 3.5 Overlap and Feature Distribution Across Models Venn diagram analysis revealed overlapping and unique case distributions across models ( Figure 1B ). The POLE group had the highest number of cases (11), characterized by features such as LVSI, large tumor size, higher ASA score and BMI, variable PD-L1 expression (1–>10%), diabetes mellitus, and positivity for β-catenin, HNFβ, and vimentin. The ESGO group included 7 cases, mainly showing advanced or metastatic status, thrombocytosis, molecular high or intermediate risk, ER positivity, loss of E-cadherin, and a history of smoking. The TP53 + MMRd and Traditional groups each had 1 case, associated with proficient MMRd and p53abn, respectively. Among overlapping categories, Traditional/POLE (1 case) showed positive ARID1A expression. The TP53 + MMRd/Traditional/ESGO group (4 cases) demonstrated LVSI, higher BMI and ASA scores, and larger tumor size. Similarly, TP53 + MMRd/Traditional/POLE (4 cases) was characterized by ER positivity, thrombocytosis, normal E-cadherin, and non-smoking status. The Traditional/ESGO/POLE overlap (2 cases) involved endometrioid G3 tumors with weakened E-cadherin. 
The most complex intersection, TP53 + MMRd/Traditional/ESGO/POLE (10 cases), showed high-risk clinicopathologic features including stage II–IV disease, myometrial invasion, elevated CA125, positive CD171 and cytology, older age, leukocytosis, PR positivity, low hemoglobin, and non-endometrioid histology. Full details about the feature are presented in Supplementary Table S4. 3.6 Traditional Model: Class-Specific Performance Per-class performance metrics for the traditional models revealed the expected imbalance pattern ( Figure 2A ) . The model demonstrated optimal performance for the No-Relapse class (F1=0.892, precision=0.868, recall=0.918, PR-AUC=0.935; accuracy=0.829). Performance for the Early Relapse class was moderate (F1=0.615, precision=0.571, recall=0.667, PR-AUC=0.477; accuracy=0.937), reflecting reasonable detection with some false positives. The Late-Relapse class posed the greatest challenge (F1=0.308, precision=0.400, recall=0.250, PR-AUC=0.266; accuracy=0.829), consistent with class rarity and overlap with other phenotypes. Overall, these results support the importance of reporting PR-AUC and F1 alongside ROC-AUC, and they suggest the implementation of targeted strategies, such as rebalancing or multimodal features, to enhance minority-class detection. Per-class performance of the Traditional model across relapse timing is presented in Supplementary Table S5. Download figure Open in new tab Figure 2. Class-Level Performance and Confusion Matrix for the Traditional Model. (A) Grouped bars display accuracy, F1, PR-AUC, precision, and recall for Early Relapse, Late Relapse, and No Relapse classes. The highest performance is observed for the No-Relapse class (F1 0.892; PR-AUC 0.935), intermediate for Early Relapse (F1 0.615; PR-AUC 0.477), and lowest for Late Relapse (F1 0.308; PR-AUC 0.266). These patterns reflect both the underlying class imbalance and the greater challenge of distinguishing Late Relapse events. 
(B) Confusion matrix for relapse stages (No-Relapse, Early Relapse, Late Relapse) with row-normalized recall percentages. Rows indicate true labels, while columns indicate predicted labels. The recall is strong for No-Relapse, moderate for Early Relapse (often misclassified as No-Relapse), and weak for Late Relapse (mostly misclassified as No-Relapse). Darker colors indicate higher row-normalized percentages. The confusion matrix corroborates these class-specific metrics ( Figure 2B ). Notably, the ‘No-Relapse’ category predominantly occupies the diagonal, with most instances correctly classified. The ‘Early Relapse’ category exhibits a moderate true-positive block, with most remaining errors misclassified as ‘No-Relapse.’ The ‘Late Relapse’ category has the least populated true-positive cell, with misclassifications primarily occurring as ‘No-Relapse’ and, to a lesser extent, as ‘Early Relapse.’ This asymmetric error pattern (Late → Early/No) aligns with class imbalance and the lower recall for late events, whereas early events are detected with greater reliability, and ‘No-Relapse’ is identified with high recall. 3.7 XAI-Based Model Interpretability: Traditional Model SHAP analyses demonstrated class-specific patterns that aligned with the overall feature ranking. The global importance was highlighted by the mean absolute SHAP values (organized by class), which pinpointed FIGO stage, E-cadherin status, tumor size, and LVSI as the primary predictors. These were followed by ARID1A, PR, and peritoneal cytology. There were also smaller contributions from hematologic/host factors such as thrombocytes, BMI, leucocytes, and hemoglobin, as well as CA125, myometrial invasion, and ASA score. Notably, these variables had varying levels of influence across different classes, as illustrated by the stacked bar profiles ( Figure 3A ). Download figure Open in new tab Figure 3. SHAP-Based Interpretation of Relapse Risk in the Traditional Model. 
(A) Global SHAP summary plot showing mean absolute SHAP values, ranked by feature importance and stacked by relapse class. This visualization highlights the most influential predictors across all classes. (B–D) Class-specific SHAP beeswarm plots for Early Relapse, Late Relapse, and No Relapse, respectively. Each point represents an individual patient; color indicates the feature value (red = high, blue = low), while horizontal position reflects the magnitude and direction of the feature’s impact on the predicted class probability. These plots illustrate how specific features contribute to relapse risk stratification at the patient level. Early Relapse (≤6 months) was primarily driven by higher stage (II–IV), positive peritoneal cytology, thrombocytosis, grade-3 endometrioid histology (G3), deep myometrial invasion, and ARID1A loss, with elevated CA125 providing additional risk. Protective features included PR positivity (>10%), preserved E-cadherin, and smaller tumor size ( Figure 3B ). Late-relapse class (>6 months) was most strongly linked to LVSI positivity, larger tumor size, and higher stage, supported by ARID1A loss, G3 endometrioid histology, and host factors such as higher BMI/ASA, leukocytosis, and lower hemoglobin. In the Late-Relapse class, Stage I status, preserved E-cadherin, and smaller tumor size served as protective features, each contributing negative SHAP values. The latter implies that they decreased the model’s log-odds and predicted probability of Late Relapse (shifting probability toward Early/No Relapse) when other inputs were held constant ( Figure 3C ) . In the No-Relapse category, factors that favored predictions of No Relapse included Stage I disease, preserved E-cadherin, PR levels above 10%, low CA125, negative cytology, absence of LVSI, and smaller tumors. In contrast, Stage II–IV, positive LVSI, ARID1A loss, larger tumors, and positive cytology decreased the likelihood of remaining free from recurrence. 
Early Relapse is associated with tumor burden and biological aggressiveness, such as advanced stage, positive cytology, elevated CA125, and invasion/size. Late Relapse is more closely linked to anatomic spread and size, including advanced LVSI, larger diameter, and higher stage, while No-Relapse reflects the opposite profile ( Figure 3D ) . Collectively, the panels provide a coherent and clinically intuitive distinction of relapse phenotypes. Early Relapse is primarily driven by tumour biology and burden, while Late Relapse is more associated with anatomic spread and size. In contrast, the No-Relapse profile reflects the inverse of these features. This alignment between SHAP-based interpretability and established clinical expectations offers clinical plausibility and bolsters confidence in the model’s predictive framework. 3.8 POLE Model: Class-Specific Performance Per-class performance metrics for the POLE model revealed a performance pattern consistent with the traditional model, largely influenced by class imbalance ( Figure 4A ). The model achieved its strongest performance for the No-Relapse class (F1 = 0.892, Precision = 0.886, recall = 0.897, PR-AUC = 0.944; accuracy = 0.835), indicating stable generalization and consistent identification of patients without relapse. The Early Relapse class showed moderate discrimination (F1 = 0.593, Precision = 0.533, recall = 0.667, PR-AUC = 0.649; accuracy = 0.893), indicating balanced sensitivity and precision, with a modest improvement in PR-AUC compared to the traditional model. The Late Relapse class exhibited the lowest performance (F1 = 0.273, Precision = 0.333, recall = 0.231, PR-AUC = 0.208; accuracy = 0.845), reflecting continued limitations in minority-class detection. Collectively, these findings reinforce the need for targeted modeling strategies such as temporal reweighting or synthetic data augmentation to enhance recognition of rare relapse patterns, particularly late events. 
Per-class performance of the POLE model across relapse timing is presented in Supplementary Table S5. Download figure Open in new tab Figure 4. Class-Level Performance and Confusion Matrix for the POLE Model. (A) Grouped bar chart displaying performance metrics — Accuracy, F1 Score, Precision-Recall AUC (PR-AUC), Precision, and Recall for each relapse class: Early Relapse, Late Relapse, and No Relapse. The model showed highest performance for the No-Relapse class (F1 = 0.891; PR-AUC = 0.944), moderate performance for Early Relapse (F1 = 0.592; PR-AUC = 0.649), and lowest for Late Relapse (F1 = 0.272; PR-AUC = 0.208). These results reflect both class imbalance and the increased difficulty in identifying Late Relapse events. (B) Confusion matrix for the POLE model predictions (Early Relapse, Late Relapse, No Relapse), displaying row-normalized recall percentages. Rows correspond to true labels and columns to predicted labels. Recall is strongest for No Relapse, moderate for Early Relapse (often misclassified as No Relapse), and lowest for Late Relapse, which are commonly misclassified as Early or No Relapse. Darker shading indicates higher recall frequency. The confusion matrix for the POLE model ( Figure 4B ) illustrates the class-specific trends. Notably, the recall was strongest for the No-Relapse class, moderate for Early Relapse (often misclassified as No Relapse), and weakest for Late Relapse (frequently confused with both Early and No Relapse). The dominance of correct No-Relapse predictions forms a dense diagonal cluster, while the asymmetric misclassification of Late Relapse underscores both data imbalance and model conservatism. Despite this, the slightly higher PR-AUC for Early Relapse suggests improved precision–recall trade-offs relative to the traditional model. 3.9 XAI-Based Model Interpretability: POLE Model The SHAP patterns for the POLE model ( Figure 5 ) closely resemble those of the Traditional model ( Figure 3 ). 
On a global scale, FIGO stage, tumor size, LVSI, and myometrial invasion emerged as the primary contributors by mean SHAP ( Figure 5A ). Conversely, CA125 and peritoneal cytology were associated with increased risk, while progesterone receptor (PR) >10% shifted predictions towards No Relapse ( Figure 5B ). In terms of class-specific SHAP, Early Relapse was associated with higher stage, positive cytology, and elevated CA125 levels. In contrast, Late Relapse was linked to positive LVSI and larger tumor size ( Figure 5C ). Tumor stage I, preserved E-cadherin, and smaller tumor sizes acted as protective factors against Late Relapse, showing negative SHAP contributions that reduced the model’s probability of Late Relapse and directed predictions toward No Relapse ( Figure 5D ). Compared to the Traditional model, POLE exhibited a slight reweighting, highlighting the influence of size/LVSI for Late Relapse and cytology/CA125 for Early Relapse, while maintaining the early versus late pattern. Download figure Open in new tab Figure 5. SHAP-Based Interpretation of Relapse Risk in the POLE Model. (A) Global SHAP summary plot displaying mean absolute SHAP values, ranked by overall feature importance and stacked by relapse class. This visualization highlights the most influential predictors contributing to relapse risk across the POLE subgroup. (B–D) Class-specific SHAP beeswarm plots for Early Relapse, Late Relapse, and No Relapse, respectively. Each point represents an individual patient; color indicates the feature value (red = high, blue = low), while horizontal position reflects the magnitude and direction of the feature’s impact on the predicted class probability. These plots provide insight into how specific features drive model predictions at the patient level, supporting individualized risk assessment. 4. 
Discussion 4.1 Study Overview and Clinical Context This study demonstrates that preoperative multimodal data, when analyzed through interpretable ML, can effectively predict relapse risk and timing in EC. By analyzing a large, molecularly stratified cohort of 784 patients, we developed four complementary ML models that integrate clinicopathological, molecular, and systemic features. These models offer actionable insights for individualized risk stratification prior to surgery or definitive histopathological staging. 4.2 Model Performance and Biological Interpretability Among all the molecular models, the Traditional model achieved the highest overall accuracy (0.797) and demonstrated balanced performance, while the POLE-based model excelled in sensitivity (0.886) and discrimination (AUC 0.842). The TP53 + MMRd model, which focuses on high-risk molecular subsets, maintained competitive performance with fewer variables, underscoring the biological significance of molecularly driven compact modeling. In contrast, the ESGO-based classifier exhibited limited discrimination (AUC 0.624), indicating that static risk categories may underrepresent the complexity of relapse heterogeneity. Our SHAP analyses revealed that relapse timing reflects distinct biological patterns: Early Relapse is primarily driven by tumor burden and systemic inflammation (advanced stage, positive cytology, high CA125, thrombocytosis), whereas Late Relapse is associated with invasion-related features (LVSI, tumor size, ARID1A loss). Predictions of No Relapse were characterized by PR positivity, preserved E-cadherin, and early-stage disease, reinforcing the biological coherence of the model outputs. This mechanistic interpretability enhances clinical confidence and provides actionable decision support. 
4.3 Comparison with Existing Literature Prior prognostic tools in EC have mainly relied on postoperative clinicopathological variables such as FIGO stage, tumor grade, and LVSI, which inadequately capture the heterogeneity of high-risk molecular subtypes ( Concin et al., 2021 ; Oaknin et al., 2022 ). Incorporation of TCGA-based molecular classifiers into WHO/ESGO/FIGO systems has markedly improved risk stratification, yet predictive accuracy for relapse remains suboptimal, particularly in NSMP, p53abn, and carcinosarcoma cases ( León-Castillo et al., 2025 ). In fact, molecular context significantly influences prognosis. The ProMisE classifiers enable the practical implementation of TCGA subgroups ( Talhouk et al., 2015 ), and PORTEC-3 showed that p53abn cases, while associated with poor outcomes, benefited from chemoradiotherapy over radiotherapy alone ( de Boer et al., 2019 ). Recent cohort studies further confirmed distinct relapse patterns across molecular subtypes, reinforcing the need for molecularly informed prediction models ( Lindemann et al., 2025 ; Loukovaara et al., 2025a ). Notably, semiquantitative LVSI remains prognostically relevant within endometrioid EC regardless of molecular classification ( Loukovaara et al., 2025b ), suggesting that traditional histopathological markers still hold relevance when interpreted in a molecular context, consistent with our findings. Interestingly, the overlap and feature distribution across models highlight both shared and distinct prognostic profiles. Notably, the POLE group, despite its generally favorable prognosis ( Liu et al., 2017 ), exhibited several high-risk features such as LVSI, elevated BMI and ASA scores, and variable PD-L1 expression, suggesting that even molecularly favorable subtypes may harbor complex clinicopathologic traits. 
The ESGO group, enriched for advanced disease and molecular high-risk status, aligns with prior findings linking ER positivity and E-cadherin loss to aggressive behavior ( Murali et al., 2019 ). Overlapping categories, particularly the TP53 + MMRd/Traditional/ESGO/POLE cluster, revealed a convergence of high-risk features, including stage II–IV disease, myometrial invasion, and elevated CA125 — traits previously associated with poor outcomes ( de Boer et al., 2019 ). These intersections underscore the value of multimodal profiling in capturing relapse risk beyond single-model stratification. Recent ML models such as TJHPEC ( Wang et al., 2022 ), NU-CATS ( Zheng et al., 2023 ), and im4MEC ( Fremond et al., 2023 ) have shown promise but often lack integration of multimodal biomarkers or preoperative applicability. While HECTOR integrated whole-slide histopathology with stage across eight EC cohorts (including PORTEC trials) to deliver strong prognostic performance with therapy-relevant stratification ( Volinsky-Fremond et al., 2024 ), our framework complements these efforts by offering infrastructure-light, interpretable predictions at the patient level. Similarly, a large multi-institutional Israeli XGBoost model (n≈1,935) demonstrated feasibility with SHAP-informed relapse prediction (AUC ≈ 0.84) ( Ohad Houri et al., 2022 ), while MRI radiomics models integrating intratumoral and peritumoral features predict relapse with decision-curve utility ( Li et al., 2025 ). Beyond EC, ML-based relapse prediction in breast cancer has shown that hybrid mechanistic and ML models improve calibration for Late Relapses ( Nicolò et al., 2020 ), suggesting opportunities for similar approaches in EC. To our knowledge, by incorporating systemic and immunohistochemical markers alongside molecular classification, our approach aligns with emerging evidence supporting the value of multimodal inputs for relapse prediction ( Karpel et al., 2023 ; Njoku et al., 2022 ). 
Notably, the identification of ARID1A and p16 as key relapse predictors aligns with prior studies linking these biomarkers to aggressive EC phenotypes ( Liu et al., 2017 ; Murali et al., 2019 ). 4.4 Interpretability and Clinical Implications SHAP-based interpretability provided transparent, class-specific insights into model predictions by highlighting key biomarkers and risk factors, such as ARID1A loss, elevated CA125, thrombocytosis, p16 expression, FIGO stage, LVSI, cytology, tumor size, and E-cadherin status. These features aligned well with established molecular and staging frameworks, reinforcing the biological plausibility of the models. Importantly, SHAP profiles enabled differentiation between relapse phenotypes. Patients flagged as high risk for Early Relapses, often driven by tumor burden and systemic inflammation, may benefit from intensified imaging or systemic therapy. Conversely, those with Late-Relapse signals, typically associated with anatomic spread, may require extended surveillance. This level of interpretability supports personalized treatment planning and enhances clinical trust in ML-based decision support. Embedding these models into electronic health records and generating patient-level risk summaries could facilitate their integration into multidisciplinary care. This approach is consistent with evolving ESGO–ESTRO–ESP and FIGO 2023 guidelines, which increasingly emphasize molecular stratification in EC management ( Berek et al., 2023 ; Concin et al., 2025 ; Maria-Bianca Anca-Stanciu et al., 2025 ). For aggressive subtypes such as carcinosarcoma, which consistently showed high predicted relapse risk and distinct biomarker profiles, these models may be particularly impactful. 
Their clinical utility could mirror precision strategies already in use, such as trastuzumab for HER2-positive uterine serous carcinoma ( Fader et al., 2020 ; Fader et al., 2018 ), demonstrating how biomarker-informed ML tools can personalize care and improve outcomes. Our models achieved an AUC of up to 0.842, comparable to the externally validated ENDORISK-2 framework for predicting lymph-node metastasis in EC (AUC ≈ 0.85). Both approaches highlight the value of integrating molecular and clinicopathological data in preoperative assessment. While ENDORISK-2 informs nodal management, our models focus on relapse timing, offering complementary guidance for early treatment planning and surveillance before surgery ( Lombaers et al., 2025 ). 4.5 Strengths and Limitations The key strengths of this study include the use of a large, well-characterized cohort, exclusive reliance on preoperative data, integration of systemic, immunohistochemical, and molecular data, and explainable AI outputs ensuring clinical interpretability. Limitations include the single-center retrospective design and class imbalance affecting Late Relapse prediction. Additionally, while SHAP improves interpretability, it is sensitive to feature selection and model architecture, which may influence the stability and generalizability of feature importance rankings ( Ponce-Bobadilla et al., 2024 ). External validation and prospective integration into clinical workflows are needed to confirm generalizability. 4.6 Conclusions and Future Directions We developed preoperative, interpretable ML models capable of predicting relapse timing in EC, aligning with molecular risk frameworks. Stage, LVSI, tumor size, myometrial invasion, CA125, cytology, and hormone-receptor status emerged as key predictors across algorithms, showing clinically coherent effects. 
Gradient boosting with SHAP explanations provides patient-level transparency, supporting decision-making for surveillance and adjuvant therapy, particularly in molecularly adverse groups and aggressive histology. To build on these findings, future work should focus on validating the models in external, multi-center cohorts and integrating them into prospective clinical workflows. Combining clinicopathological data with radiomics, liquid biopsy, and whole-slide pathology could enhance predictive accuracy (e.g., HECTOR-like and radiomics pipelines) and enable trial-based validation ( Li et al., 2025 ; Volinsky-Fremond et al., 2024 ). Additionally, incorporating relapse site prediction, such as regional versus distant recurrence, could further refine surveillance strategies and therapeutic planning. Adaptive learning frameworks may allow real-time updates as new data becomes available, improving clinical responsiveness. Embedding explainable ML tools into electronic health records and developing clinician-friendly interfaces will be key to adoption. Finally, ethical considerations such as transparency, patient communication, and equitable access must be addressed to ensure responsible implementation in oncological care. Credit Authorship Contribution Statement Conceptualization, investigation, methodology: SVM, MK, AP, RB, AS, ML, VM. Data curation, Resources: MK, ML, AP, RB. Formal analysis: SVM, VM. Visualization, investigation: SVM, MK, VM. Writing – original draft preparation: SVM, MK, VM. Writing – review & editing: SVM, MK, AP, RB, AS, ML, VM. Supervision: VM, ML. Funding acquisition, project administration: RB, AS, VM. Code Availability The scripts used to perform the different analyses described in this paper can be found in https://github.com/SergioVela17/Preoperative-Relapse-Prediction-in-Molecularly-Stratified-Endometrial-Cancer-Finnish-Cohort-Study . 
Funding Sources This work was funded by Helsinki University Hospital research funds (TYH2020302) and Cancer Foundation Finland (WBS4708719), Estonian Research Council grant (PRG1076, project nr 2021-2027.1.01.24-0750), and Horizon Europe (NESTOR, grant no. 101120075). MK received personal grants from the Finnish Cultural Foundation and K. Albin Johansson Foundation. Declaration of Competing Interest None declared. Ethics Statement Ethical approval was obtained from the Helsinki University Hospital Institutional Review Board (HUS/491/2021) and the Finnish Medicines Agency (FIMEA/2021/005153). Consent for Publication Informed consent was waived for this retrospective cohort. Supplementary Files Supplementary Table S1. Details of immunohistochemistry, scoring, and interpretation Supplementary Table S2. Distribution of Recursive feature elimination (RFE) derived data Supplementary Table S3. Performance metrics of pre-operative predictive models derived from all ML algorithms. Supplementary Table S4. Overlapping molecular and clinical features across the predictive model via Venn diagram. Supplementary Table S5. Per-class performance metrics for the Traditional and POLE models Data Availability The datasets used and/or analyzed during the current study are available from the corresponding author on reasonable request. Acknowledgement We thank Annikki Löfhjelm for the technical support. Funder Information Declared Helsinki University Hospital research funds , TYH2020302 Cancer Foundation Finland , WBS4708719 Estonian Research Council grant , PRG1076, project nr 2021-2027.1.01.24-0750 Horizon Europe , NESTOR, grant no. 101120075 Finnish Cultural Foundation, https://ror.org/027xav248 K. Albin Johanssons stiftelse, https://ror.org/03arxxe13 Footnotes ↵ ¥ Shared first authorship ↵ * Shared last authorship References ↵ Backes , F.J. , Haag , J. , Cosgrove , C.M. , Suarez , A. , Cohn , D.E. , Goodfellow , P.J ., 2018 . 
Mismatch repair deficiency identifies patients with high-intermediate–risk (HIR) endometrioid endometrial cancer at the highest risk of recurrence: A prognostic biomarker . Cancer 125 , 398 – 405 . doi: 10.1002/cncr.31901 OpenUrl CrossRef PubMed ↵ Bast , R.C. , Feeney , M. , Lazarus , H. , Nadler , L.M. , Colvin , R.B. , Knapp , R.C ., 1981 . Reactivity of a monoclonal antibody with human ovarian carcinoma . Journal of Clinical Investigation 68 , 1331 – 1337 . doi: 10.1172/jci110380 OpenUrl CrossRef PubMed Web of Science ↵ Beavis , A.L. , Fader , A.N ., 2022 . Surveillance Strategies in Endometrial Cancer Care: Why Less Represents Progress . Journal of clinical oncology 40 , 3790 – 3795 . doi: 10.1200/jco.22.01551 OpenUrl CrossRef PubMed ↵ Berek , J.S. , Matias-Guiu , X. , Carien Creutzberg , Fotopoulou , C. , Gaffney , D. , Kehoe , S. , Lindemann , K. , Mutch , D. , Concin , N., 2023 . FIGO staging of endometrial cancer: 2023 . International Journal of Gynecology and Obstetrics 162 . doi: 10.1002/ijgo.14923 OpenUrl CrossRef PubMed ↵ Camelia Alexandra Coada , Santoro , M. , Vladislav Zybin , Marco Di Stanislao , Giulia Paolani , Modolon , C. , Stella Di Costanzo , Genovesi , L. , Tesei , M. , Antonio De Leo , Ravegnini , G. , Dario De Biase , Alessio Giuseppe Morganti , Lovato , L. , Pierandrea De Iaco , Strigari , L. , Anna Myriam Perrone , 2023 . A Radiomic-Based Machine Learning Model Predicts Endometrial Cancer Recurrence Using Preoperative CT Radiomic Features: A Pilot Study . Cancers 15 , 4534 – 4534 . doi: 10.3390/cancers15184534 OpenUrl CrossRef PubMed ↵ Cantrell , L.A. , Blank , S.V. , Duska , L.R ., 2015 . Uterine carcinosarcoma: A review of the literature . Gynecologic Oncology 137 , 581 – 588 . doi: 10.1016/j.ygyno.2015.03.041 OpenUrl CrossRef PubMed ↵ Capozzi , V.A. , Monfardini , L. , Maglietta , G. , Barresi , G. , De Finis , A. , Rosati , A. , Vargiu , V. , Cosentino , F. , Sozzi , G. , Chiantera , V. , Bogani , G. , Carnelli , M. , Scambia , G. 
, Fanfani , F. , Ghi , T. , Berretta , R. , 2024 . Pattern of recurrence in endometrial cancer. The murderer always returns to the scene of the crime. European journal of surgical oncology : the journal of the European Society of Surgical Oncology and the British Association of Surgical Oncology 50 , 107985 . doi: 10.1016/j.ejso.2024.107985 OpenUrl CrossRef ↵ Clarke , M.A. , Devesa , S.S. , Hammer , A. , Wentzensen , N ., 2022 . Racial and Ethnic Differences in Hysterectomy-Corrected Uterine Corpus Cancer Mortality by Stage and Histologic Subtype . JAMA Oncology 8 , 895 . doi: 10.1001/jamaoncol.2022.0009 OpenUrl CrossRef PubMed ↵ Concin , N. , Matias-Guiu , X. , Cibula , D. , Colombo , N. , Creutzberg , C.L. , Ledermann , J. , Mirza , M.R. , Vergote , I. , Abu-Rustum , N.R. , Bosse , T. , Chargari , C. , Espenel , S. , Fagotti , A. , Fotopoulou , C. , Gatius , S. , González-Martin , A. , Lax , S. , Levy , B. , Lorusso , D. , Macchia , G ., 2025 . ESGO–ESTRO– ESP guidelines for the management of patients with endometrial carcinoma: update 2025 . The Lancet Oncology 26 , e423 – e435 . doi: 10.1016/s1470-2045(25)00167-6 OpenUrl CrossRef PubMed ↵ Concin , N. , Matias-Guiu , X. , Vergote , I. , Cibula , D. , Mirza , M.R. , Marnitz , S. , Ledermann , J. , Bosse , T. , Chargari , C. , Fagotti , A. , Fotopoulou , C. , Martin , A.G. , Lax , S. , Lorusso , D. , Marth , C. , Morice , P. , Nout , R.A. , O’Donnell , D. , Querleu , D. , Raspollini , M.R ., 2021 . ESGO/ESTRO/ESP guidelines for the management of patients with endometrial carcinoma . International Journal of Gynecologic Cancer 31 . doi: 10.1136/ijgc-2020-002230 OpenUrl Abstract / FREE Full Text ↵ Cong , R. , Li , M. , Xu , W. , Ma , X. , Wang , S ., 2023 . Development and validation of a prognostic nomogram model incorporating routine laboratory biomarkers for preoperative patients with endometrial cancer . BMC Cancer 23 . doi: 10.1186/s12885-023-11497-8 OpenUrl CrossRef ↵ Coudray , N. , Ocampo , P.S. 
, Sakellaropoulos , T. , Narula , N. , Snuderl , M. , Fenyö , D. , Moreira , A.L. , Razavian , N. , Tsirigos , A ., 2018 . Classification and mutation prediction from non–small cell lung cancer histopathology images using deep learning . Nature Medicine 24 , 1559 – 1567 . doi: 10.1038/s41591-018-0177-5 OpenUrl CrossRef PubMed ↵ Crosbie , E.J. , Kitson , S.J. , McAlpine , J.N. , Mukhopadhyay , A. , Powell , M.E. , Singh , N ., 2022 . Endometrial cancer . The Lancet 399 , 1412 – 1428 . doi: 10.1016/S0140-6736(22)00323-3 OpenUrl CrossRef PubMed ↵ de Boer , S.M. , Powell , M.E. , Mileshkin , L. , Katsaros , D. , Bessette , P. , Haie-Meder , C. , Ottevanger , P.B. , Ledermann , J.A. , Khaw , P. , D’Amico , R. , Fyles , A. , Baron , M.-H. , Jürgenliemk-Schulz , I.M. , Kitchener , H.C. , Nijman , H.W. , Wilson , G. , Brooks , S. , Gribaudo , S. , Provencher , D. , Hanzen , C. , 2019 . Adjuvant chemoradiotherapy versus radiotherapy alone in women with high-risk endometrial cancer (PORTEC-3): patterns of recurrence and post-hoc survival analysis of a randomised phase 3 trial . The Lancet Oncology 20 , 1273 – 1285 . doi: 10.1016/s1470-2045(19)30395-x OpenUrl CrossRef PubMed ↵ Fader , A.N. , Roque , D.M. , Siegel , E. , Buza , N. , Hui , P. , Abdelghany , O. , Chambers , S. , Secord , A.A. , Havrilesky , L. , O’Malley , D.M. , Backes , F.J. , Nevadunsky , N. , Edraki , B. , Pikaart , D. , Lowery , W. , ElSahwi , K. , Celano , P. , Bellone , S. , Azodi , M. , Litkouhi , B ., 2020 . Randomized Phase II Trial of Carboplatin–Paclitaxel Compared with Carboplatin–Paclitaxel–Trastuzumab in Advanced (Stage III–IV) or Recurrent Uterine Serous Carcinomas that Overexpress Her2/Neu ( NCT01367002 ): Updated Overall Survival Analysis . Clinical Cancer Research 26 , 3928 – 3935 . doi: 10.1158/1078-0432.ccr-20-0953 OpenUrl Abstract / FREE Full Text ↵ Fader , A.N. , Roque , D.M. , Siegel , E. , Buza , N. , Hui , P. , Abdelghany , O. , Chambers , S.K. , Secord , A.A. , Havrilesky , L. 
, O’Malley , D.M. , Backes , F. , Nevadunsky , N. , Edraki , B. , Pikaart , D. , Lowery , W. , ElSahwi , K.S. , Celano , P. , Bellone , S. , Azodi , M. , Litkouhi , B ., 2018 . Randomized Phase II Trial of Carboplatin-Paclitaxel Versus Carboplatin-Paclitaxel-Trastuzumab in Uterine Serous Carcinomas That Overexpress Human Epidermal Growth Factor Receptor 2/neu . Journal of Clinical Oncology: Official Journal of the American Society of Clinical Oncology 36 , 2044 – 2051 . doi: 10.1200/JCO.2017.76.5966 OpenUrl CrossRef PubMed ↵ Fremond , S. , Andani , S. , Barkey Wolf , J. , Dijkstra , J. , Melsbach , S. , Jobsen , J.J. , Brinkhuis , M. , Roothaan , S. , Jurgenliemk-Schulz , I. , Lutgens , L.C.H.W. , Nout , R.A. , van der Steen-Banasik , E.M. , de Boer , S.M. , Powell , M.E. , Singh , N. , Mileshkin , L.R. , Mackay , H.J. , Leary , A. , Nijman , H.W. , Smit , V.T.H.B.M. , 2023 . Interpretable deep learning model to predict the molecular classification of endometrial cancer from haematoxylin and eosin-stained whole-slide images: a combined analysis of the PORTEC randomised trials and clinical cohorts . The Lancet. Digital Health 5 , e71 – e82 . doi: 10.1016/S2589-7500(22)00210-2 OpenUrl CrossRef ↵ Fu , Y. , Jung , A.W. , Torne , R.V. , Gonzalez , S. , Vöhringer , H. , Shmatko , A. , Yates , L.R. , Jimenez-Linan , M. , Moore , L. , Gerstung , M ., 2020 . Pan-cancer computational histopathology reveals mutations, tumor composition and prognosis . Nature Cancer 1 , 800 – 810 . doi: 10.1038/s43018-020-0085-8 OpenUrl CrossRef PubMed ↵ G. Bogani , Monk , B.J. , Powell , M.A. , Westin , S.N. , B. Slomovitz , Moore , K.N. , Eskander , R.N. , F. Raspagliesi , M.-P. Barretina-Ginesta , Colombo , N. , Mirza , M.R ., 2024 . Adding immunotherapy to first-line treatment of advanced and metastatic endometrial cancer . Annals of oncology 35 , 414 – 428 . doi: 10.1016/j.annonc.2024.02.006 OpenUrl CrossRef PubMed ↵ Gaffney , D. , Matias-Guiu , X. , Mutch , D. , Scambia , G. 
, Carien Creutzberg , Fotopoulou , C. , Berek , J.S. , Concin , N. , 2024 . 2023 FIGO staging system for endometrial cancer: The evolution of the revolution . Gynecologic oncology 184 , 245 – 253 . doi: 10.1016/j.ygyno.2024.02.002 OpenUrl CrossRef PubMed ↵ Höhn , A.K. , Brambs , C.E. , Hiller , G.G.R. , May , D. , Schmoeckel , E. , Horn , L.-C ., 2021 . 2020 WHO Classification of Female Genital Tumors . Geburtshilfe und Frauenheilkunde 81 , 1145 – 1153 . doi: 10.1055/a-1545-4279 OpenUrl CrossRef PubMed ↵ Karpel , H. , Slomovitz , B.M. , Coleman , R.L. , Bhavana Pothuri , 2023 . Biomarker-driven therapy in endometrial cancer . International Journal of Gynecological Cancer 33 , 343 – 350 . doi: 10.1136/ijgc-2022-003676 OpenUrl Abstract / FREE Full Text ↵ Khatun , M. , Pasanen , A. , Kanerva , A. , Koivisto-Korander , R. , Tuomi , T. , Bützow , R. , Loukovaara , M ., 2025 . PPP2R1A mutation status as a predictive and prognostic factor in molecularly characterized endometrial carcinoma: a cohort study . International journal of gynecological cancer: official journal of the International Gynecological Cancer Society 35 , 101934 . doi: 10.1016/j.ijgc.2025.101934 OpenUrl CrossRef PubMed ↵ Khatun , M. , Urpilainen , E. , Ahtikoski , A. , Arffman , R.K. , Pasanen , A. , Puistola , U. , Tapanainen , J.S. , Andersson , L.C. , Butzow , R. , Loukovaara , M. , Piltonen , T.T ., 2021 . Low Expression of Stanniocalcin 1 (STC-1) Protein Is Associated With Poor Clinicopathologic Features of Endometrial Cancer . Pathology oncology research: POR 27 , 1609936 . doi: 10.3389/pore.2021.1609936 OpenUrl CrossRef PubMed ↵ Kolehmainen , A.M. , Pasanen , A. , Tuomi , T. , Koivisto-Korander , R. , Butzow , R. , Loukovaara , M ., 2019 . American Society of Anesthesiologists physical status score as a predictor of long-term outcome in women with endometrial cancer . International Journal of Gynecological Cancer 29 , 879 – 885 . 
doi: 10.1136/ijgc-2018-000118 OpenUrl Abstract / FREE Full Text ↵ Kommoss , S. , McConechy , M.K. , Kommoss , F. , Leung , S. , Bunz , A. , Magrill , J. , Britton , H. , Kommoss , F. , Grevenkamp , F. , Karnezis , A. , Yang , W. , Lum , A. , Krämer , B. , Taran , F. , Staebler , A. , Lax , S. , Brucker , S.Y. , Huntsman , D.G. , Gilks , C.B. , McAlpine , J.N ., 2018 . Final validation of the ProMisE molecular classifier for endometrial carcinoma in a large population-based case series . Annals of Oncology 29 , 1180 – 1188 . doi: 10.1093/annonc/mdy058 OpenUrl CrossRef PubMed ↵ Lee , M. , Yoon , H. , Kim , U. , Kang , J. , Han , Y.B. , Lee , K.H. , Lee , S.J. , Hong , S.H. , Suh , D.H. , Kim , K. , No , J.H. , Kim , Y.B. , Kim , H. , Lee , A ., 2025 . Improved Prognostic Stratification With 2023 International Federation of Gynecology and Obstetrics Staging in Endometrial Cancer Reflecting Poor Prognosis of Aggressive Histological Types and p53 Abnormality . Laboratory investigation; a journal of technical methods and pathology 105 , 104189 . doi: 10.1016/j.labinv.2025.104189 OpenUrl CrossRef PubMed ↵ León-Castillo , A. , Horeweg , N. , Peters , E.E.M. , Ter Haar , N. , Smit , V.T.H.B.M. , de Kroon , C.D. , Boennelycke , M. , Hogdall , E. , Hogdall , C. , Nout , R.R.A. , Creutzberg , C.L. , Bosse , T. , Ortoft , G. , 2025 . Pattern of recurrence of the molecular subgroups in stage I high-grade endometrial cancer . Gynecologic oncology 197 , 43 – 50 . doi: 10.1016/j.ygyno.2025.04.576 OpenUrl CrossRef PubMed ↵ León-Castillo , A. , 2023 . Update in the molecular classification of endometrial carcinoma . International Journal of Gynecological Cancer 33 , 333 – 342 . doi: 10.1136/ijgc-2022-003772 OpenUrl Abstract / FREE Full Text ↵ León-Castillo , A. , Gilvazquez , E. , Nout , R. , Smit , V.T. , McAlpine , J.N. , McConechy , M. , Kommoss , S. , Brucker , S.Y. , Carlson , J.W. , Epstein , E. , Rau , T.T. , Soslow , R.A. , Ganesan , R. , Matias-Guiu , X. , Oliva , E. 
, Harrison , B.T. , Church , D.N. , Gilks , C.B. , Bosse , T. , 2020 . Clinicopathological and molecular characterisation of “multiple-classifier” endometrial carcinomas . The Journal of Pathology 250 , 312 – 322 . doi: 10.1002/path.5373 OpenUrl CrossRef PubMed ↵ Levine , D.A ., 2013 . Integrated genomic characterization of endometrial carcinoma . Nature 497 , 67 – 73 . doi: 10.1038/nature12113 OpenUrl CrossRef PubMed Web of Science ↵ Li , J. , Ma , D. , Chen , X. , Wei , J. , Xu , J. , Zhao , Y. , Gao , Z ., 2025 . Predicting recurrence risk in endometrial cancer: a multisequence MRI intratumoral and peritumoral radiomics nomogram approach . Frontiers in Oncology 15 . doi: 10.3389/fonc.2025.1569729 OpenUrl CrossRef ↵ Lindemann , K. , Kildal , W. , Kleppe , A. , Tobin , K.A.R. , Pradhan , M. , Mascialino , B. , Schneider , D. , Edvardsen , H. , Sørlie , T. , Kristensen , G.B. , Askautrud , H.A ., 2025 . Real-world outcomes in molecular subgroups for patients with advanced or recurrent endometrial cancer treated with platinum-based chemotherapy . International journal of gynecological cancer: official journal of the International Gynecological Cancer Society 35 , 101618 . doi: 10.1016/j.ijgc.2024.101618 OpenUrl CrossRef PubMed ↵ Liu , G. , Xu , P. , Fu , Z. , Hua , X. , Liu , X. , Li , W. , Zhang , M. , Wu , J. , Wen , J. , Xu , J. , Jia , X ., 2017 . Prognostic and Clinicopathological Significance of ARID1A in Endometrium-Related Gynecological Cancers: A Meta-Analysis . Journal of cellular biochemistry 118 , 4517 – 4525 . doi: 10.1002/jcb.26109 OpenUrl CrossRef ↵ Lombaers , M.S. , Reijnen , C. , Sprik , A. , Bretová , P. , Grube , M. , Vrede , S. , Berg , H.F. , Asberger , J. , Colas , E. , Hausnerova , J. , Huvila , J. , Gil-Moreno , A. , Matias-Guiu , X. , Simons , M. , Snijders , M.P.L.M. , Visser , N.C.M. , Kommoss , S. , Weinberger , V. , Amant , F. , Bronsert , P ., 2025 . 
ENDORISK-2: a personalized Bayesian network for preoperative risk stratification in endometrial cancer, integrating molecular classification and preoperative myometrial invasion assessment . European Journal of Cancer 116058 . doi: 10.1016/j.ejca.2025.116058 OpenUrl CrossRef Loukovaara , M. , Pasanen , A. , Bützow , R ., 2025a . Distinct clinical outcomes according to molecular subgroups in relapsed endometrial carcinoma: A cohort study . Gynecologic oncology 201 , 216 – 222 . doi: 10.1016/j.ygyno.2025.08.031 OpenUrl CrossRef PubMed ↵ Loukovaara , M. , Pasanen , A. , Bützow , R ., 2025b . Molecular subgroup-specific prognostic value of semiquantitative lymphovascular space invasion in early-stage endometrioid endometrial cancer . Gynecologic oncology 197 , 96 – 101 . doi: 10.1016/j.ygyno.2025.04.589 OpenUrl CrossRef PubMed ↵ Lundberg , S. , Allen , P. , Lee , S.-I ., 2017 . A Unified Approach to Interpreting Model Predictions ↵ Maria-Bianca Anca-Stanciu , Manu , A. , Olinca , M.V. , Cătălin Coroleucă , Diana-Elena Comandașu, Ciprian Andrei Coroleuca , Maier , C. , Bratila , E. , 2025 . Comprehensive Review of Endometrial Cancer: New Molecular and FIGO Classification and Recent Treatment Changes . Journal of Clinical Medicine 14 , 1385 – 1385 . doi: 10.3390/jcm14041385 OpenUrl CrossRef PubMed ↵ Murali , R. , Davidson , B. , Fadare , O. , Carlson , J.A. , Crum , C.P. , Gilks , C.B. , Irving , J.A. , Malpica , A. , Matias-Guiu , X. , McCluggage , W.G. , Mittal , K. , Oliva , E. , Parkash , V. , Rutgers , J.K.L. , Staats , P.N. , Stewart , C.J.R. , Tornos , C. , Soslow , R.A ., 2019 . High-grade Endometrial Carcinomas . International Journal of Gynecological Pathology 38 , S40 – S63 . doi: 10.1097/pgp.0000000000000491 OpenUrl CrossRef PubMed ↵ Nicolò , C. , Périer , C. , Prague , M. , Bellera , C. , MacGrogan , G. , Saut , O. , Benzekry , S ., 2020 . Machine Learning and Mechanistic Modeling for Prediction of Metastatic Relapse in Early-Stage Breast Cancer . 
JCO Clinical Cancer Informatics 259 – 274 . doi: 10.1200/cci.19.00133 OpenUrl CrossRef ↵ Njoku , K. , Barr , C.E. , Crosbie , E.J ., 2022 . Current and Emerging Prognostic Biomarkers in Endometrial Cancer . Frontiers in Oncology 12 . doi: 10.3389/fonc.2022.890908 OpenUrl CrossRef ↵ Nordin , G. , Mårtensson , A. , Birgitta Swolin , Sandberg , S. , Niels Juel Christensen , Vilhjálmur Þorsteinsson , Leifur Franzson , Veli Kairisto , Savolainen , E. , 2004 . A multicentre study of reference intervals for haemoglobin, basic blood cell counts and erythrocyte indices in the adult population of the Nordic countries . Scandinavian Journal of Clinical & Laboratory Investigation 64 , 385 – 398 . doi: 10.1080/00365510410002797 OpenUrl CrossRef PubMed ↵ Oaknin , A. , Bosse , T.J. , Creutzberg , C.L. , Giornelli , G. , Harter , P. , Joly , F. , Lorusso , D. , Marth , C. , Makker , V. , Mirza , M.R. , Ledermann , J.A. , Colombo , N ., 2022 . Endometrial cancer: ESMO Clinical Practice Guideline for diagnosis, treatment and follow-up† . Annals of Oncology 33 . doi: 10.1016/j.annonc.2022.05.009 OpenUrl CrossRef PubMed ↵ Ohad Houri , Gil , Y. , Ofer Gemer , Limor Helpman , Vaknin , Z. , Lavie , O. , Arie , A.B. , Amit , A. , Levy , T. , Ahmet Namazov , Shachar , I.B. , Atlas , I. , Ilan Bruchim , Ram Eitan , 2022 . Prediction of endometrial cancer recurrence by using a novel machine learning algorithm: An Israeli gynecologic oncology group study . Journal of Gynecology Obstetrics and Human Reproduction 51 , 102466 – 102466 . doi: 10.1016/j.jogoh.2022.102466 OpenUrl CrossRef ↵ Onstad , M.A. , Schmandt , R.E. , Lu , K.H ., 2016 . Addressing the Role of Obesity in Endometrial Cancer Risk, Prevention, and Treatment . Journal of Clinical Oncology 34 , 4225 – 4230 . doi: 10.1200/jco.2016.69.4638 OpenUrl CrossRef PubMed ↵ Pasanen , A. , Ahvenainen , T. , Pellinen , T. , Vahteristo , P. , Loukovaara , M. , Bützow , R ., 2019 . 
PD-L1 Expression in Endometrial Carcinoma Cells and Intratumoral Immune Cells . American Journal of Surgical Pathology 44 , 174 – 181 . doi: 10.1097/pas.0000000000001395 OpenUrl CrossRef ↵ Pasanen , A. , Loukovaara , M. , Ahvenainen , T. , Vahteristo , P. , Bützow , R ., 2021 . Differential impact of clinicopathological risk factors within the 2 largest ProMisE molecular subgroups of endometrial carcinoma . PLOS ONE 16 , e0253472 . doi: 10.1371/journal.pone.0253472 OpenUrl CrossRef PubMed ↵ Pasanen , A. , Loukovaara , M. , Bützow , R ., 2020 . Clinicopathological significance of deficient DNA mismatch repair and MLH1 promoter methylation in endometrioid endometrial carcinoma . Modern Pathology . doi: 10.1038/s41379-020-0501-8 OpenUrl CrossRef ↵ Pasanen , A. , Tuomi , T. , Isola , J. , Staff , S. , Bützow , R. , Loukovaara , M. , 2016 . L1 Cell Adhesion Molecule as a Predictor of Disease-Specific Survival and Patterns of Relapse in Endometrial Cancer . International Journal of Gynecologic Cancer 26 , 1465 – 1471 . doi: 10.1097/igc.0000000000000801 OpenUrl CrossRef ↵ Pecorelli , S ., 2009 . Revised FIGO staging for carcinoma of the vulva, cervix, and endometrium . International journal of gynaecology and obstetrics: the official organ of the International Federation of Gynaecology and Obstetrics 105 , 103 – 4 . doi: 10.1016/j.ijgo.2009.02.012 OpenUrl CrossRef PubMed ↵ Piedimonte , S. , Feigenberg , T. , Drysdale , E. , Kwon , J. , Gotlieb , W.H. , Cormier , B. , Plante , M. , Lau , S. , Helpman , L. , Renaud , M.-C. , May , T. , Vicus , D ., 2022 . Predicting recurrence and recurrence-free survival in high-grade endometrial cancer using machine learning . Journal of surgical oncology 126 , 1096 – 1103 . doi: 10.1002/jso.27008 OpenUrl CrossRef PubMed ↵ Ponce-Bobadilla , A.V. , Schmitt , V. , Maier , C.S. , Mensing , S. , Stodtmann , S. , 2024 . Practical guide to SHAP analysis: Explaining supervised machine learning model predictions in drug development . 
Clinical and Translational Science 17 . doi: 10.1111/cts.70056 OpenUrl CrossRef PubMed ↵ Schlosshauer , P.W. , Ellenson , L.H. , Soslow , R.A ., 2002 . β-Catenin and E-Cadherin Expression Patterns in High-Grade Endometrial Carcinoma Are Associated with Histological Subtype . Modern Pathology 15 , 1032 – 1037 . doi: 10.1097/01.mp.0000028573.34289.04 OpenUrl CrossRef PubMed Web of Science ↵ Siegel , R.L. , Miller , K.D. , Fuchs , H.E. , Jemal , A ., 2022 . Cancer statistics, 2022 . CA: A Cancer Journal for Clinicians 72 , 7 – 33 . doi: 10.3322/caac.21708 OpenUrl CrossRef PubMed ↵ Siegenthaler , F. , Lindemann , K. , Epstein , E. , Rau , T.T. , Nastic , D. , Ghaderi , M. , Rydberg , F. , Mueller , M.D. , Carlson , J. , Imboden , S ., 2022 . Time to first recurrence, pattern of recurrence, and survival after recurrence in endometrial cancer according to the molecular classification . Gynecologic Oncology 165 , 230 – 238 . doi: 10.1016/j.ygyno.2022.02.024 OpenUrl CrossRef PubMed ↵ Sozzi , G. , Uccella , S. , Berretta , R. , Petrillo , M. , Fanfani , F. , Monterossi , G. , Ghizzoni , V. , Frusca , T. , Ghezzi , F. , Chiantera , V. , Scambia , G ., 2018 . Tumor Size, an Additional Risk Factor of Local Recurrence in Low-Risk Endometrial Cancer: A Large Multicentric Retrospective Study . International Journal of Gynecologic Cancer 28 , 684 – 691 . doi: 10.1097/igc.0000000000001223 OpenUrl CrossRef ↵ Talhouk , A. , McConechy , M.K. , Leung , S. , Li-Chang , H.H. , Kwon , J.S. , Melnyk , N. , Yang , W. , Senz , J. , Boyd , N. , Karnezis , A.N. , Huntsman , D.G. , Gilks , C.B. , McAlpine , J.N ., 2015 . A clinically applicable molecular-based classification for endometrial cancers . British Journal of Cancer 113 , 299 – 310 . doi: 10.1038/bjc.2015.190 OpenUrl CrossRef PubMed ↵ Talhouk , A. , McConechy , M.K. , Leung , S. , Yang , W. , Lum , A. , Senz , J. , Boyd , N. , Pike , J. , Anglesio , M. , Kwon , J.S. , Karnezis , A.N. , Huntsman , D.G. , Gilks , C.B. 
, McAlpine , J.N ., 2017 . Confirmation of ProMisE: A simple, genomics-based clinical classifier for endometrial cancer . Cancer 123 , 802 – 813 . doi: 10.1002/cncr.30496 OpenUrl CrossRef PubMed ↵ Tuninetti , V. , Farolfi , A. , Rognone , C. , Montanari , D. , De Giorgi , U. , Valabrega , G. , 2024 . Treatment Strategies for Advanced Endometrial Cancer According to Molecular Classification . International Journal of Molecular Sciences 25 , 11448 . doi: 10.3390/ijms252111448 OpenUrl CrossRef PubMed ↵ Urick , M.E. , Bell , D.W ., 2019 . Clinical actionability of molecular targets in endometrial cancer . Nature Reviews Cancer 19 , 510 – 521 . doi: 10.1038/s41568-019-0177-x OpenUrl CrossRef PubMed ↵ Volinsky-Fremond , S. , Horeweg , N. , Andani , S. , Barkey Wolf , J. , Lafarge , M.W. , de Kroon , C.D. , Ørtoft , G. , Høgdall , E. , Dijkstra , J. , Jobsen , J.J. , Lutgens , L.C.H.W. , Powell , M.E. , Mileshkin , L.R. , Mackay , H. , Leary , A. , Katsaros , D. , Nijman , H.W. , de Boer , S.M. , Nout , R.A. , de Bruyn , M. , 2024 . Prediction of recurrence risk in endometrial cancer with multimodal deep learning . Nature Medicine 1 – 12 . doi: 10.1038/s41591-024-02993-w OpenUrl CrossRef PubMed ↵ W Glenn McCluggage , Bosse , T. , C Blake Gilks , Howitt , B.E. , McAlpine , J.N. , Nucci , M.R. , Rabban , J.T. , Singh , N. , Talia , K.L. , Parra-Herran , C ., 2023 . FIGO 2023 endometrial cancer staging: too much, too soon? International journal of gynecological cancer 34 , 138 – 143 . doi: 10.1136/ijgc-2023-004981 OpenUrl Abstract / FREE Full Text ↵ Wang , W. , Xu , Y. , Yuan , S. , Zhiying , L. , Zhu , X. , Zhou , Q. , Shen , W. , Wang , S ., 2022 . Prediction of Endometrial Carcinoma Using the Combination of Electronic Health Records and an Ensemble Machine Learning Method . Frontiers in Medicine 9 . doi: 10.3389/fmed.2022.851890 OpenUrl CrossRef ↵ Yang , X. , Wang , J ., 2019 . The Role of Metabolic Syndrome in Endometrial Cancer: A Review . Frontiers in Oncology 9 . 
doi: 10.3389/fonc.2019.00744 OpenUrl CrossRef ↵ Zheng , S. , Wu , Y. , Donnelly , E.D. , Strauss , J.B ., 2023 . A cost-effective, machine learning-based new unified risk-classification score (NU-CATS) for patients with endometrial cancer . Gynecologic oncology 175 , 97 – 106 . doi: 10.1016/j.ygyno.2023.06.008 OpenUrl CrossRef PubMed ↵ Zwahlen , D.R. , Schick , U. , Bolukbasi , Y. , Thariat , J. , Abdah-Bortnyak , R. , Kuten , A. , Igdem , S. , Caglar , H. , Ozsaran , Z. , Loessl , K. , Belkaaloul , K.K. , Villette , S. , Vees , H ., 2016 . Outcome and Predictive Factors in Uterine Carcinosarcoma Using Postoperative Radiotherapy: A Rare Cancer Network Study . Rare tumors 8 , 6052 . doi: 10.4081/rt.2016.6052 OpenUrl CrossRef PubMed Supplementary References Aro , K. , Loukovaara , M. , Bützow , R. , Pasanen , A ., 2025 . HER2 amplification and HER2 low expression in endometrial carcinoma: prevalence across molecular, histological and clinicopathological risk groups . BJC Reports 3 . doi: 10.1038/s44276-025-00125-6 OpenUrl CrossRef Aro , K. , Pasanen , A. , Bützow , R. , Loukovaara , M ., 2024 . The impact of estrogen receptor and L1 cell adhesion molecule expression on endometrial cancer outcome correlates with clinicopathological risk group and molecular subgroup . Gynecologic oncology 189 , 9 – 15 . doi: 10.1016/j.ygyno.2024.06.016 OpenUrl CrossRef PubMed Bartley , A.N. , Washington , M.K. , Colasacco , C. , Ventura , C.B. , Ismaila , N. , Benson , A.B. , Carrato , A. , Gulley , M.L. , Jain , D. , Kakar , S. , Mackay , H.J. , Streutker , C. , Tang , L. , Troxell , M. , Ajani , J.A ., 2017 . HER2 Testing and Clinical Decision Making in Gastroesophageal Adenocarcinoma: Guideline From the College of American Pathologists, American Society for Clinical Pathology, and the American Society of Clinical Oncology . Journal of Clinical Oncology 35 , 446 – 464 . doi: 10.1200/jco.2016.69.4836 OpenUrl CrossRef PubMed Guan , B. , Mao , T.-L. , Panuganti , P.K. , Kuhn , E. 
, Kurman , R.J. , Maeda , D. , Chen , E. , Jeng , Y.-M. , Wang , T.-L. , Shih , I.-M ., 2011 . Mutation and loss of expression of ARID1A in uterine low-grade endometrioid carcinoma . The American journal of surgical pathology 35 , 625 – 632 . doi: 10.1097/PAS.0b013e318212782a OpenUrl CrossRef PubMed Khatun , M. , Pasanen , A. , Kanerva , A. , Koivisto-Korander , R. , Tuomi , T. , Bützow , R. , Loukovaara , M ., 2025 . PPP2R1A mutation status as a predictive and prognostic factor in molecularly characterized endometrial carcinoma: a cohort study . International journal of gynecological cancer: official journal of the International Gynecological Cancer Society 35 , 101934 . doi: 10.1016/j.ijgc.2025.101934 OpenUrl CrossRef PubMed Lassus , H. , Leminen , A. , Lundin , J. , Lehtovirta , P. , Butzow , R ., 2003 . Distinct subtypes of serous ovarian carcinoma identified by p53 determination (Supplementary data associated with this article can be found at doi: 10.1016/S0090-8258(03)00608-5) . Gynecologic Oncology 91 , 504 – 512 . doi: 10.1016/j.ygyno.2003.08.034 OpenUrl CrossRef PubMed Meric-Bernstam , F. , Makker , V. , Oaknin , A. , Oh , D.-Y. , Banerjee , S. , González-Martín , A. , Jung , K.H. , Ługowska , I. , Manso , L. , Manzano , A. , Melichar , B. , Siena , S. , Stroyakovskiy , D. , Fielding , A. , Ma , Y. , Puvvada , S. , Shire , N. , Lee , J.-Y ., 2023 . Efficacy and Safety of Trastuzumab Deruxtecan in Patients With HER2-Expressing Solid Tumors: Primary Results From the DESTINY-PanTumor02 Phase II Trial . Journal of Clinical Oncology: Official Journal of the American Society of Clinical Oncology 42 , 101200JCO2302005 . doi: 10.1200/JCO.23.02005 OpenUrl CrossRef Pasanen , A. , Ahvenainen , T. , Pellinen , T. , Vahteristo , P. , Loukovaara , M. , Bützow , R ., 2019 . PD-L1 Expression in Endometrial Carcinoma Cells and Intratumoral Immune Cells . American Journal of Surgical Pathology 44 , 174 – 181 . doi: 10.1097/pas.0000000000001395 OpenUrl CrossRef Pasanen , A. 
, Loukovaara , M. , Ahvenainen , T. , Vahteristo , P. , Bützow , R ., 2021 . Differential impact of clinicopathological risk factors within the 2 largest ProMisE molecular subgroups of endometrial carcinoma . PLOS ONE 16 , e0253472 . doi: 10.1371/journal.pone.0253472 OpenUrl CrossRef PubMed Pasanen , A. , Tuomi , T. , Isola , J. , Staff , S. , Bützow , R. , Loukovaara , M ., 2016 . L1 Cell Adhesion Molecule as a Predictor of Disease-Specific Survival and Patterns of Relapse in Endometrial Cancer . International Journal of Gynecologic Cancer 26 , 1465 – 1471 . doi: 10.1097/igc.0000000000000801 OpenUrl CrossRef Soovares , P. , Pasanen , A. , Similä-Maarala , J. , Bützow , R. , Lassus , H ., 2022 . Clinical factors and biomarker profiles associated with patient outcome in endometrioid ovarian carcinoma - Emphasis on tumor grade . Gynecologic oncology 164 , 187 – 194 . doi: 10.1016/j.ygyno.2021.10.078 OpenUrl CrossRef PubMed V. H. W. M. Jongen , Briët , J.M. , R. De Jong , Klaske ten Hoor , Marike Boezen , van, Nijman , H.W. , Hollema , H. , 2009 . Expression of estrogen receptor-alpha and-beta and progesterone receptor-A and-B in a large cohort of patients with endometrioid endometrial cancer . Gynecologic Oncology 112 , 537 – 542 . doi: 10.1016/j.ygyno.2008.10.032 OpenUrl CrossRef PubMed View the discussion thread. Back to top Previous Next Posted November 07, 2025. Download PDF Supplementary Material Email Thank you for your interest in spreading the word about bioRxiv. NOTE: Your email address is requested solely to identify you as the sender of this article. Your Email * Your Name * Send To * Enter multiple addresses on separate lines or separate them with commas. 
You are going to email the following Explainable Machine Learning for Preoperative Relapse Prediction in Molecularly Stratified Endometrial Cancer: A Single-Center Finnish Cohort Study Message Subject (Your Name) has forwarded a page to you from bioRxiv Message Body (Your Name) thought you would like to see this page from the bioRxiv website. Your Personal Message CAPTCHA This question is for testing whether or not you are a human visitor and to prevent automated spam submissions. Share Explainable Machine Learning for Preoperative Relapse Prediction in Molecularly Stratified Endometrial Cancer: A Single-Center Finnish Cohort Study Sergio Vela Moreno , Masuma Khatun , Annukka Pasanen , Ralf Bützow , Andres Salumets , Mikko Loukovaara , Vijayachitra Modhukur bioRxiv 2025.11.06.686680; doi: https://doi.org/10.1101/2025.11.06.686680 Share This Article: Copy Citation Tools Explainable Machine Learning for Preoperative Relapse Prediction in Molecularly Stratified Endometrial Cancer: A Single-Center Finnish Cohort Study Sergio Vela Moreno , Masuma Khatun , Annukka Pasanen , Ralf Bützow , Andres Salumets , Mikko Loukovaara , Vijayachitra Modhukur bioRxiv 2025.11.06.686680; doi: https://doi.org/10.1101/2025.11.06.686680 Citation Manager Formats BibTeX Bookends EasyBib EndNote (tagged) EndNote 8 (xml) Medlars Mendeley Papers RefWorks Tagged Ref Manager RIS Zotero Tweet Widget Facebook Like Google Plus One Subject Area Cancer Biology Subject Areas All Articles Animal Behavior and Cognition (7642) Biochemistry (17715) Bioengineering (13907) Bioinformatics (42003) Biophysics (21470) Cancer Biology (18624) Cell Biology (25533) Clinical Trials (138) Developmental Biology (13390) Ecology (19935) Epidemiology (2067) Evolutionary Biology (24356) Genetics (15617) Genomics (22529) Immunology (17753) Microbiology (40432) Molecular Biology (17200) Neuroscience (88681) Paleontology (667) Pathology (2840) Pharmacology and Toxicology (4828) Physiology (7653) Plant Biology (15161) 
Scientific Communication and Education (2046) Synthetic Biology (4304) Systems Biology (9826) Zoology (2271)

Text is read by the "Ask this paper" AI Q&A widget below. Extraction quality varies by source — PMC NXML preserves structure cleanly, OA-HTML may include some navigation residue, and OA-PDF can have broken hyphenation. The publisher copy (via DOI) is the canonical version.

My notes (saved in your browser only)

⚙ Ask this paper AI returns verbatim quotes from the full text · source: preprint-html ⓘ

Answers must be backed by verbatim quotes from this paper's full text. Hallucinated quotes are dropped automatically; if no verbatim passage answers the question, we say so. How this works

Citation neighborhood (no data yet)

We don't have any in-corpus citations linked to this paper yet. This is a recent paper (2025) — citers typically take a year or two to land, and the OpenAlex reference graph may still be filling in.

Source provenance

europepmc: last seen: 2026-05-20T01:45:00.602351+00:00