Stacking Ensemble Learning-based Models Enabling Accurate Diagnosis of Cardiac Amyloidosis using SPECT/CT:an International and Multicentre Study

preprint OA: closed
📄 Open PDF Full text JSON View at publisher
Full text 47,578 characters · extracted from preprint-html · click to expand
Stacking Ensemble Learning-based Models Enabling Accurate Diagnosis of Cardiac Amyloidosis using SPECT/CT:an International and Multicentre Study | medRxiv /* */ /* */ <!-- <!-- /*! * yepnope1.5.4 * (c) WTFPL, GPLv2 */ (function(a,b,c){function d(a){return"[object Function]"==o.call(a)}function e(a){return"string"==typeof a}function f(){}function g(a){return!a||"loaded"==a||"complete"==a||"uninitialized"==a}function h(){var a=p.shift();q=1,a?a.t?m(function(){("c"==a.t?B.injectCss:B.injectJs)(a.s,0,a.a,a.x,a.e,1)},0):(a(),h()):q=0}function i(a,c,d,e,f,i,j){function k(b){if(!o&&g(l.readyState)&&(u.r=o=1,!q&&h(),l.onload=l.onreadystatechange=null,b)){"img"!=a&&m(function(){t.removeChild(l)},50);for(var d in y[c])y[c].hasOwnProperty(d)&&y[c][d].onload()}}var j=j||B.errorTimeout,l=b.createElement(a),o=0,r=0,u={t:d,s:c,e:f,a:i,x:j};1===y[c]&&(r=1,y[c]=[]),"object"==a?l.data=c:(l.src=c,l.type=a),l.width=l.height="0",l.onerror=l.onload=l.onreadystatechange=function(){k.call(this,r)},p.splice(e,0,u),"img"!=a&&(r||2===y[c]?(t.insertBefore(l,s?null:n),m(k,j)):y[c].push(l))}function j(a,b,c,d,f){return q=0,b=b||"j",e(a)?i("c"==b?v:u,a,b,this.i++,c,d,f):(p.splice(this.i++,0,a),1==p.length&&h()),this}function k(){var a=B;return a.loader={load:j,i:0},a}var l=b.documentElement,m=a.setTimeout,n=b.getElementsByTagName("script")[0],o={}.toString,p=[],q=0,r="MozAppearance"in l.style,s=r&&!!b.createRange().compareNode,t=s?l:n.parentNode,l=a.opera&&"[object Opera]"==o.call(a.opera),l=!!b.attachEvent&&!l,u=r?"object":l?"script":"img",v=l?"script":u,w=Array.isArray||function(a){return"[object Array]"==o.call(a)},x=[],y={},z={timeout:function(a,b){return b.length&&(a.timeout=b[0]),a}},A,B;B=function(a){function b(a){var a=a.split("!"),b=x.length,c=a.pop(),d=a.length,c={url:c,origUrl:c,prefixes:a},e,f,g;for(f=0;f<d;f++)g=a[f].split("="),(e=z[g.shift()])&&(c=e(c,g));for(f=0;f<b;f++)c=x[f](c);return c}function g(a,e,f,g,h){var i=b(a),j=i.autoCallback;i.url.split(".").pop().split("?").shift(),i.bypass||(e&&(e=d(e)?e:e[a]||e[g]||e[a.split("/").pop().split("?")[0]]),i.instead?i.instead(a,e,f,g,h):(y[i.url]?i.noexec=!0:y[i.url]=1,f.load(i.url,i.forceCSS||!i.forceJS&&"css"==i.url.split(".").pop().split("?").shift()?"c":c,i.noexec,i.attrs,i.timeout),(d(e)||d(j))&&f.load(function(){k(),e&&e(i.origUrl,h,g),j&&j(i.origUrl,h,g),y[i.url]=2})))}function h(a,b){function c(a,c){if(a){if(e(a))c||(j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}),g(a,j,b,0,h);else if(Object(a)===a)for(n in m=function(){var b=0,c;for(c in a)a.hasOwnProperty(c)&&b++;return b}(),a)a.hasOwnProperty(n)&&(!c&&!--m&&(d(j)?j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}:j[n]=function(a){return function(){var b=[].slice.call(arguments);a&&a.apply(this,b),l()}}(k[n])),g(a[n],j,b,n,h))}else!c&&l()}var h=!!a.test,i=a.load||a.both,j=a.callback||f,k=j,l=a.complete||f,m,n;c(h?a.yep:a.nope,!!i),i&&c(i)}var i,j,l=this.yepnope.loader;if(e(a))g(a,0,l,0);else if(w(a))for(i=0;i (function(w,d,s,l,i){w[l]=w[l]||[];w[l].push({'gtm.start':new Date().getTime(),event:'gtm.js'});var f=d.getElementsByTagName(s)[0];var j=d.createElement(s);var dl=l!='dataLayer'?'&l='+l:'';j.src='//www.googletagmanager.com/gtm.js?id='+i+dl;j.type='text/javascript';j.async=true;f.parentNode.insertBefore(j,f);})(window,document,'script','dataLayer','GTM-P4HH5NV'); Skip to main content Home About Submit ALERTS / RSS Search for this keyword Advanced Search Stacking Ensemble Learning-based Models Enabling Accurate Diagnosis of Cardiac Amyloidosis using SPECT/CT:an International and Multicentre Study Qu Mo , Jing Cui , Shengguo Jia , Ying Zhang , Yi Xiao , Caiguang Liu , Chunqing Zhou , Clemens P Spielvogel , Raffaella Calabretta , Weihua Zhou , Ke Cao , Marcus Hacker , Xiang Li , Min Zhao doi: https://doi.org/10.1101/2025.06.22.25330039 Qu Mo 1 Department of Nuclear Medicine, Xiangya Hospital, Central South University , Changsha 410008, China 2 Department of Nuclear Medicine, Third Xiangya Hospital, Central South University , Changsha 410013, China Find this author on Google Scholar Find this author on PubMed Search for this author on this site Jing Cui 3 Department of Nuclear Medicine, Fuwai Central China Cardiovascular Hospital, Henan Provincial People’s Hospital Heart Center , Zhengzhou 451464, China Find this author on Google Scholar Find this author on PubMed Search for this author on this site Shengguo Jia 4 Siemens Healthineers Ltd. , Shanghai, China Find this author on Google Scholar Find this author on PubMed Search for this author on this site Ying Zhang 3 Department of Nuclear Medicine, Fuwai Central China Cardiovascular Hospital, Henan Provincial People’s Hospital Heart Center , Zhengzhou 451464, China Find this author on Google Scholar Find this author on PubMed Search for this author on this site Yi Xiao 1 Department of Nuclear Medicine, Xiangya Hospital, Central South University , Changsha 410008, China Find this author on Google Scholar Find this author on PubMed Search for this author on this site Caiguang Liu 1 Department of Nuclear Medicine, Xiangya Hospital, Central South University , Changsha 410008, China Find this author on Google Scholar Find this author on PubMed Search for this author on this site Chunqing Zhou 2 Department of Nuclear Medicine, Third Xiangya Hospital, Central South University , Changsha 410013, China Find this author on Google Scholar Find this author on PubMed Search for this author on this site Clemens P Spielvogel 5 Department of Biomedical Imaging and Image-Guided Therapy, Division of Nuclear Medicine, Medical University of Vienna , Vienna, Austria Find this author on Google Scholar Find this author on PubMed Search for this author on this site Raffaella Calabretta 5 Department of Biomedical Imaging and Image-Guided Therapy, Division of Nuclear Medicine, Medical University of Vienna , Vienna, Austria Find this author on Google Scholar Find this author on PubMed Search for this author on this site Weihua Zhou 6 Department of Applied Computing, Michigan Technological University , Houghton, MI, USA Find this author on Google Scholar Find this author on PubMed Search for this author on this site Ke Cao 7 Department of Oncology, Third Xiangya Hospital, Central South University , Changsha 410013, China Find this author on Google Scholar Find this author on PubMed Search for this author on this site Marcus Hacker 5 Department of Biomedical Imaging and Image-Guided Therapy, Division of Nuclear Medicine, Medical University of Vienna , Vienna, Austria Find this author on Google Scholar Find this author on PubMed Search for this author on this site Xiang Li 5 Department of Biomedical Imaging and Image-Guided Therapy, Division of Nuclear Medicine, Medical University of Vienna , Vienna, Austria Find this author on Google Scholar Find this author on PubMed Search for this author on this site Min Zhao 2 Department of Nuclear Medicine, Third Xiangya Hospital, Central South University , Changsha 410013, China Find this author on Google Scholar Find this author on PubMed Search for this author on this site For correspondence: mzhao1981{at}csu.edu.cn Abstract Full Text Info/History Metrics Supplementary material Data/Code Preview PDF ABSTRACT PURPOSE Cardiac amyloidosis (CA), a life-threatening infiltrative cardiomyopathy, can be non-invasively diagnosed using [ 99m Tc]Tc-bisphosphonate SPECT/CT. However, subjective visual interpretation risks diagnostic inaccuracies. We developed and validated a machine learning (ML) framework leveraging SPECT/CT radiomics to automate CA detection. METHODS This retrospective multicenter study analyzed 290 patients of suspected CA who underwent [ 99m Tc]Tc-PYP or [ 99m Tc]Tc-DPD SPECT/CT. Radiomic features were extracted from co-registered SPECT and CT images, harmonized via intra-class correlation and Pearson correlation filtering, and optimized through LASSO regression. A stacking ensemble model incorporating support vector machine (SVM), random forest (RF), gradient boosting decision tree (GBDT), and adaptive boosting (AdaBoost) classifiers was constructed. The model was validated using an internal validation set (n = 54) and two external test set (n = 54 and n = 58).Model performance was evaluated using the area under the receiver operating characteristic curve (AUC), calibration, and decision curve analysis (DCA). Feature importance was interpreted using SHapley Additive exPlanations (SHAP) values. RESULTS Of 290 patients, 117 (40.3%) had CA. The stacking radiomics model attained AUCs of 0.871, 0.824, and 0.839 in the validation, test 1, and test 2 cohorts, respectively, significantly outperforming the clinical model (AUC 0.546 in validation set, P <0.05). DCA demonstrated superior net benefit over the clinical model across relevant thresholds, and SHAP analysis highlighted wavelet-transformed first-order and texture features as key predictors. CONCLUSION A stacking ML model with SPECT/CT radiomics improves CA diagnosis, showing strong generalizability across varied imaging protocols and populations and highlighting its potential as a decision-support tool. INTRODUCTION Cardiac amyloidosis (CA) is a progressive disorder characterized by extracellular deposition of misfolded protein fibrils in myocardial tissue, leading to potentially fatal complications including heart failure and conduction abnormalities[ 1 ]. Despite advancements in diagnostic techniques, CA remains challenging to diagnose due to its heterogeneous and nonspecific clinical presentation, often resulting in diagnostic delays or misclassification[ 2 ]. While endomyocardial biopsy (EMB) remains the diagnostic gold standard, its invasive nature and associated risks have prompted the development of non-invasive alternatives [ 2 ]. [ 99m Tc]Tc-bisphosphonate scintigraphy has emerged as a reliable non-invasive diagnostic modality for transthyretin cardiac amyloidosis (ATTR-CA), particularly when combined with immunoglobulin light chain screening to exclude amyloid light chain cardiac amyloidosis (AL-CA) [ 3 ]. However, despite the advancements, the visual assessment method is inherently subjective, with accuracy heavily reliant on the physician’s experience[ 4 ]. Moreover, visual scoring has limitations in capturing the heterogeneity of diseases and its ability to reflect subtle disease information is limited, while being less effective in identifying AL-CA [ 5 , 6 ]. Artificial intelligence(AI) has shown increasing promise for the diagnosis and prognostic assessment of CA[ 7 ]. In bone scintigraphy.Delbarre et al. trained a convolutional neural network on 3,048 images, achieving 99% sensitivity and 96% specificity versus expert visual reads [ 8 ]. Speilvogel et al. then implemented an automated image-standardization pipeline followed by deep learning(DL) to identify Perugini score ≥ 2 uptake, achieving an internal cross-validation AUC of 1.000 and external AUCs of 0.925-1.000 [ 9 ]. Hybrid SPECT/CT offers the distinct advantage of precise anatomical localization via co-registered images, which is especially valuable in early-stage disease when regional myocardial uptake may be mistaken for blood pool activity. Recently, a DL method was developed for fully automated volumetric quantification of [ 99m Tc]Tc-PYP using segmentation of co-registered anatomical structures from CT attenuation maps[ 4 ]. Despite these advances, AI -driven SPECT/CT applications for comprehensive CA diagnosis remain unexplored. This study aims to develop and validate an ensemble machine learning (ML) model based on SPECT/CT images for automated detection of CA, providing clinicians with a more reliable diagnostic tool. MATERIALS AND METHODS Study population Data were retrospectively collected from 290 patients with suspected CA who underwent [ 99m Tc]Tc-bisphosphonate SPECT/CT imaging at three centers between February 2021 and February 2024. The training set and internal validation set from the center 1 (Xiangya Hospital of Central South University) consisted of 124 and 54 patients, respectively. The external test sets from the second center (Fuwai Central China Cardiovascular Hospital) and the third center (Vienna General Hospital, Medical University of Vienna) comprised 54 and 58 patients, respectively. Patients from Centers 1 and 2 received [ 99m Tc]Tc-PYP, while patients from Center 3 were administered [ 99m Tc]Tc-DPD as the imaging agent. A flowchart of patient enrollment is shown in Figure 1 . This study was granted ethical approval by the institutional review boards of Xiangya Hospital, Central South University (No. 202310202), Fuwai Central China Cardiovascular Hospital (Ethics Review No. 202303), and the General Hospital of Vienna (EK1557/2020). It was carried out in accordance with the principles of the 1964 Declaration of Helsinki. Owing to the retrospective study design, the Institutional Review Boards of all participating institutions formally waived the requirement for informed consent. Download figure Open in new tab Figure 1. Flowchart of study cohort enrollment. Diagnosis of CA Patients underwent a comprehensive diagnostic workup, which included cardiac imaging tests such as electrocardiogram (ECG), echocardiography, cardiac magnetic resonance imaging (CMR), and [ 99m Tc]Tc -biphosphonate scintigraphy, laboratory tests such as serum N-terminal prohormone of brain natriuretic peptide (NT-proBNP) and estimated glomerular filtration rate (eGFR), as well as myocardial or non-myocardial biopsy. The diagnosis of CA was made according to current guidelines[ 3 , 10 , 11 ]: CA was defined to be present if (1) [ 99m Tc]Tc-bisphosphonate imaging strongly suggested cardiac uptake in the absence of monoclonal gammopathy, the diagnosis was ATTR-CA. or (2) histological evidence of amyloid infiltration was found in endocardial or extracardiac biopsy tissues and cardiac imaging strongly suggested CA, with the presence of monoclonal immunoglobulin or free light chains in blood or urine, or monoclonal plasma cells/B cells in bone marrow, AL-CA was diagnosed or (3) other types of CA were confirmed by immunohistochemistry or mass spectrometry. SPECT/CT Imaging protocols At Center 1&2, patients received an intravenous injection of 370-740 MBq of [ 99m Tc]Tc-PYP, followed by chest planar imaging 1 hour later and SPECT/CT of the thorax 3 hours post-injection. At Center3, patients were administered an intravenous injection of 700 MBq of [ 99m Tc]Tc-DPD, followed by whole-body planar imaging and chest SPECT/CT scan 3 hours later. CT scans were performed before SPECT acquisition to correct for radiation scatter and attenuation, and the SPECT data were reconstructed using the respective algorithms provided by each manufacturer. Detailed information on imaging vectors and acquisition protocols is provided in Supplementary Table 1 . Image analysis Cardiac tracer uptake was assessed according to the Perugini grading system, where Grade 0 indicates no cardiac uptake, Grade 1 indicates mild cardiac uptake (lower than bone), and Grades 2 or 3 indicate intense cardiac uptake (equal to or greater than bone). Grades 0-1 were considered negative, while Grades 2-3 were considered positive[ 3 , 9 ]. In each center, visual scoring was evaluated by two experienced (≥5 years) nuclear medicine physicians who were blinded to patient information. In cases where the visual scoring is ambiguous, to prevent disputes, consultation with a more senior physician is conducted to reach a consensus. A circular region of interest (ROI) was placed over the heart and mirrored to the contralateral chest (avoiding areas such as the sternum and stomach). The average counts within the ROI were calculated to obtain the heart-to-contralateral lung (H/CL) ratio. A 1-hour H/CL ratio ≥ 1.5 was considered positive, and a 3-hour H/CL ratio ≥ 1.3 was considered positive [ 3 ]. Segmentation, radiomics feature extraction and selection The volume of interest (VOI) for the heart contour was automatically segmented by the Siemens software MM RT Image Suite[ 12 ] ( Supplementary Figure 1 ) , and subsequently reviewed and manually adjusted as needed by two experienced nuclear medicine physicians (Q.M., M.Z.),Radiomic features were extracted from both SPECT and CT images using PyRadiomics package ( https://github.com/Radiomics/pyradiomics )[ 13 ], which is compliant with the Imaging Biomarker Standardization Initiative(IBSI). The extracted features can be divided into four sets: (1) first-order statistics; (2) shape-based features extracted from 2-D regions of interest or 3-D VOIs; (3) texture features including gray-level co-occurrence matrix (GLCM), gray-level dependence matrix (GLDM), gray-level run length matrix (GLRLM), gray-level run length matrix(GLRLM), gray-level sizezone matrix (GLSZM) and neighboring gray-level dependence matrix (NGTDM); (4) higher-order features using Laplacian of Gaussian (LoG) filter and wavelet transform filter with all possible combinations of high (H) or low (L) pass filter in each of the three dimensions (HHH, HHL, HLH, LHH, LLL, LLH, LHL, HLL). All data from Center 1 were randomly split into a training set (70%) and an internal validation set (30%).Data from Centers 2 and 3 served as external testing sets. Optimal feature selection involved four sequential steps: (1) Z-score normalization of all features; (2) feature reproducibility was assessed via intra-class correlation coefficient (ICC), retaining only those with ICC > 0.75[ 16 ]; (3) Pearson correlation coefficient (PCC) analysis was performed, and when the PCC between any two features in the training set exceeded 0.90, one feature was removed to reduce redundancy[ 17 ]; and (4) LASSO regression with 1-standard error and 10-fold cross-validation was applied to avoid overfitting[ 18 ]. The radiomics workflow is shown in the Central Illustration . Development and validation of the models Independent predictive factors for CA in the training set were selected using univariate and multivariate logistic regression analysis. All significant clinical factors identified in the univariate analysis were included in the subsequent multivariate analysis. A clinical model was established based on the independent predictive factors. Based on the selected radiomic features, radiomics models were constructed using various ML algorithms, including support vector machine (SVM), random forest (RF), gradient boosting decision Tree (GBDT), adaptive boosting (Adaboost), and the stacking ensemble method. The stacking model utilized SVM, RF, GBDT, and Adaboost as primary learners (first level), with RF serving as the meta-learner (second level). Supplementary Figure 2 illustrates the development process of the stacking radiomics model. By employing metrics such as area under the curve (AUC), accuracy(ACC), sensitivity(SEN), specificity(SPE), positive predictive value (PPV), and negative predictive value (NPV), we compared the performance among different models. while the clinical utility of the models in both training and validation cohorts was evaluated through decision curve analysis (DCA). Shapley Additive Explanations (SHAP) were employed to interpret the ML model by quantifying the contribution of each feature to the model’s predictions[ 19 ]. Statistical analysis All statistical analyses were performed using SPSS (version 27.0), R (version 4.4.1, ( www.Rproject.org ), and Python (version 3.10). Continuous data were represented using mean ± standard deviation (SD) or median (with interquartile range), depending on their distribution. When comparing continuous variables, either the t-test or the Mann-Whitney U test was used. Categorical data were analyzed by the chi-square test or Fisher’s exact test, and were presented as numbers (percentages). NT-proBNP levels were logarithmically transformed prior to inclusion in the logistic regression model. Univariate and multivariate regression analyses were conducted to identify risk factors. Multivariable logistic regression analyses were performed on variables with a P value < 0.1 from the univariate analysis. Model performance was assessed by plotting ROC curves, differences in AUCs between models were statistically compared using the DeLong test. A P value of less than 0.05 was considered statistically significant. RESULTS Patient characteristics At the end of the diagnostic work-up, CA was diagnosed in 58 cases (32.6% of the whole population; 38 cases of ATTR-CA, 15 cases of AL-CA, and 5 cases of other types of CA) at Center 1, 20 cases (37.0% of the whole population; 3 cases of ATTR-CA, 13 cases of AL-CA, and 4 cases of other types of CA) at Center 2, and 39 cases (67.2% of the whole population; 35 cases of ATTR-CA, 4 cases of AL-CA) at Center 3. The clinical characteristics of the patients are summarized in Table 1 . Among these three centers, CA patients had significantly higher levels of NT-proBNP compared to non-CA patients. Furthermore, the H/CL ratio and visual score of CA patients were significantly higher than those of non-CA patients (both P<0.05). View this table: View inline View popup Table 1. Characteristics of the patients in different cohorts Feature Selection A total of 1888 features were extracted,from the CT and SPECT images. 376 features with high consistency were selected after-dimensionality reduction by ICC and PCC analysis, 9 key features were ultimately selected for the radiomics model. Among them, 4 features were extracted from SPECT images: Glszm_GrayLevel_NonUniformity, Log-sigma-3-0-mm-3D_ngtdm_Contrast, Wavelet-LLH_firstorder_Median, and Wavelet-LHH_glszm_GrayLevel_NonUniformity_Normalized. The remaining 5 features were derived from CT images: Firstorder_Entropy, Wavelet-LLH_firstorder_10Percentile, Wavelet-LLH_glszm_SizeZone_NonUniformity_Normalized, Wavelet-LLL_firstorder_90Percentile, and Wavelet-LLL_gldm_Dependence_Entropy. Univariate and multivariate analysis The univariate analysis revealed that age, lgNT-proBNP, and Interventricular septal (IVS) thickness derived from echocardiography were associated with CA. Subsequently, the significant variables from the univariate analysis (age, lgNT-proBNP, IVS thickness) were included in the multivariate logistic regression analysis. In multivariable analysis, lgNT-proBNP (OR: 4.63, 95% CI: 2.09 - 10.29, p < 0.001) and IVS thickness (OR: 1.23, 95% CI: 1.07 - 1.40, p = 0.003) were independent predictors of CA ( Supplementary Table 2 ). A predictive model constructed based on clinical parameters was then used to predict CA. Model Performance for Differentiating CA and Non-CA We evaluated the diagnostic performance of radiomics models based on five ML algorithms. As shown in Figure 2 , the stacking ensemble algorithm model achieved the highest AUCs on the training set and on the Center 2 and Center 3 test sets, with slightly lower performance than SVM on the Center 1-validation set. Despite the lack of statistical significance, the stacking ensemble algorithm model exhibited smaller AUC fluctuations across datasets, suggesting relative robustness. The calibration curves for stacking ensemble model indicated strong agreement between predicted probabilities and observed outcomes across datasets (Brier score =0.070– 0.156). Consequently, we selected the stacking ensemble model for subsequent development. Subsequently, we compared the stacking ensemble-based radiomics model with the clinical model and the H/CL ratio for diagnosing CA. As shown in Table 2 and Figure 3 , the radiomics model achieved higher AUCs than the clinical model across all cohorts. A statistically significant difference was observed in this Center1-validation set between the radiomics model and the clinical model (AUC: 0.871 vs. 0.546, p = 0.01), whereas no significant differences were found in the other dataset. Compared with the H/CL ratio, the radiomics model yielded higher AUCs in all cohorts except Center 3, with a significant difference observed in the Center 1-training set (0.953 vs. 0.859, p = 0.023). Download figure Open in new tab Figure 2. Performance comparison of machine learning models across multicenter cohorts using radar plots. (A) The radar charts display AUC values for five models: Support Vector Machine (SVM), Random Forest (RF), Gradient Boosting Decision Tree (GBDT), Adaptive Boosting (AdaBoost), and Stacking Ensemble, evaluated on Center 1 training set, Center 1 validation set, Center 2 test set, and Center 3 test set. (B) Calibration curves of the radiomics model for the Center 1 training set, Center 1 validation set, Center 2 test set and Center 3 test set. Download figure Open in new tab Figure 3. Receiver operating characteristic (ROC) curves of the Radiomics, Clinical, and H/CL models for distinguishing CA from non-CA. ROC curves are presented for Center 1 training set, Center 1 validation set, Center 2 test set, and Center 3 test set. View this table: View inline View popup Download powerpoint Table 2. Diagnostic Performance of the SPECT/CT Radiomics Model, Clinincal Model and H/CL ratio among Different Cohorts DCA assessed the clinical utility of the predictive model by comparing net benefits at various threshold probabilities ( Figure 4 ). The results demonstrated that the radiomics model consistently provided a higher net benefit than the clinical model across most risk thresholds, while its performance was comparable to that of the H/CL ratio. Download figure Open in new tab Figure 4. Decision curve analysis (DCA) of Radiomics, Clinical, and H/CL models. DCA curves are presented for Center 1 training set, Center 1 validation set, Center 2 test set, and Center 3 test set. Figure 5 displays the SHAP summary plots for the top-performing models, highlighting both SPECT- and CT-derived features. These SHAP plots illustrate the relative contribution of each feature, offering valuable insights into the model’s decision-making process and enhancing interpretability of the ML predictions. Download figure Open in new tab Figure 5. SHAP (SHapley Additive exPlanations) summary plot displaying the impact of various features for radiomics model. Model Performance for Differentiating ATTR-CA and AL-CA To further evaluate the model’s capability to discriminate ATTR-CA from AL-CA, we conducted another validation using data from three centers. Owing to the limited number of CA cases in Centers 2 and 3, these cohorts were combined into a single subgroup. The established radiomics model was then applied independently to the Center 1 cohort and the merged Centers 2&3 cohort. As detailed in Supplementary Table 3 , the model achieved higher accuracy in distinguishing ATTR-CA from AL-CA than in differentiating CA from non-CA in both test sets. DISCUSSION This multicenter study represents the first successful implementation of an ensemble ML model for automated CA diagnosis using hybrid SPECT/CT radiomics. Our key findings demonstrate that the stacking ensemble model integrating SVM, RF, GBDT, and AdaBoost achieved superior diagnostic performance compared to individual classifiers and clinical parameters, with robust generalizability across geographically distinct countries and tracers. The current diagnostic process for CA is complex and time-consuming, highlighting the need for reliable and non-invasive tools to enable early and accurate detection[ 9 , 20 , 21 ]. Patients with CA often present with comorbidities such as increased NT-proBNP levels and left ventricular hypertrophy, which have been identified as predictive factors in prior studies[ 22 - 24 ]. Our research identified lgNT-proBNP and IVS thickness as independent risk factors for CA, consistent with existing literatures. This limited performance is likely due to the clinical overlap between CA and other cardiomyopathies, such as hypertrophic cardiomyopathy and hypertensive cardiomyopathy, which also present with heart failure with preserved ejection fraction (HFpEF) and left ventricular hypertrophy. Therefore, relying solely on these two markers lacks the specificity required for accurate CA diagnosis. The use of [ 99m Tc]Tc-bisphosphonate imaging has become increasingly widespread due to its high diagnostic accuracy and growing awareness of ATTR-CA[ 25 ]. For example, Perugini grading of planar [ 99m Tc]Tc-bisphosphonate scans can reach very high sensitivity (99%) for ATTR-CA but at the cost of reduced specificity (86%) due largely to false positives in AL-CA[ 26 ]. Similarly, the commonly used H/CL ratio threshold (≥1.3 at 3 h) helps confirm ATTR-CA when uptake is equivocal[ 26 ], but its added value over expert reading is modest. In contrast, our model’s automated quantitative analysis consistently outperformed these traditional metrics. Notably, the model’s diagnostic accuracy matched or exceeded that of previously reported AI approaches. For instance, a ML model based on clinical information, laboratory tests, and imaging examinations achieved an AUC of 0.84 in detecting ATTR-CA among patients with AS[ 7 ]. A coronary CT-derived radiomics model achieved AUC 0.91 for CA[ 27 ], while a deep-learning pipeline for SPECT/CT quantitation reported A near-perfect AUC (0.99) in distinguishing ATTR-positive scans[ 4 ]. Likewise, other AI approaches to bone scintigraphy have reported AUCs in the 0.88-0.94 range[ 28 ]. Moreover, the results showed that the diagnostic performance of our radiomics model in the Austrian cohort using [ 99m Tc]Tc-DPD (AUC: 0.839) was comparable to that in the Chinese cohort using [ 99m Tc]Tc-PYP (AUC: 0.824). This consistency across tracers suggests that the model’s performance is largely independent of the specific radiopharmaceutical used. Taken together, these comparisons suggest that our hybrid SPECT/CT radiomics model provides enhanced sensitivity and specificity for CA, independent of imaging protocols and tracers. The improved accuracy is likely attributable to the rich information captured by combining SPECT and CT features. Radiomics analysis extracts subtle patterns of tracer uptake heterogeneity in the SPECT data alongside texture and density features from the CT images. Each modality offers complementary clues: SPECT reflects the degree and distribution of amyloid-binding tracer activity, while CT encodes structural changes (e.g. myocardial thickening, fibrosis). Our SHAP analysis identified wavelet-transformed first-order and texture features as the most influential predictors, reflecting the distribution of pixel intensities within specific frequency bands. This highlights their significance in quantitative SPECT/CT radiomics and their ability to capture subtle pathophysiological information that escapes visual detection. Importantly, our model also demonstrated the ability to classify amyloid subtype. It distinguished ATTR from AL with high accuracy, even outperforming the CA vs. non-CA task. This likely reflects known tracer-binding biology: ATTR-amyloid avidly takes up bone-avid tracers, whereas AL-amyloid shows little or no uptake. In practice, Perugini Grade ≥2 uptake without monoclonal proteins virtually confirms ATTR-CA. Our radiomics model learned these distinctions automatically, capturing subtle texture features linked to tracer retention. Unlike prior AI tools focused only on detecting amyloid presence, our approach enables subtype differentiation-critical for guiding therapy, as ATTR and AL require fundamentally different treatments (stabilizer drugs vs. chemotherapy). These findings have important clinical implications. Early and accurate CA diagnosis is crucial because effective treatments now exist, especially for ATTR (e.g. tafamidis) and AL (chemotherapy, stem cell transplant). Our radiomics model could flag patients who might otherwise be missed by visual readout, enabling prompt intervention. For example, AI-enhanced scintigraphy might detect low-grade tracer uptake or atypical patterns, prompting further workup. By reducing equivocal results, the model may also decrease the need for invasive procedures like biopsy. Moreover, as many CA patients are initially misdiagnosed or diagnosed late, our approach holds promise for earlier detection. In sum, integrating such a model into clinical imaging could enhance confidence in non-invasive diagnosis, guide appropriate workup (e.g. CMR, genetic testing), and ultimately improve patient outcomes. This study has several limitations. (1) As a retrospective study, it is inherently prone to selection bias, which is difficult to avoid. (2) The sample size of this study is relatively small, and the results need to be validated in a multicenter study with a larger sample size. (3) Although we intentionally included data from three centers and multiple scanner types to improve generalizability, device-dependent variability in image texture and reconstruction could still influence performance. In particular, the relative scarcity of AL-CA cases in our training set may have introduced class imbalance, this could lead the model to favor ATTR-like patterns; (4) Like most imaging AI studies to date, our work relied on existing labeled data and did not include prospective validation. CONCLUSION This study establishes that ensemble ML model of SPECT/CT radiomics significantly outperforms conventional diagnostic metrics for CA detection, demonstrating multicenter robustness and clinically actionable calibration, supporting its value in early CA diagnosis and clinical decision-making. Statements & Declarations Fundings This work was funded by National Natural Science Foundation of China (No. 82472029 and 81901784 to M.Z.). Competing interests C.P.S. reports speaker and consulting fees from Pfizer. All other authors have no relationships relevant to the contents of this paper to disclose. Author Contributions Q.M and M.Z contributed to the study design. Material preparation, data collection and analysis were performed by Q.M, J.C, S.J, Y.Z, Y.X, C.L, C.Z and C.P.S. The first draft of the manuscript was written by Q.M and reviewed by R.C,K.C, M.H, X.L, W.Z and M.Z. All authors commented on previous versions of the manuscript. All authors read and approved the final manuscript. Data availability The data underlying this article will be shared on reasonable request to the corresponding author. Ethics approval This study was granted ethical approval by the institutional review boards of Xiangya Hospital, Central South University (No. 202310202), Fuwai Central China Cardiovascular Hospital (Ethics Review No. 202303), and the General Hospital of Vienna (EK1557/2020). It was carried out in accordance with the principles of the 1964 Declaration of Helsinki. Owing to the retrospective study design, the Institutional Review Boards of all participating institutions formally waived the requirement for informed consent. Data Availability The data underlying this article will be shared on reasonable request to the corresponding author. ACKNOWLEDGEMENTS This work was funded by National Natural Science Foundation of China (No. 82472029 and 81901784 to M.Z.). REFERENCES 1. ↵ Rubin J , Maurer MS . Cardiac Amyloidosis: Overlooked, Underappreciated, and Treatable . Annu Rev Med . 2020 ; 71 : 203 - 19 . doi: 10.1146/annurev-med-052918-020140 . OpenUrl CrossRef PubMed 2. ↵ Maurer MS , Elliott P , Comenzo R , Semigran M , Rapezzi C . Addressing Common Questions Encountered in the Diagnosis and Management of Cardiac Amyloidosis . Circulation . 2017 ; 135 : 1357 – 77 . doi: 10.1161/CIRCULATIONAHA.116.024438 . OpenUrl Abstract / FREE Full Text 3. ↵ Dorbala S , Ando Y , Bokhari S , Dispenzieri A , Falk RH , Ferrari VA , et al. ASNC/AHA/ASE/EANM/HFSA/ISA/SCMR/SNMMI Expert Consensus Recommendations for Multimodality Imaging in Cardiac Amyloidosis: Part 1 of 2-Evidence Base and Standardized Methods of Imaging . Circ Cardiovasc Imaging . 2021 ; 14 : e000029 . doi: 10.1161/HCI.0000000000000029 . OpenUrl CrossRef PubMed 4. ↵ Miller RJH , Shanbhag A , Michalowska AM , Kavanagh P , Liang JX , Builoff V , et al. Deep Learning-Enabled Quantification of (99m)Tc-Pyrophosphate SPECT/CT for Cardiac Amyloidosis . J Nucl Med . 2024 ; 65 : 1144 – 50 . doi: 10.2967/jnumed.124.267542 . OpenUrl Abstract / FREE Full Text 5. ↵ Bokhari S , Castano A , Pozniakoff T , Deslisle S , Latif F , Maurer MS . (99m)Tc-pyrophosphate scintigraphy for differentiating light-chain cardiac amyloidosis from the transthyretin-related familial and senile cardiac amyloidoses . Circ Cardiovasc Imaging . 2013 ; 6 : 195 – 201 . doi: 10.1161/CIRCIMAGING.112.000132 . OpenUrl Abstract / FREE Full Text 6. ↵ Hong Z , Spielvogel CP , Xue S , Calabretta R , Jiang Z , Yu J , et al. Enhanced diagnostic and prognostic assessment of cardiac amyloidosis using combined (11)C-PiB PET/CT and (99m)Tc-DPD scintigraphy . Eur J Nucl Med Mol Imaging . 2025 . doi: 10.1007/s00259-025-07157-7 . OpenUrl CrossRef 7. ↵ Shiri I , Balzer S , Baj G , Bernhard B , Hundertmark M , Bakula A , et al. Multi-modality artificial intelligence-based transthyretin amyloid cardiomyopathy detection in patients with severe aortic stenosis . Eur J Nucl Med Mol Imaging . 2025 ; 52 : 485 – 500 . doi: 10.1007/s00259-024-06922-4 . OpenUrl CrossRef PubMed 8. ↵ Delbarre MA , Girardon F , Roquette L , Blanc-Durand P , Hubaut MA , Hachulla E , et al. Deep Learning on Bone Scintigraphy to Detect Abnormal Cardiac Uptake at Risk of Cardiac Amyloidosis . JACC Cardiovasc Imaging . 2023 ; 16 : 1085 – 95 . doi: 10.1016/j.jcmg.2023.01.014 . OpenUrl CrossRef PubMed 9. ↵ Spielvogel CP , Haberl D , Mascherbauer K , Ning J , Kluge K , Traub-Weidinger T , et al. Diagnosis and prognosis of abnormal cardiac scintigraphy uptake suggestive of cardiac amyloidosis using artificial intelligence: a retrospective, international, multicentre, cross-tracer development and validation study . Lancet Digit Health . 2024 ; 6 : e251 – e60 . doi: 10.1016/S2589-7500(23)00265-0 . OpenUrl CrossRef 10. ↵ Gertz MA , Dispenzieri A . Systemic Amyloidosis Recognition, Prognosis, and Therapy: A Systematic Review . JAMA . 2020 ; 324 : 79 - 89 . doi: 10.1001/jama.2020.5493 . OpenUrl CrossRef PubMed 11. ↵ Garcia-Pavia P , Rapezzi C , Adler Y , Arad M , Basso C , Brucato A , et al. Diagnosis and treatment of cardiac amyloidosis: a position statement of the ESC Working Group on Myocardial and Pericardial Diseases . Eur Heart J . 2021 ; 42 : 1554 – 68 . doi: 10.1093/eurheartj/ehab072 . OpenUrl CrossRef PubMed 12. ↵ Pera O , Martinez A , Mohler C , Hamans B , Vega F , Barral F , et al. Clinical Validation of Siemens’ Syngo.via Automatic Contouring System . Adv Radiat Oncol . 2023 ; 8 : 101177 . doi: 10.1016/j.adro.2023.101177 . OpenUrl CrossRef 13. ↵ Zwanenburg A , Vallieres M , Abdalah MA , Aerts H , Andrearczyk V , Apte A , et al. The Image Biomarker Standardization Initiative: Standardized Quantitative Radiomics for High-Throughput Image-based Phenotyping . Radiology . 2020 ; 295 : 328 – 38 . doi: 10.1148/radiol.2020191145 . OpenUrl CrossRef PubMed 14. Liu Y , He C , Fang W , Peng L , Shi F , Xia Y , et al. Prediction of Ki-67 expression in gastrointestinal stromal tumors using radiomics of plain and multiphase contrast-enhanced CT . Eur Radiol . 2023 ; 33 : 7609 – 17 . doi: 10.1007/s00330-023-09727-5 . OpenUrl CrossRef PubMed 15. van Griethuysen JJM , Fedorov A , Parmar C , Hosny A , Aucoin N , Narayan V , et al. Computational Radiomics System to Decode the Radiographic Phenotype . Cancer Res . 2017 ; 77 : e104 – e7 . doi: 10.1158/0008-5472.CAN-17-0339 . OpenUrl Abstract / FREE Full Text 16. ↵ Bo Z , Chen B , Yang Y , Yao F , Mao Y , Yao J , et al. Machine learning radiomics to predict the early recurrence of intrahepatic cholangiocarcinoma after curative resection: A multicentre cohort study . Eur J Nucl Med Mol Imaging . 2023 ; 50 : 2501 – 13 . doi: 10.1007/s00259-023-06184-6 . OpenUrl CrossRef PubMed 17. ↵ Zhao S , Wang J , Jin C , Zhang X , Xue C , Zhou R , et al. Stacking Ensemble Learning-Based [(18)F]FDG PET Radiomics for Outcome Prediction in Diffuse Large B-Cell Lymphoma . J Nucl Med . 2023 ; 64 : 1603 – 9 . doi: 10.2967/jnumed.122.265244 . OpenUrl Abstract / FREE Full Text 18. ↵ Forouzannezhad P , Maes D , Hippe DS , Thammasorn P , Iranzad R , Han J , et al. Multitask Learning Radiomics on Longitudinal Imaging to Predict Survival Outcomes following Risk-Adaptive Chemoradiation for Non-Small Cell Lung Cancer . Cancers (Basel ). 2022 ; 14 . doi: 10.3390/cancers14051228 . OpenUrl CrossRef 19. ↵ Ali S , Akhlaq F , Imran AS , Kastrati Z , Daudpota SM , Moosa M . The enlightening role of explainable artificial intelligence in medical & healthcare domains: A systematic literature review . Comput Biol Med . 2023 ; 166 : 107555 . doi: 10.1016/j.compbiomed.2023.107555 . OpenUrl CrossRef 20. ↵ Vergaro G , Aimo A , Barison A , Genovesi D , Buda G , Passino C , et al. Keys to early diagnosis of cardiac amyloidosis: red flags from clinical, laboratory and imaging findings . Eur J Prev Cardiol . 2020 ; 27 : 1806 – 15 . doi: 10.1177/2047487319877708 . OpenUrl CrossRef PubMed 21. ↵ Rapezzi C , Aimo A , Serenelli M , Barison A , Vergaro G , Passino C , et al. Critical Comparison of Documents From Scientific Societies on Cardiac Amyloidosis: JACC State-of-the-Art Review . J Am Coll Cardiol . 2022 ; 79 : 1288 – 303 . doi: 10.1016/j.jacc.2022.01.036 . OpenUrl CrossRef PubMed 22. ↵ Damy T , Deux JF , Moutereau S , Guendouz S , Mohty D , Rappeneau S , et al. Role of natriuretic peptide to predict cardiac abnormalities in patients with hereditary transthyretin amyloidosis . Amyloid . 2013 ; 20 : 212 – 20 . doi: 10.3109/13506129.2013.825240 . OpenUrl CrossRef PubMed 23. Arana-Achaga X , Goena-Vives C , Villanueva-Benito I , Solla-Ruiz I , Rengel Jimenez A , Gaspar TI , et al. Development and Validation of a Prediction Model and Score for Transthyretin Cardiac Amyloidosis Diagnosis: T-Amylo . JACC Cardiovasc Imaging . 2023 ; 16 : 1567 – 80 . doi: 10.1016/j.jcmg.2023.05.002 . OpenUrl CrossRef PubMed 24. ↵ Vergaro G , Castiglione V , Aimo A , Prontera C , Masotti S , Musetti V , et al. N-terminal pro-B-type natriuretic peptide and high-sensitivity troponin T hold diagnostic value in cardiac amyloidosis . Eur J Heart Fail . 2023 ; 25 : 335 – 46 . doi: 10.1002/ejhf.2769 . OpenUrl CrossRef PubMed 25. ↵ Poterucha TJ , Elias P , Bokhari S , Einstein AJ , DeLuca A , Kinkhabwala M , et al. Diagnosing Transthyretin Cardiac Amyloidosis by Technetium Tc 99m Pyrophosphate: A Test in Evolution . JACC Cardiovasc Imaging . 2021 ; 14 : 1221 – 31 . doi: 10.1016/j.jcmg.2020.08.027 . OpenUrl CrossRef PubMed 26. ↵ Schockling EJ , Farrell MB , Embry-Dierson M , Warren J , Jerome S. Cardiac Amyloidosis Imaging, Part 2: Quantification and Technical Considerations . J Nucl Med Technol . 2023 ; 51 : 90 – 8 . doi: 10.2967/jnmt.123.265416 . OpenUrl Abstract / FREE Full Text 27. ↵ Meng Q , Zhao L , Sun X , Wang Y , Yu L , Schoepf UJ , et al. Development and validation of a radiomics model for detecting cardiac amyloidosis at coronary CT angiography . Eur Heart J Cardiovasc Imaging . 2025 . doi: 10.1093/ehjci/jeaf071 . OpenUrl CrossRef 28. ↵ Kamel MA , Abbas MT , Kanaan CN , Awad KA , Baba Ali N , Scalia IG , et al. How Artificial Intelligence Can Enhance the Diagnosis of Cardiac Amyloidosis: A Review of Recent Advances and Challenges . J Cardiovasc Dev Dis . 2024 ; 11 . doi: 10.3390/jcdd11040118 . OpenUrl CrossRef View the discussion thread. Back to top Previous Next Posted June 23, 2025. Download PDF Supplementary Material Data/Code Email Thank you for your interest in spreading the word about medRxiv. NOTE: Your email address is requested solely to identify you as the sender of this article. Your Email * Your Name * Send To * Enter multiple addresses on separate lines or separate them with commas. You are going to email the following Stacking Ensemble Learning-based Models Enabling Accurate Diagnosis of Cardiac Amyloidosis using SPECT/CT:an International and Multicentre Study Message Subject (Your Name) has forwarded a page to you from medRxiv Message Body (Your Name) thought you would like to see this page from the medRxiv website. Your Personal Message CAPTCHA This question is for testing whether or not you are a human visitor and to prevent automated spam submissions. Share Stacking Ensemble Learning-based Models Enabling Accurate Diagnosis of Cardiac Amyloidosis using SPECT/CT:an International and Multicentre Study Qu Mo , Jing Cui , Shengguo Jia , Ying Zhang , Yi Xiao , Caiguang Liu , Chunqing Zhou , Clemens P Spielvogel , Raffaella Calabretta , Weihua Zhou , Ke Cao , Marcus Hacker , Xiang Li , Min Zhao medRxiv 2025.06.22.25330039; doi: https://doi.org/10.1101/2025.06.22.25330039 Share This Article: Copy Citation Tools Stacking Ensemble Learning-based Models Enabling Accurate Diagnosis of Cardiac Amyloidosis using SPECT/CT:an International and Multicentre Study Qu Mo , Jing Cui , Shengguo Jia , Ying Zhang , Yi Xiao , Caiguang Liu , Chunqing Zhou , Clemens P Spielvogel , Raffaella Calabretta , Weihua Zhou , Ke Cao , Marcus Hacker , Xiang Li , Min Zhao medRxiv 2025.06.22.25330039; doi: https://doi.org/10.1101/2025.06.22.25330039 Citation Manager Formats BibTeX Bookends EasyBib EndNote (tagged) EndNote 8 (xml) Medlars Mendeley Papers RefWorks Tagged Ref Manager RIS Zotero Tweet Widget Facebook Like Google Plus One Subject Area Radiology and Imaging Subject Areas All Articles Addiction Medicine (568) Allergy and Immunology (863) Anesthesia (299) Cardiovascular Medicine (4425) Dentistry and Oral Medicine (443) Dermatology (382) Emergency Medicine (607) Endocrinology (including Diabetes Mellitus and Metabolic Disease) (1507) Epidemiology (15222) Forensic Medicine (30) Gastroenterology (1123) Genetic and Genomic Medicine (6589) Geriatric Medicine (667) Health Economics (997) Health Informatics (4524) Health Policy (1368) Health Systems and Quality Improvement (1612) Hematology (540) HIV/AIDS (1264) Infectious Diseases (except HIV/AIDS) (15910) Intensive Care and Critical Care Medicine (1103) Medical Education (623) Medical Ethics (145) Nephrology (667) Neurology (6588) Nursing (346) Nutrition (998) Obstetrics and Gynecology (1143) Occupational and Environmental Health (956) Oncology (3331) Ophthalmology (971) Orthopedics (369) Otolaryngology (420) Pain Medicine (435) Palliative Medicine (129) Pathology (663) Pediatrics (1690) Pharmacology and Therapeutics (691) Primary Care Research (710) Psychiatry and Clinical Psychology (5440) Public and Global Health (9221) Radiology and Imaging (2195) Rehabilitation Medicine and Physical Therapy (1369) Respiratory Medicine (1196) Rheumatology (593) Sexual and Reproductive Health (710) Sports Medicine (529) Surgery (710) Toxicology (99) Transplantation (289) Urology (265) (function(){function c(){var b=a.contentDocument||a.contentWindow.document;if(b){var d=b.createElement('script');d.innerHTML="window.__CF$cv$params={r:'9ffe2a80185e1b23',t:'MTc3OTQ3NzQ5OA=='};var a=document.createElement('script');a.src='/cdn-cgi/challenge-platform/scripts/jsd/main.js';document.getElementsByTagName('head')[0].appendChild(a);";b.getElementsByTagName('head')[0].appendChild(d)}}if(document.body){var a=document.createElement('iframe');a.height=1;a.width=1;a.style.position='absolute';a.style.top=0;a.style.left=0;a.style.border='none';a.style.visibility='hidden';document.body.appendChild(a);if('loading'!==document.readyState)c();else if(window.addEventListener)document.addEventListener('DOMContentLoaded',c);else{var e=document.onreadystatechange||function(){};document.onreadystatechange=function(b){e(b);'loading'!==document.readyState&&(document.onreadystatechange=e,c())}}}})();

Text is read by the "Ask this paper" AI Q&A widget below. Extraction quality varies by source — PMC NXML preserves structure cleanly, OA-HTML may include some navigation residue, and OA-PDF can have broken hyphenation. The publisher copy (via DOI) is the canonical version.

My notes (saved in your browser only)

Ask this paper AI returns verbatim quotes from the full text · source: preprint-html

Answers must be backed by verbatim quotes from this paper's full text. Hallucinated quotes are dropped automatically; if no verbatim passage answers the question, we say so. How this works

Citation neighborhood (no data yet)

We don't have any in-corpus citations linked to this paper yet. This is a recent paper (2025) — citers typically take a year or two to land, and the OpenAlex reference graph may still be filling in.

Source provenance

europepmc
last seen: 2026-05-20T01:45:00.602351+00:00
unpaywall
last seen: 2026-06-17T06:32:23.968882+00:00