Predicting future cognitive impairment in preclinical Alzheimer’s disease using multimodal imaging: a multisite machine learning study

doi:10.1101/2025.10.15.25337507

Predicting future cognitive impairment in preclinical Alzheimer’s disease using multimodal imaging: a multisite machine learning study

2025 · doi:10.1101/2025.10.15.25337507

preprint OA: closed

📄 Open PDF Full text JSON View at publisher

Full text 107,063 characters · extracted from preprint-html · click to expand

Predicting future cognitive impairment in preclinical Alzheimer’s disease using amyloid PET and MRI: a multisite machine learning study | medRxiv /* */ /* */ <!-- <!-- /*! * yepnope1.5.4 * (c) WTFPL, GPLv2 */ (function(a,b,c){function d(a){return"[object Function]"==o.call(a)}function e(a){return"string"==typeof a}function f(){}function g(a){return!a||"loaded"==a||"complete"==a||"uninitialized"==a}function h(){var a=p.shift();q=1,a?a.t?m(function(){("c"==a.t?B.injectCss:B.injectJs)(a.s,0,a.a,a.x,a.e,1)},0):(a(),h()):q=0}function i(a,c,d,e,f,i,j){function k(b){if(!o&&g(l.readyState)&&(u.r=o=1,!q&&h(),l.onload=l.onreadystatechange=null,b)){"img"!=a&&m(function(){t.removeChild(l)},50);for(var d in y[c])y[c].hasOwnProperty(d)&&y[c][d].onload()}}var j=j||B.errorTimeout,l=b.createElement(a),o=0,r=0,u={t:d,s:c,e:f,a:i,x:j};1===y[c]&&(r=1,y[c]=[]),"object"==a?l.data=c:(l.src=c,l.type=a),l.width=l.height="0",l.onerror=l.onload=l.onreadystatechange=function(){k.call(this,r)},p.splice(e,0,u),"img"!=a&&(r||2===y[c]?(t.insertBefore(l,s?null:n),m(k,j)):y[c].push(l))}function j(a,b,c,d,f){return q=0,b=b||"j",e(a)?i("c"==b?v:u,a,b,this.i++,c,d,f):(p.splice(this.i++,0,a),1==p.length&&h()),this}function k(){var a=B;return a.loader={load:j,i:0},a}var l=b.documentElement,m=a.setTimeout,n=b.getElementsByTagName("script")[0],o={}.toString,p=[],q=0,r="MozAppearance"in l.style,s=r&&!!b.createRange().compareNode,t=s?l:n.parentNode,l=a.opera&&"[object Opera]"==o.call(a.opera),l=!!b.attachEvent&&!l,u=r?"object":l?"script":"img",v=l?"script":u,w=Array.isArray||function(a){return"[object Array]"==o.call(a)},x=[],y={},z={timeout:function(a,b){return b.length&&(a.timeout=b[0]),a}},A,B;B=function(a){function b(a){var a=a.split("!"),b=x.length,c=a.pop(),d=a.length,c={url:c,origUrl:c,prefixes:a},e,f,g;for(f=0;f<d;f++)g=a[f].split("="),(e=z[g.shift()])&&(c=e(c,g));for(f=0;f<b;f++)c=x[f](c);return c}function g(a,e,f,g,h){var i=b(a),j=i.autoCallback;i.url.split(".").pop().split("?").shift(),i.bypass||(e&&(e=d(e)?e:e[a]||e[g]||e[a.split("/").pop().split("?")[0]]),i.instead?i.instead(a,e,f,g,h):(y[i.url]?i.noexec=!0:y[i.url]=1,f.load(i.url,i.forceCSS||!i.forceJS&&"css"==i.url.split(".").pop().split("?").shift()?"c":c,i.noexec,i.attrs,i.timeout),(d(e)||d(j))&&f.load(function(){k(),e&&e(i.origUrl,h,g),j&&j(i.origUrl,h,g),y[i.url]=2})))}function h(a,b){function c(a,c){if(a){if(e(a))c||(j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}),g(a,j,b,0,h);else if(Object(a)===a)for(n in m=function(){var b=0,c;for(c in a)a.hasOwnProperty(c)&&b++;return b}(),a)a.hasOwnProperty(n)&&(!c&&!--m&&(d(j)?j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}:j[n]=function(a){return function(){var b=[].slice.call(arguments);a&&a.apply(this,b),l()}}(k[n])),g(a[n],j,b,n,h))}else!c&&l()}var h=!!a.test,i=a.load||a.both,j=a.callback||f,k=j,l=a.complete||f,m,n;c(h?a.yep:a.nope,!!i),i&&c(i)}var i,j,l=this.yepnope.loader;if(e(a))g(a,0,l,0);else if(w(a))for(i=0;i (function(w,d,s,l,i){w[l]=w[l]||[];w[l].push({'gtm.start':new Date().getTime(),event:'gtm.js'});var f=d.getElementsByTagName(s)[0];var j=d.createElement(s);var dl=l!='dataLayer'?'&l='+l:'';j.src='//www.googletagmanager.com/gtm.js?id='+i+dl;j.type='text/javascript';j.async=true;f.parentNode.insertBefore(j,f);})(window,document,'script','dataLayer','GTM-P4HH5NV'); Skip to main content Home About Submit ALERTS / RSS Search for this keyword Advanced Search Predicting future cognitive impairment in preclinical Alzheimer’s disease using amyloid PET and MRI: a multisite machine learning study View ORCID Profile Braden Yang , View ORCID Profile Tom Earnest , View ORCID Profile Murat Bilgel , View ORCID Profile Marilyn S. Albert , View ORCID Profile Sterling C. Johnson , View ORCID Profile Christos Davatzikos , View ORCID Profile Guray Erus , View ORCID Profile Colin L. Masters , View ORCID Profile Susan M. Resnick , View ORCID Profile Michael I. Miller , View ORCID Profile Arnold Bakker , View ORCID Profile John C. Morris , View ORCID Profile Tammie L.S. Benzinger , View ORCID Profile Brian A. Gordon , View ORCID Profile Aristeidis Sotiras , the Alzheimer’s Disease Neuroimaging Initiative , the Preclinical Alzheimer’s Disease Consortium doi: https://doi.org/10.1101/2025.10.15.25337507 Braden Yang a Mallinckrodt Institute of Radiology, Washington University School of Medicine in St. Louis , St. Louis, MO, USA 63110 b Department of Radiology, Perelman School of Medicine, University of Pennsylvania , Philadelphia, PA, USA 19104 c 2 , Philadelphia, PA, USA 19104 Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Braden Yang For correspondence: b.y.yang{at}wustl.edu aristeidis.sotiras{at}pennmedicine.upenn.edu Tom Earnest a Mallinckrodt Institute of Radiology, Washington University School of Medicine in St. Louis , St. Louis, MO, USA 63110 Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Tom Earnest Murat Bilgel d Laboratory of Behavioral Neuroscience, National Institute on Aging Intramural Research Program, National Institutes of Health , Baltimore, MD, USA 21224 Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Murat Bilgel Marilyn S. Albert e Department of Neurology, Johns Hopkins University School of Medicine , Baltimore, MD, USA 21205 Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Marilyn S. Albert Sterling C. Johnson f Wisconsin Alzheimer’s Disease Research Center, University of Wisconsin-Madison School of Medicine and Public Health , Madison, WI, USA 53726 Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Sterling C. Johnson Christos Davatzikos c 2 , Philadelphia, PA, USA 19104 Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Christos Davatzikos Guray Erus c 2 , Philadelphia, PA, USA 19104 Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Guray Erus Colin L. Masters g Florey Institute of Neuroscience and Mental Health , Parkville, VIC, Australia 3052 Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Colin L. Masters Susan M. Resnick d Laboratory of Behavioral Neuroscience, National Institute on Aging Intramural Research Program, National Institutes of Health , Baltimore, MD, USA 21224 Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Susan M. Resnick Michael I. Miller h Center of Imaging Science and Department of Biomedical Engineering, Johns Hopkins University , Baltimore, Maryland, USA 21218 Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Michael I. Miller Arnold Bakker i Department of Psychiatry and Behavioral Sciences, Johns Hopkins University School of Medicine , Baltimore, MD, USA 21205 e Department of Neurology, Johns Hopkins University School of Medicine , Baltimore, MD, USA 21205 Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Arnold Bakker John C. Morris j Department of Neurology, Washington University School of Medicine in St. Louis , St. Louis, MO, USA 63110 Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for John C. Morris Tammie L.S. Benzinger a Mallinckrodt Institute of Radiology, Washington University School of Medicine in St. Louis , St. Louis, MO, USA 63110 Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Tammie L.S. Benzinger Brian A. Gordon a Mallinckrodt Institute of Radiology, Washington University School of Medicine in St. Louis , St. Louis, MO, USA 63110 Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Brian A. Gordon Aristeidis Sotiras a Mallinckrodt Institute of Radiology, Washington University School of Medicine in St. Louis , St. Louis, MO, USA 63110 b Department of Radiology, Perelman School of Medicine, University of Pennsylvania , Philadelphia, PA, USA 19104 c 2 , Philadelphia, PA, USA 19104 k Institute for Informatics, Data Science and Biostatistics, Washington University School of Medicine in St. Louis , St. Louis, MO, USA 63110 Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Aristeidis Sotiras For correspondence: b.y.yang{at}wustl.edu aristeidis.sotiras{at}pennmedicine.upenn.edu Abstract Full Text Info/History Metrics Supplementary material Data/Code Preview PDF Abstract Predicting the likelihood of developing Alzheimer’s disease (AD) dementia in at-risk individuals is important for the design of and optimal recruitment for clinical trials of disease-modifying therapies. Machine learning (ML) has been shown to excel in this task; however, there remains a lack of models developed specifically for the preclinical AD population, who display early signs of abnormal brain amyloidosis but remain cognitively unimpaired. Here, we trained and evaluated ML classifiers to predict whether individuals with preclinical AD will progress to mild cognitive impairment or dementia within multiple fixed time windows, ranging from one to five years. Models were trained on regional imaging features extracted from amyloid positron emission tomography and magnetic resonance imaging pooled across seven independent sites and from two amyloid radiotracers ([ 18 F]-florbetapir and [ 11 C]-Pittsburgh-compound-B). Out-of-sample generalizability was evaluated via a leave-one-site-out and leave-one-tracer-out cross-validation. Classifiers achieved an out-of-sample receiver operating characteristic area-under-the-curve of 0.66 or greater when applied to all except one hold-out sites and 0.72 or greater when applied to each hold-out radiotracer. Additionally, when applying our models in a retroactive cohort enrichment analysis on A4 clinical trial data, we observed increased statistical power of detecting differences in amyloid accumulation between placebo and treatment arms after enrichment by ML stratifications. As emerging investigations of new disease-modifying therapies for AD increasingly focus on asymptomatic, preclinical populations, our findings underscore the potential applicability of ML-based patient stratification for recruiting more homogeneous cohorts and improving statistical power for detecting treatment effects for future clinical trials. Highlights Machine learning can predict future cognitive impairment in preclinical Alzheimer’s Models achieved high out-of-sample ROC-AUC on external sites and PET tracers Models were able to distinguish cognitively stable from decliners in the A4 cohort ML cohort enrichment enhanced secondary treatment effect detection in the A4 cohort 1 Introduction Alzheimer’s disease (AD) is a progressive neurodegenerative disease marked by the accumulation of amyloid-β plaques and tau neurofibrillary tangles in the brain, which leads to neuronal cell death and eventual development of cognitive deficits such as short-term memory loss, impairments in orientation, or difficulty with written and verbal communication. According to current models of the AD pathogenesis timeline, accumulation of these pathologies typically begin years before the onset of clinically-measurable symptoms ( Jack and Holtzman, 2013 ; Jack Jr. et al., 2024 ). Thus, clinical trials of AD treatments have largely focused on disease-modifying therapies, which target these pathologies in the hopes of altering the biological course of the disease and slowing or even preventing the progression of clinical symptoms ( Dyck et al., 2023 ; Sims et al., 2023 ). Yet to date, there have only been a handful of approved disease-modifying therapies, with the rest failing to demonstrate a significant treatment effect ( Kim et al., 2022 ). A potential reason for this high failure rate is that recruited participants may have been at too advanced of a disease stage for treatments to meaningfully alter its progression ( Sperling et al., 2014 ), with the majority of previously conducted trials primarily recruiting individuals who already displayed objective cognitive impairment ( Huang et al., 2020 ; Sims et al., 2023 ; Swanson et al., 2021 ). In response, newly emerging trials have transitioned to targeting preclinical AD, where patients exhibit abnormal brain amyloidosis while showing no signs of cognitive impairment. Furthermore, failures may have also been attributed to high heterogeneity in the phenotypic expression of the disease, particularly in the rates of cognitive decline over time. This heterogeneity potentially leads to differential responses to administered therapies, which may negatively impact the estimation of treatment effects ( Jutten et al., 2021 ). To mitigate this issue, stratification models for distinguishing fast-cognitive decliners from slow or non-decliners are commonly employed in AD clinical trials. These models enable cohort enrichment by identifying and selectively enrolling candidates who are most likely to benefit from disease-modifying therapies in order to increase the likelihood of observing a potential treatment effect ( Ballard et al., 2019 ; Wolz et al., 2016 ). Additionally, biased allocation of fast-decliners and slow-decliners into control and treatment groups may lead to overestimation or underestimation of a potential treatment effect. Proper stratification of clinical trial participants ensures that an equal distribution of fast-to-slow decliners are allocated into each trial arm and may aid in reducing uncertainties in treatment effect estimation, on top of reducing the required sample size and cost of running a trial ( Wang et al., 2024 ). Previous trials have used single risk assessments such as neuropsychological testing and quantitative amyloid and tau measurements from positron emission tomography (PET) to stratify participants into high and low risk groups ( Abdelnour et al., 2022 ; Sims et al., 2023 ; Swanson et al., 2021 ). However, recent evidence has suggested that data-driven stratification models built on machine learning (ML) can outperform single risk factor stratification in enhancing clinical trial operations ( Birkenbihl et al., 2024 ; Gladstein et al., 2025 ; Nallapu et al., 2025 ; Tam et al., 2022 ; Wang et al., 2024 ). By leveraging information across multiple data modalities such as imaging, genetics and cognitive assessments, ML models can learn complex patterns within these multiple modalities to provide more accurate stratifications. These stratifications may be used to guide a more optimized cohort enrichment, leading to increased power of detect hypothetical treatment effects ( Nallapu et al., 2025 ), reduction in random allocation bias ( Wang et al., 2024 ), and reduction in the sample size required to observe a treatment effect ( Birkenbihl et al., 2024 ; Gladstein et al., 2025 ; Tam et al., 2022 ). Among data modalities commonly used for stratification, medical imaging data like PET and magnetic resonance imaging (MRI) are particularly useful for probing the topographical distribution of core and associated AD pathologies in the brain ( Jack Jr. et al., 2024 ), which have been shown to be highly discriminative of cognitive decliners from non-decliners ( Mathotaarachchi et al., 2017 ; Pascoal et al., 2020 ; Pfeil et al., 2021 ). Despite recent progress in developing ML models for this application, previous literature has predominantly focused on individuals who already exhibit cognitive deficits in the form of mild cognitive impairment (MCI) ( Ezzati et al., 2021 ; Samper-González et al., 2018 ), with many studies only training on features extracted from structural MRI ( Basaia et al., 2019 ; Mathotaarachchi et al., 2017 ; Misra et al., 2009 ). Efforts have been made to develop models for the cognitively unimpaired (CU) population that also incorporate amyloid PET, but most have either imposed a single time-to-progression window ( Choi et al., 2024 ; Dansson et al., 2021 ; Pfeil et al., 2021 ) or don’t ensure the presence of amyloid pathology in their CU cohorts ( Karaman et al., 2022 ). Additionally, with trials routinely involving large consortiums of institutions, each utilizing a different set of data acquisition protocols and scanner models, this introduces site-specific biases in the collected data which may negatively affect the ability of models to generalize on out-of-sample data. Furthermore, disparities in the pharmacokinetics and binding properties of different PET radiotracers lead to significant biases in quantitative amyloid PET measurements ( Landau et al., 2014 ; Su et al., 2019 ; Villemagne et al., 2012 ). For these reasons, a rigorous evaluation of ML generalizability to external sites and different amyloid PET radiotracers is needed. Motivated by these gaps, the current study seeks to develop and evaluate ML classifiers to predict future cognitive decline in asymptomatic, preclinical AD patients. We trained support vector machines (SVM) on regional imaging features extracted from amyloid PET and structural MRI to perform binary classification of whether an individual will develop cognitive deficits within multiple follow-up times, ranging from one year to five years. We obtained data from seven independent sites and two amyloid PET radiotracers and estimated the out-of-sample performance of trained models via leave-one-site-out and leave-one-tracer-out cross-validation. Lastly, to gauge the benefit of applying these models in a clinical trial setting, we utilized data from the Anti-Amyloid Treatment in Asymptomatic Alzheimer’s (A4) study ( Sperling et al., 2023 ) to estimate the change in statistical power to detect treatment effects after retroactive cohort enrichment using our models’ predictions. 2 Materials and methods 2.1 Participants and data Participants and their respective data were obtained from the following independent studies and consortia – the A4 study ( Sperling et al., 2023 ), the Alzheimer’s Disease Neuroimaging Initiative (ADNI), the Harvard Aging Brain Study (HABS) ( Dagley et al., 2017 ), the Mayo Clinic Study of Aging (MCSA) ( Roberts et al., 2008 ), the Open Access Series of Imaging Studies 3 (OASIS) ( LaMontagne et al., 2019 ), and the Preclinical Alzheimer’s Disease Consortium (PAC). ADNI, launched in 2003 as a public-private partnership and led by Principal Investigator Michael W. Weiner, MD, has aimed to test whether serial MRI, PET, other biological markers, and clinical and neuropsychological assessment can be combined to measure the progression of MCI and early AD. PAC is a consortium comprising five AD-focused datasets – the Adult Children Study (ACS) ( Coats and Morris, 2005 ; Price and Morris, 1999 ), the Australian Imaging Biomarkers and Lifestyle (AIBL) study ( Fowler et al., 2021 ), the Biomarkers of Cognitive Decline Among Normal Individuals (BIOCARD) study ( Albert et al., 2014 ), the Baltimore Longitudinal Study of Aging (BLSA) ( Resnick et al., 2000 ), and the Wisconsin Registry for Alzheimer’s Prevention (WRAP) ( Johnson et al., 2018 ). All participants provided informed consent to participate in their respective studies in accordance with the Declaration of Helsinki, and ethics approvals were obtained by each site’s respective institutional review board. From the A4 study, only participants from the placebo arm of the clinical trial or from the Longitudinal Evaluation of Amyloid Risk and Neurodegeneration (LEARN) study were used to train the ML models. Participants from the Solanezumab treatment arm were excluded from training and were only used as an additional evaluation set (detailed in section 2.4 A4 trial analyses ). Additionally, we omitted ACS from our analyses since this dataset had significant participant overlap with OASIS. All participants with available [ 18 F]-florbetapir (FBP) or [ 11 C]-Pittsburgh-compound-B (PiB) amyloid PET imaging were selected. We restricted these scans to be amyloid-positive, defined as having a mean cortical amyloid PET signal of greater than a threshold value. We used the dataset-specific definition of the summary cortical region mask and cutoff signal that was optimally determined for each dataset. Further details on how amyloid positivity was determined for each site can be found in the Supplementary Methods. All scans were matched with an accompanying structural T1-weighted MRI scan within one year of the PET acquisition date. Baseline age, sex and APOE4 carriership were selected as additional predictors. We used the global Clinical Dementia Rating ® (CDR ® ) ( Morris, 1997 ), which rates an individual’s cognitive performance in six domains (memory, orientation, judgment and problem solving, community affairs, home and hobbies, and personal care), as a measure of overall dementia severity. All PET scans were matched to a global CDR assessment within one year of the PET acquisition date. Participants who were missing any matching data were excluded from further analyses. The analysis was restricted to participants who were CU at the time of the amyloid PET scan, defined as a global CDR score of zero. We labeled participants as stable if they remained CU for at least five years from the time of the amyloid PET, and as progressor if they converted to a global CDR of greater than zero within a follow-up time that varied from one to five years. Progressors who reverted to CU were excluded. Additionally, stables who did not have a follow-up CDR of zero at least five years from the time of the amyloid PET were excluded. We observed a larger proportion of stable individuals compared to progressors; to reduce class imbalance, we imposed the five-year stability criterion on the stable cohort to obtain the most homogeneous group of participants, with presumably the least amount of pathology, to represent our control group. PAC did not provide CDR scores; we instead used the clinical diagnoses in place of CDR, with a diagnosis of either MCI or dementia being equivalent to CDR>0. In total, 343 stable and 247 progressor participants across seven sites (A4, ADNI, AIBL, BLSA, HABS, MCSA, OASIS) were selected for this study. We excluded BIOCARD and WRAP from our analyses due to too few participants meeting the selection criteria. Participant counts after exclusions are illustrated in Supplementary Fig. 1. 2.2 Image acquisition and processing All scans underwent a standard PET-MRI processing pipeline consisting of segmentation of the MRI into regions-of-interest (ROI) and derivation of regional amyloid standardized uptake value ratios (SUVR) from the amyloid PET. Each participant’s T1-weighted MRI was preprocessed using a fully automated pipeline which included N4 bias correction ( Tustison et al., 2010 ), skull stripping, and segmentation into 145 cortical and subcortical ROI using Multi-atlas region Segmentation utilizing Ensembles of registration algorithms and parameters (MUSE) ( Doshi et al., 2016 ). Manual quality checks were performed on the outputs to ensure correctness of segmentations. We selected 125 relevant ROI and extracted their volumes, normalized by the total intracranial volume, to be used as the volumetric input features of our model. FBP and PiB PET scans were downloaded either in a frame-averaged, smoothed and uniform resolution format (ADNI only) or as the full dynamic scan (all other datasets). For dynamic scans, we selected frames within the 50-70 minute window post-tracer injection for FBP and the 40-60 minute window for PiB. All frames were realigned to remove patient motion, averaged, and coregistered to the T1 image using FSL FLIRT rigid body registration ( Smith et al., 2004 ). Additionally, we performed an iterative smoothing operation by applying a Gaussian smoothing kernel with progressively increasing full width at half maximum until a target resolution was reached (estimated using AFNI’s 3dFWHMx tool). The target resolution was set to the 3dFWHMx -estimated resolution of ADNI frame-averaged scans, which was found to be approximately 10mm isotropic. After smoothing, the PET image was converted to an SUVR image by dividing each voxel by the average signal of the left and right cerebellar gray matter regions. Finally, the MRI-to-PET transformation was applied to the anatomical MUSE ROI labels to sample them to native PET space, and regional SUVRs were computed by averaging the SUVR image over each ROI. For ADNI scans, we only performed coregistration to the T1, SUVR image computation and derivation of regional SUVRs. Manual quality checks were performed to ensure correctness of the frame alignment, PET-MRI coregistration and SUVR computation steps. Of the 145 total ROI, we selected 114 cortical and subcortical gray matter regions to be used as the amyloid input features of our model. The full list of ROIs used in this study are listed in Supplementary Table 1. 2.3 Model development and evaluation 2.3.1 Training The overview of the study is illustrated in Figure 1 . We trained SVM binary classifiers with linear kernel to predict whether an individual will progress to CDR greater than zero using baseline amyloid PET SUVR, volumetric and non-imaging (i.e., age, sex, APOE4 ) features. We chose to train SVM classifiers since it has been widely used and extensively validated for AD diagnosis classification and prediction of future cognitive decline ( Rathore et al., 2017 ). To account for imbalances in class frequency, we employed class-balanced weighting in which misclassifications of the minority class (progressor class in most cases) were more heavily penalized during optimization. Five separate time-to-progression models were trained independently of one another to predict progressor status, with the time window varied between one and five years. For example, the three-year model predicts if an individual will progress to a CDR of greater than zero within three years from baseline. Note that each selected time-to-progression would result in a different set of progressor participants. However, we used the same set of stable participants who remained CU for at least five years as the control group in all five models. Download figure Open in new tab Figure 1. Overview of the study. Analyses were split into model development and evaluation ( a-c ) and A4 trial analyses ( d-e ). (a) Amyloid PET regional SUVRs, MRI regional volumes, and non-imaging features (age, sex, APOE-ε4) were inputted to train support vector machine classifiers to distinguish preclinical AD stables from progressors, where stables are individuals who remain CDR=0 for at least five years from baseline and progressors are individuals who convert to CDR>0 within a specified time window. (b) To evaluate model generalizability to unseen data, models were trained on all but one site or one tracer and tested on the hold-out site or tracer. (c) To estimate relative importance of feature modalities, nested models were trained on a subset of features and classification performance was compared to the model trained on the full feature set. To obtain individual feature-level importance, linear SVM weights were transformed using the data covariance matrix. (d) The SVM classifier trained on all sites except A4 was applied to the A4 cohort to predict progressor status. Only predicted progressors were retained to retroactively enrich the cohort. (e) To gauge the benefit of machine learning cohort enrichment, differences in PACC and global amyloid SUVR were tested between placebo and treatment arms post-enrichment. Abbreviations . CDR: Clinical Dementia Rating, PACC: Preclinical Alzheimer’s Cognitive Composite, SUVR: standardized uptake value ratio, SVM: support vector machine. 2.3.2 Cross-validation We employed a leave-one-site-out and leave-one-tracer-out cross-validation framework, in which data from one site or from one PET tracer were held out for independent testing, while the remaining data were used for training. Along with five times-to-progression, this resulted in 45 total models. All continuous features were z-scored using the standard deviation of only the CU-stable participants of the training fold, which was shown to enhance separation between linearly separable groups ( Linn et al., 2016 ). A grid search with five-fold cross-validation was conducted using the training fold to determine the optimal value of hyperparameter C, which regulates how strongly misclassifications impact the SVM optimization. We optimized hyperparameter C independently for each of our 45 models. To evaluate model performance on the leave-out test set, the receiver operating characteristic area-under-the-curve (ROC-AUC), accuracy, balanced accuracy, F1 score, sensitivity, specificity, positive predictive value (PPV) and negative predictive value (NPV) were reported. 2.3.3 Centiloid sensitivity analysis To address biases in amyloid PET SUVRs due to the inclusion of multiple tracers, we performed a sensitivity analysis where we harmonized regional SUVRs into regional Centiloids before inputting as features to the SVM classifier. The Centiloid scale is a method of linearly transforming raw amyloid PET SUVRs into a scale that is standardized across different tracers ( Klunk et al., 2015 ). We utilized the conversion equations that were uniquely calibrated to each site to convert SUVRs to Centiloid, then retrained our models with Centiloids as the amyloid PET features. Equations were only available for A4, ADNI, MCSA and OASIS, so we included only these sites in the sensitivity analysis. The DeLong test was used to compare ROC-AUC between models utilizing regional Centiloids versus regional SUVRs. Bonferroni correction was applied to p-values to adjust for multiple comparisons. 2.3.4 Feature importance We assessed the relative importance of each input feature for influencing the classification task via two methods. First, to estimate the relative importance of each modality of input feature (amyloid PET SUVR, MRI volume, or non-imaging features), we trained nested models wherein a reduced subset of modalities was used as input. We then computed the change in ROC-AUC on the hold-out test set relative to the full model as a measure of the relative contribution of that modality to the prediction. The DeLong test with Bonferroni correction for multiple comparisons was performed to test for statistical significance of ROC-AUC differences. Secondly, to derive a feature-level measure of the strength of association between each input feature and the progressor class, we computed the covariance-corrected linear SVM weights of the full model, as proposed by Haufe et al. (2014) . This approach transforms classifier weights into interpretable estimates of the feature-level association with the progressor class, with high positive values indicating positive association, high negative values indicating negative association, and values close to zero indicating little to no association. A major advantage of this is that feature importance estimates are less prone to artificial distortion caused by collinearity of features, unlike impurity-based metrics for models such as random forest ( Strobl et al., 2008 ). For each classifier, we applied this method to estimate importance values of each input feature, and we averaged the values across all 45 classifiers to derive an overall feature importance. Additionally, to gauge how the magnitude of feature importance varies in relation to the time-to-progression, we estimated the slope of the absolute value of feature importance versus time-to-progression via an ordinary least squares linear regression. 2.4 A4 trial analyses To further validate trained SVM classifiers, we performed three analyses using the extended A4 study cohort as the external testing set. This extended cohort consisted of participants in the placebo arm and participants treated with Solanezumab, an immunoglobulin monoclonal antibody designed to increase amyloid clearance in the brain. Firstly, we applied the classifier trained on all datasets except A4 to classify A4 participants into stables and progressors using imaging acquired during the screening phase of the trial. We then compared the Preclinical Alzheimer’s Cognitive Composite (PACC), a composite score which has been shown to better track early AD-related cognitive changes ( Donohue et al., 2014 ), between predicted stables and progressors. Mirroring previous work ( Donohue et al., 2023 ; Sperling et al., 2023 ), we fitted a natural cubic spline model on longitudinal PACC scores as the target variable, using continuous time-from-baseline as the independent variable and baseline age, years of education, APOE4 carriership, PACC test version administered, and baseline FBP SUVR of a cortical composite region as covariates. We then estimated a model-adjusted mean PACC score and 95% confidence interval at the 240-week follow-up point (corresponding to the end of the placebo controlled study period) and compared the estimates derived for predicted stables versus predicted progressors using a two-sample t-test. This analysis was independently performed within the placebo and Solanezumab arms. Secondly, we applied the SVM classifications to conduct retroactive enrichment wherein we restricted the cohort to only include predicted progressors. We then tested for treatment effects post-enrichment in the primary endpoint (model-adjusted PACC) and a secondary endpoint (change in amyloid PET SUVR). For the primary endpoint, we fitted the same natural cubic spline model with covariates on the longitudinal PACC scores of the enriched placebo and treatment cohorts. Model-adjusted means and 95% confidence intervals of PACC at the 240-week follow-up point were estimated and compared between placebo and Solanezumab arms using a two-sample t-test. For the secondary endpoint, we computed the change in FBP cortical SUVR from baseline to the 240-week follow-up point and used this metric as the target variable. An analysis of covariance (ANCOVA) was fitted to compare the mean change in SUVR between placebo and Solanezumab arms, controlling for baseline age, APOE4 carriership and baseline SUVR as covariates. Lastly, we performed a bootstrap analysis to estimate the statistical power of detecting a difference in the change in FBP cortical SUVR between baseline and 240-weeks, testing different sample sizes and sampling populations (i.e. enriched vs. unenriched). Here, we focused only on the secondary endpoint rather than the PACC primary endpoint since no statistically significant treatment effect was reported for the primary endpoint in the original A4 study. For a fixed sample size n , we randomly selected n participants each from the placebo and Solanezumab arms. The pool of participants to select from was either the full, unenriched cohort or the ML-enriched cohort. We then reran the ANCOVA as conducted previously to test for significant differences in the adjusted change in SUVR between the randomly selected cohorts. We repeated this procedure 1000 times. Power was estimated as the percentage of significant findings across all 1000 iterations. Samples sizes per trial cohort were varied from 10 to 80 in increments of 10. 3 Results 3.1 Cohort characteristics Table 1 summarizes the cohort characteristics of each site and of the pooled data; p-values were derived from two-sample t-tests for all continuous variables and Fisher’s exact test for all categorical variables. Across all sites, progressors were older on average (75.9 ± 6.4) than stables (72.4 ± 5.6, p 0.05 ). Progressors had a mean time to progression of 2.4 ± 1.3 years and stables remained CU for an average of 7.1 ± 1.6 years. Stables were scanned with a roughly equal proportion of FBP to PiB radiotracer, whereas progressors were more often scanned with FBP (60%). Within individual sites, only age in the A4 cohort displayed a statistically significant difference between stables and progressors across all demographics reported ( p < 0.001 ). View this table: View inline View popup Download powerpoint Table 1. Cohort characteristics of stables and progressors from all individual sites and the pooled dataset. 3.2 Model evaluation We evaluated the external site generalizability of the SVM classifier using leave-one-site-out cross-validation. The classifier generalized well to most leave-out sites and times-to-progression, achieving an ROC-AUC of 0.66 or greater, with a majority exceeding 0.75 or above ( Figure 2 , Table 2 ). The exception was HABS, for which the ROC-AUC fell below 0.50. We also computed aggregate binary classification metrics by combining the out-of-sample predictions of every model on their respective leave-out site and comparing them to the combined ground truth labels from all sites ( Table 2 ). Classifiers achieved an aggregate accuracy of >0.69 and balanced accuracy of >0.58. Classifiers were also highly specific (>0.74) and had high negative predictive value (>0.74). While models also achieved relatively high sensitivity, PPV and F1 score, these metrics were particularly sensitive to time-to-progression. Notably, smaller times-to-progression resulted in poorer sensitivity, PPV and F1 score, likely due to the fact that classifiers were trained on a fewer number of positive cases and were prone to overfitting to the control cases. Classifiers trained on higher times-to-progression exhibited a better balance between sensitivity/PPV to specificity/NPV. Download figure Open in new tab Figure 2. Receiver operating characteristic curves of SVM classifiers trained on each of five times-to-progression. Curves were obtained by applying each trained model to data from its respective hold-out group. Solid lines represent leave-out sites and dotted lines represent leave-out tracers. Across all times-to-progression, SVM classifiers achieved area-under-the-curve of 0.66 or greater in all leave-out sites except for HABS and 0.72 or greater in both leave-out tracers. View this table: View inline View popup Download powerpoint Table 2. Evaluation metrics of SVM classifiers of all five times-to-progression, tested on each site and tracer as the independent testing set. We additionally performed leave-one-tracer-out validation to assess the generalizability of the SVM classifier to unseen tracers. The classifier achieved ROC-AUC of >0.72 across all times-to-progression for both leave-out tracers ( Table 2 ). However, the model trained on PiB and tested on FBP had a low sensitivity and high specificity while the opposite was true for the model trained on FBP and tested on PiB. This may reflect bias in regional SUVRs between FBP and PiB tracers. To address this, we retrained the classifiers using Centiloid-harmonized regional amyloid PET SUVRs and reported the resulting changes in performance (Supplementary Table 2). After harmonization, models achieved a better balance of sensitivity to specificity for both leave-out tracers: sensitivity increased when testing on FBP, and specificity increased when testing on PiB. This was also accompanied by increased aggregate balanced accuracy across all times-to-progression. ROC-AUC was slightly decreased in some cases, but none of these changes were statistically significant via the DeLong test ( p > 0.05 ). 3.3 Feature importance The performances of nested models on each hold-out site are shown in Figure 3 and Supplementary Table 3. When amyloid PET was omitted from the input set, decreases of up to 0.223 in ROC-AUC were observed particularly at time windows of three years or greater (with the exception of A4), although these differences were not statistically significant ( p > 0.05 ). Download figure Open in new tab Figure 3. Difference in hold-out ROC-AUC of nested models relative to the full model trained on all feature modalities. Dotted lines represent imaging models that omit non-imaging features. In many hold-old sites, omission of amyloid PET features (red) at high times-to-progression led to a decrease in ROC-AUC compared to the full model. Omission of volumetric features (blue) resulted in less consistent trends. Except for BLSA and HABS, the non-imaging only model (purple) performs worse than the full model for nearly all times-to-progression. Omission of non-imaging features (green) led to nearly identical performance compared to the full model. When MRI volumetric features were omitted from the input set, we observed less consistent trends across leave-out sites. For some sites such as A4 and OASIS, slight decreases in ROC-AUC were observed, whereas for other sites such as ADNI and HABS slight increases were observed. All differences were not statistically significant ( p > 0.05 ). In many cases, the reduction of model generalizability when amyloid features were omitted was greater than when volumetric features were omitted, especially at later time windows, suggesting a higher relative importance of amyloid PET in these tasks. In all leave-out sites except for BLSA and HABS, the non-imaging only model consistently performed worse than the model integrating features from both imaging modalities, with the difference in ROC-AUC of the one-year model on MCSA being statistically significant ( p < 0.05 ). Finally, omission of non-imaging features led to nearly identical performance compared to the full model. The average importance of each input feature across all trained models is visualized in Figure 4 and Supplementary Fig. 2. For amyloid SUVR features, widespread contributions for predicting the progressor class were observed throughout the cortex, with bilateral inferior and middle temporal gyri exhibiting the strongest mean importance, followed by middle frontal, superior frontal and middle occipital gyri. In contrast, subcortical amyloid SUVR generally had much lower importance. For volumetric features, bilateral inferior lateral ventricular volumes had the highest absolute value of feature importance out of all features (including amyloid SUVR and non-imaging variables). This was followed by lateral ventricle, amygdala and hippocampus volume. Ventricular volumes all had positive importance values, whereas all other volumetric features had negative importances. Among the three non-imaging features, baseline age was most strongly associated with the progressor class. Neither sex nor APOE4 carriership showed strong associations. Download figure Open in new tab Figure 4. Covariance-corrected linear SVM weights per amyloid SUVR ( a ), volumetric ( b ), and non-imaging ( c ) feature. The values shown are the mean importance across all 45 trained models. The ten features with the highest magnitude of mean importance within each imaging modality are shown on the left. Among amyloid SUVR features, temporal, middle & superior frontal and middle occipital gyri had the highest magnitude mean importance. Among volumetric features, lateral ventricle, hippocampus and amygdala had the highest magnitude mean importance. Age was the only non-imaging feature with a high mean importance. Abbreviations. Inf Lat Vent: inferior lateral ventricle, ITG: inferior temporal gyrus, MFG: middle frontal gyrus, MOG: middle occipital gyrus, MTG: middle temporal gyrus, SFG: superior frontal gyrus, STG: superior temporal gyrus We also estimated the rate-of-change of the absolute value of feature importance versus the time-to-progression via a linear regression (Supplementary Fig. 3 & 4). For amyloid SUVR features, regions in the orbitofrontal, temporal and occipital cortices had the highest rate of increase in importance as the time-to-progression window grew. Among volumetric regions, the right lateral inferior ventricles, right frontal operculum and bilateral posterior cingulate gyri had the highest rate of increase. Age had a modest rate of increase, while sex and APOE4 did not show substantial change. Amyloid SUVR features displayed much greater rates-of-change in feature importance compared to either volumetric features or non-imaging features, suggesting that their influence on model outputs becomes more pronounced as the time-to-progression window expands to capture earlier disease progression. This was also consistent with the trends observed in the nested model analysis. 3.4 A4 trial analysis We conducted retroactive analyses on the A4 clinical trial dataset to further validate our SVM classifiers and demonstrate their potential benefit for clinical trial cohort enrichment. Table 3 summarizes the characteristics of the unenriched A4 cohort and the retroactively enriched cohorts using each of our five time-to-progression models. In both placebo and Solanezumab arms, significant differences between the unenriched and enriched cohorts were observed in baseline age, baseline cortical FBP SUVR (except for the one-year progressors of the Solanezumab arm) and baseline PACC (except for the three-year progressors of the placebo arm) ( p < 0.05 ). A lower percentage of females were selected for the enriched cohort in both trial arms compared to the unenriched cohort; this difference was only significant for the one-year progressors ( p 0.05 ). View this table: View inline View popup Download powerpoint Table 3. Cohort characteristics of the placebo and Solanezumab treatment arms of the A4 study. The original, unenriched cohort and ML-enriched cohorts are shown. To validate that the SVM classifier accurately distinguish cognitive stables from decliners, we fitted a natural cubic spline model to longitudinal PACC scores of predicted stables and progressors and estimated the model-adjusted mean PACC score at the 240-week follow-up. In all cases except for the one-year progressor model in the Solanezumab arm, predicted stables had a significantly higher mean estimate of the model-adjusted PACC score at 240 weeks than predicted progressors ( p < 0.01 ) ( Figure 5 , Supplementary Table 4). When using the five-year model, which roughly aligns with the duration of the placebo-controlled period of the A4 trial, predicted progressors of the Solanezumab arm had a mean adjusted PACC score of -3.92 ± 0.57, which was significantly worse ( p < 0.001 ) than -0.84 ± 0.26 for predicted stables (Supplementary Table 4). Similarly, in the placebo group, predicted progressors had a mean adjusted PACC score of -3.39 ± 0.43 compared to -0.96 ± 0.22 for predicted stables ( p < 0.001 ). Download figure Open in new tab Figure 5. Natural cubic spline models of longitudinal PACC scores of predicted stables and progressors from the A4 study cohort. The model-adjusted PACC trajectory and 95% confidence interval are shown for predicted stables (blue), predicted progressors (red), and the overall cohort (black). The vertical dotted line marks the 240-week follow-up point. The effect size of the contrast between stables and progressors and corresponding p-value are also displayed. Asterisks indicate the significance level (*: p < 0.05, **: p < 0.01, ***: p < 0.001). In all cases except for the 1-year progressors of the Solanezumab arm, significant differences were observed between stables and progressors in the model-adjusted PACC at 240-weeks. To assess whether cohort enrichment by the trained classifiers improves our ability to detect treatment effects, we tested for significant effects in the primary (PACC) and secondary (FBP cortical SUVR) endpoints after retroactive enrichment. For PACC, we observed no significant difference in the model-adjusted mean PACC score between placebo and Solanezumab arms when the A4 cohort remained unenriched ( Table 4 ), consistent with the conclusions of the original A4 study ( Sperling et al., 2023 ). The difference in model-adjusted mean PACC remained non-significant after enrichment by any model ( Table 4 ), indicating no clear benefit of retroactive enrichment for recovering an underlying treatment effect in the primary outcome. View this table: View inline View popup Download powerpoint Table 4. Comparisons of A4 trial outcomes between placebo and Solanezumab arms of the original, unenriched cohort and the ML-enriched cohorts. For FBP cortical SUVR, a significant difference between trial arms was observed in the mean change in SUVR of the unenriched cohort, with a mean effect size of -0.407 ± 0.08 ( p < 0.001 ) ( Table 4 ), suggesting that a reduction in the rate of amyloid accumulation was associated with the treatment. After enrichment, this significant difference was preserved in all but the one-year progressor model. Enrichment by the two, four and five-year models resulted in a modest increase in the mean effect size of the contrast, albeit with an increase in the standard error due to reduced sample sizes. Power analysis revealed that for sample sizes between 20 and 80, an increased power to detect this effect was observed after enrichment by the two, four and five-year models ( Figure 6 , Supplementary Fig. 5). However, enrichment by the one-year model and, paradoxically, the three-year model showed a decrease in power. This pattern aligned with the results of the ANCOVA in Table 4 , wherein mean effect size was increased after enrichment by the two, four and five-year models, but not the one or three-year models. Download figure Open in new tab Figure 6. Power to detect differences in change in FBP cortical SUVR between placebo and Solanezumab arms of the A4 study cohort, estimated by bootstrap analysis. Power before (black) and after (colored) retroactive cohort enrichment using SVM classifier predictions are shown. Cohort enrichment by the two-year, four-year and five-year models resulted in increased power at most sample sizes compared to the original, unenriched cohort. 4 Discussion We conducted a rigorous evaluation of machine learning classifiers to predict future cognitive impairment among individuals with preclinical Alzheimer’s disease using imaging features from amyloid PET and MRI. Through leave-one-site-out and leave-one-tracer-out cross-validation, we demonstrated that our models consistently achieved strong generalizability to unseen sites and amyloid PET radiotracers, supporting the viability of these models towards enhancing large, multi-consortia clinical trials for AD. Additionally, we demonstrated that these classifiers may be useful in improving the statistical power of detecting treatment effects using real clinical trial data from the A4 study. The present study represents an important and clinically relevant step towards developing and validating stratification models tailored to the asymptomatic, preclinical AD population. This is of particular importance for future investigations of disease-modifying therapies for AD, given that many are trending towards targeting the disease at an early stage. Furthermore, as amyloid PET is commonly utilized for screening participants into clinical trials ( Rafii et al., 2023 ; Sims et al., 2023 ; Sperling et al., 2023 ), our findings suggest that there is added value in quantifying the spatial distribution of amyloid accumulation, beyond a simple dichotomization of global amyloid burden, for stratifying and enriching trial cohorts. In terms of clinical applications, current use cases of amyloid PET include establishing the presence of abnormal pathology before administering anti-amyloid therapy ( Cummings et al., 2023 ), although the use of PET in asymptomatic individuals remains an area of active debate ( Leuzy et al., 2025 ; Rabinovici et al., 2025 ; Rafii and Aisen, 2023 ). However, we envision, on the premise that treatments intended for asymptomatic preclinical AD individuals are approved in the future, that amyloid PET coupled with predictive models such as ours would serve as valuable prognostic tools for guiding individualized treatment plans. Such applications are anticipated to expand as mechanisms of reimbursement for amyloid PET are relaxed ( “Beta Amyloid Positron Emission Tomography in Dementia and Neurodegenerative Disease,” 2023 ). Several prior studies have demonstrated the ability of ML and imaging features extracted from amyloid PET to predict progression to cognitive impairment in CU cohorts with high accuracy ( Choi et al., 2024 ; Dansson et al., 2021 ; Karaman et al., 2022 ). The model developed by Karaman et al . achieved an ROC-AUC of 0.82 or higher when predicting the future diagnosis of CU individuals from ADNI up to 5-years from baseline. Choi et al . reported a mean ROC-AUC of 0.87 when applying their DL-ADprob model to an external CU cohort from HABS to predict future decline at the 4-year follow-up point. In the current study, our classifiers achieved slightly lower performances at comparable follow-up windows. For most leave-out sites, SVM classifiers achieved an out-of-sample ROC-AUC of 0.66 or higher across all times to progression, including ROC-AUC of 0.74 or higher in identifying 4-year progressors or beyond. The notable exception to this was HABS, which scored an ROC-AUC below 0.5. This likely led to high sampling variability that potentially accentuated any existing site-specific biases which the model may not have been robust to. Despite lower comparative performance, we highlight an important distinction of our study compared to previous literature in that we restricted our cohort of interest to CU individuals who showed evidence of abnormal brain amyloidosis, which has been proposed as a core criterion for the biological definition of AD ( Jack Jr. et al., 2024 ). Discrepancies in performance may potentially be attributable to reduced amyloid signal available for differentiating stables from progressors. Additionally, unlike the previously reported classification performance on a HABS CU cohort by ( Choi et al., 2024 ), which was not restricted to be amyloid-positive, our amyloid-positive CU cohort suffered from low sample sizes and extreme imbalances in the stables-to-progressors ratio. Nonetheless, our findings still suggest considerable robustness of SVM classifiers to out-of-sample data for the task of interest, which is crucial for the viability of such models in clinical trial settings for preclinical AD. In addition to site generalizability, we also showed good generalizability to different amyloid PET radiotracers. Models trained on a single amyloid radiotracer achieved ROC-AUC of 0.72 or greater when applied to the other tracer, even when no explicit tracer harmonization was performed. This, along with previous studies which have shown ML models to accurately predict amyloid positivity ( Fan et al., 2024 ) or future cognitive decline ( Choi et al., 2024 ) without explicit harmonization, may suggest that ML models are capable of finding low-dimensional representations of high-dimensional PET data which are tracer-agnostic. However, we also observed that in the context of a binary classification task, the cutoff thresholds (i.e. the separating hyperplane of the linear SVM) used to determine a binary class decision may not generalize to out-of-sample tracers, as evidenced by high imbalances in the sensitivity and specificity. Converting regional amyloid SUVRs into Centiloids produced models that achieved a much better balance of these metrics, suggesting that explicit harmonization of amyloid PET measurements still holds value for ML models. While the global amyloid PET signal has been known to be associated with future cognitive decline ( Landau et al., 2018 ; Parent et al., 2023 ; Small et al., 2012 ), recent studies have suggested that regional patterns of amyloid accumulation may serve as a more sensitive marker for the risk of cognitive decline, particularly for preclinical AD ( Pascoal et al., 2020 ; Pfeil et al., 2021 ). By leveraging amyloid PET biomarkers at the regional level, our models were able to discern spatial patterns which discriminate stables from progressors in the preclinical stage. Among the most important amyloid SUVR features were the temporal, superior and middle frontal, and middle occipital cortices. Many of these regions were previously identified as important correlates to increased risk of cognitive decline ( Pascoal et al., 2020 ; Pfeil et al., 2021 ). Notably, these regions comprise the intermediate stage of amyloid accumulation according to PET staging models ( Mattsson et al., 2019 ). In contrast, our models assigned a lower average feature importance to regions comprising the early accumulation stage, such as the precuneus and orbitofrontal cortices, suggesting that past a global amyloid threshold, the intermediate stage regions become more important for discriminating future cognitive decline. Additionally, low importances were assigned to subcortical structures such as hippocampus and amygdala, which tend to accumulate amyloid at much later stages of the disease ( Hanseeuw et al., 2018 ; Thal et al., 2002 ). In terms of MRI features, lateral ventricular volume and the volumes of select subcortical regions such as the hippocampus and amygdala had the highest feature importance. Atrophy in these regions has consistently been identified as robust markers of AD disease progression ( Laakso et al., 1995 ; Mungas et al., 2002 ; Nestor et al., 2008 ). Additionally, we found that the importance of amyloid SUVR features increased at a higher rate than volumetric features as the time-to-progression was extended. Our nested model analysis was consistent with this pattern, wherein at higher times-to-progression, the omission of amyloid PET features led to greater decreases in model performance and generalizability compared to either MRI or non-imaging features. These findings may suggest that the influence of amyloid PET on model predictions becomes increasingly important as the cohort includes more early stage progressors. This aligns with current models of AD pathogenesis ( Jack Jr. et al., 2024 ) where amyloid is expected to rise to abnormality well before neurodegeneration occurs, and thus may serve as a better indicator of future cognitive decline in the earlier stages of the disease. Our study notably did not utilize tau PET, which has been shown to closely track longitudinal cognitive decline ( Bejanin et al., 2017 ; Johnson et al., 2016 ), and may serve as a better predictor of the rate of cognitive decline than either amyloid PET or MRI ( Ossenkoppele et al., 2021 ). Despite this, amyloid PET imaging alone has been shown to provide strong prognostic value for predicting cognitive decline even within amyloid-positive, cognitively normal cohorts ( Farrell et al., 2017 ; Pfeil et al., 2021 ; van der Kall et al., 2021 ), a notion which is further supported by our own findings. This is particularly of value for clinical trials for asymptomatic, preclinical AD, where amyloid PET is more often utilized as a screening criterion compared to tau PET. In the context of cohort recruitment for clinical trials, the clinical presentation of AD may remain highly heterogeneous even after stratification by single risk factors such as global amyloid PET signal or APOE4 genotype. Alternatively, ML stratification models trained on a combination of multimodal risk factors have been shown to produce more accurate forecasts of longitudinal cognitive decline, leading to greater enhancements in clinical trial operations ( Wang et al., 2024 ). We successfully identified two distinct subtypes within A4 trial participants that exhibited different rates of cognitive decline, where predicted progressors experienced a significantly faster rate of decline compared to stables. However, when applied to cohort enrichment, our models failed to demonstrate a measurable benefit for enhancing the treatment effect in the primary cognitive outcome, PACC. This could be attributed to a true lack of an underlying treatment effect of Solanezumab therapy. Nonetheless, assuming the presence of a ground truth drug effect, ML models may still provide a boost in treatment effect detection as evidenced by previous literature ( Birkenbihl et al., 2024 ; Nallapu et al., 2025 ; Tam et al., 2022 ). Interestingly, in terms of the secondary outcome, cortical amyloid deposition, the two, four and five-year classifiers identified enriched cohorts that resulted in an increased power for detecting differences in longitudinal amyloid accumulation. However, this was not the case for either the one-year model, likely due to insufficient sample size selected, or the three-year model, perhaps due to selection of a more heterogeneous cohort that consisted of slightly younger participants with slightly lower cortical SUVRs compared to other enriched cohorts. Given these contradictory findings and the fact that models were not directly trained to predict longitudinal amyloid accumulation, our results should be interpreted with caution. Nonetheless, these results suggest that ML stratification models hold potential to identify trial candidates who are more likely to respond to treatments, and as more clinical trial data become available, future investigations should continue to validate ML models for use within this context. We note several key limitations which represent areas of future improvement. Firstly, our study did not utilize tau PET, as previously mentioned, and it did not utilize metabolic PET, such as [ 18 F]-fluorodeoxyglucose PET, which has also been found to be predictive of cognitive decline in preclinical AD ( Mayblyum et al., 2021 ). For a more comprehensive assessment of AD biomarkers and their prognostic value, future predictive models should integrate these additional modalities. Secondly, due to the strict inclusion criteria employed for cohort selection, the sample sizes in the present study are relatively low compared to other studies employing ML techniques for AD risk prediction. We combatted this by obtaining data from seven independent sites and including PET imaging from two tracers. Additionally, our selected cohort suffered from a high amount of class imbalance, with stable participants heavily outnumbering progressors especially in low times-to-progression. In an effort to reduce the effect of class imbalance, SVM models were optimized with a balanced class weighting, and class-balance invariant metrics such as balanced accuracy and F1 score were reported. Nonetheless, a larger sample of preclinical AD individuals, particularly those who eventually progress to clinical symptoms, is desirable especially for developing more sophisticated ML models such as ones built upon deep learning. Thirdly, given issues of class imbalance, the stable cohort was limited to those who remain CN for at least five years from baseline, representative of a control group with presumably the least amount of pathology. However, a more clinically interpretable model would ideally match the time of stability to the time-to-progression (i.e. an individual predicted not to progress within three years would necessarily remain stable for three years). Lastly, each time-to-progression model was trained independently of the rest, ignoring the constraint that predicted classifications should be consistent across time windows. Future work will explore alternate models such as time-to-event models like the survival SVM or the Mirai model for breast cancer prediction ( Yala et al., 2021 ) which constrain predictions at multiple follow-up times to be temporally consistent. 5 Conclusion We performed an extensive validation of machine learning for predicting future cognitive impairment in cognitively unimpaired individuals at the preclinical stage of AD. Our classifiers maintained strong generalizability across most independent testing sites as well as on unseen amyloid PET radiotracers. We further evaluated our models on the A4 clinical trial cohort and observed potential increases in statistical power to detect a secondary treatment effect, indicating potential utility for cohort enrichment. As emerging investigations of new disease modifying therapies for AD increasingly focus on asymptomatic, preclinical populations, our findings underscore the potential applicability of ML-based patient stratification for recruiting more homogeneous cohorts and improving statistical power for detecting treatment effects for future clinical trials. 6 Data availability Data used in the preparation of this study are openly available and can be requested at https://www.a4studydata.org , https://adni.loni.usc.edu , https://www.mayo.edu/research/centers-programs/alzheimers-disease-research-center/research-activities/mayo-clinic-study-aging/overview , and https://sites.wustl.edu/oasisbrains . HABS data release 1.10, obtained September 2019, was used in the preparation of this article, and can be requested via https://habs.mgh.harvard.edu . A separate application process is involved for accessing PAC. Investigators interested in accessing the data should contact the PAC Coordinating Center at Johns Hopkins University for details. SVM was implemented in scikit-learn 1.6.0 using python v3.12.8. All statistical analyses were performed in R v4.4.0. Accompanying code will be made publicly available at https://github.com/sotiraslab . 8 CRediT authorship contribution statement Braden Yang : Conceptualization, Investigation, Formal analysis, Methodology, Software, Visualization, Writing - original draft. Tom Earnest : Methodology, Software, Data curation, Writing - review & editing. Murat Bilgel : Methodology, Software, Data curation, Writing - review & editing. Marilyn S. Albert : Data curation. Sterling C. Johnson : Data curation. Christos Davatzikos : Data curation. Guray Erus : Data curation. Colin L. Masters : Data curation. Susan M. Resnick : Data curation, Writing - review & editing. Michael I. Miller : Data curation. Arnold Bakker : Data curation. John C. Morris : Data curation, Writing - review & editing. Tammie L.S. Benzinger : Conceptualization, Supervision, Data curation, Writing - review & editing. Brian A. Gordon : Conceptualization, Supervision, Writing - review & editing. Aristeidis Sotiras : Conceptualization, Supervision, Project administration, Funding acquisition, Writing - review & editing. 9 Funding BY was supported by the Imaging Science Pathways NIH T32 EB014855 and BrightFocus Foundation grant ADR A2021042S. AS was supported by NIH award R01 AG067103 and BrightFocus Foundation grant ADR A2021042S. Computations were performed using the facilities of the Washington University Research Computing and Informatics Facility, which were partially funded by NIH grants S10OD025200, 1S10RR022984-01A1 and 1S10OD018091-01. Additional support is provided by The McDonnell Center for Systems Neuroscience. 10 Competing interests AS reported receiving personal fees from BrightFocus for serving as a grant reviewer and stock from TheraPanacea outside the submitted work. All remaining authors have no conflicting interests to report. 7 Acknowledgements This work was supported by the donors of the Alzheimer’s Disease Research (ADR) program A2021042S, a program of the BrightFocus Foundation. Research reported in this publication was supported by National Institute on Aging of the National Institutes of Health under award number R01AG067103. The content is solely the responsibility of the authors and does not necessarily represent the official views of the National Institutes of Health. The A4 Study was a secondary prevention trial in preclinical Alzheimer’s disease, aiming to slow cognitive decline associated with brain amyloid accumulation in clinically normal older individuals. The A4 Study was funded by a public-private-philanthropic partnership, including funding from the National Institutes of Health-National Institute on Aging, Eli Lilly and Company, Alzheimer’s Association, Accelerating Medicines Partnership, GHR Foundation, an anonymous foundation, and additional private donors, with in-kind support from Avid Radiopharmaceuticals, Cogstate, Albert Einstein College of Medicine and the Foundation for Neurologic Diseases. The companion observational Longitudinal Evaluation of Amyloid Risk and Neurodegeneration (LEARN) Study was funded by the Alzheimer’s Association and GHR Foundation. The A4 and LEARN Studies were led by Dr. Reisa Sperling at Brigham and Women’s Hospital, Harvard Medical School, and Dr. Paul Aisen at the Alzheimer’s Therapeutic Research Institute (ATRI) at the University of Southern California. The A4 and LEARN Studies were coordinated by ATRI at the University of Southern California, and the data are made available under the auspices of Alzheimer’s Clinical Trial Consortium through the Global Research & Imaging Platform (GRIP). The complete A4 Study Team list is available on: https://www.actcinfo.org/a4-study-team-lists/ . We would like to acknowledge the dedication of the study participants and their study partners who made the A4 and LEARN Studies possible. Data collection and sharing for this project was funded by the Alzheimer’s Disease Neuroimaging Initiative (ADNI) (National Institutes of Health Grant U01 AG024904) and DOD ADNI (Department of Defense award number W81XWH-12-2-0012). ADNI is funded by the National Institute on Aging, the National Institute of Biomedical Imaging and Bioengineering, and through generous contributions from the following: AbbVie, Alzheimer’s Association; Alzheimer’s Drug Discovery Foundation; Araclon Biotech; BioClinica, Inc.; Biogen; Bristol-Myers Squibb Company; CereSpir, Inc.; Cogstate; Eisai Inc.; Elan Pharmaceuticals, Inc.; Eli Lilly and Company; EuroImmun; F. Hoffmann-La Roche Ltd and its affiliated company Genentech, Inc.; Fujirebio; GE Healthcare; IXICO Ltd.; Janssen Alzheimer Immunotherapy Research & Development, LLC.; Johnson & Johnson Pharmaceutical Research & Development LLC.; Lumosity; Lundbeck; Merck & Co., Inc.; Meso Scale Diagnostics, LLC.; NeuroRx Research; Neurotrack Technologies; Novartis Pharmaceuticals Corporation; Pfizer Inc.; Piramal Imaging; Servier; Takeda Pharmaceutical Company; and Transition Therapeutics. The Canadian Institutes of Health Research is providing funds to support ADNI clinical sites in Canada. Private sector contributions are facilitated by the Foundation for the National Institutes of Health ( www.fnih.org ). The grantee organization is the Northern California Institute for Research and Education, and the study is coordinated by the Alzheimer’s Therapeutic Research Institute at the University of Southern California. ADNI data are disseminated by the Laboratory for Neuro Imaging at the University of Southern California. Part of the data used in the preparation of this article were obtained from the Harvard Aging Brain Study (HABS - P01AG036694; https://nam10.safelinks.protection.outlook.com/?url=https%3A%2F%2Fhabs.mgh.harvard.edu%2F&data=05%7C02%7Ctom.earnest%40wustl.edu%7C70bcf8c15ffb44a9848408dccc4c749f%7C4ccca3b571cd4e6d974b4d9beb96c6d6%7C0%7C0%7C638609875978514619%7CUnknown%7CTWFpbGZsb3d8eyJWIjoiMC4wLjAwMDAiLCJQIjoiV2luMzIiLCJBTiI6Ik1haWwiLCJXVCI6Mn0%3D%7C0%7C%7C%7C&sdata=uZIOX1693oz1jyd49mvRaqaaIHC%2BXKDKPHUdotwp%2B8I%3D&reserved=0). The HABS study was launched in 2010, funded by the National Institute on Aging. and is led by principal investigators Reisa A. Sperling MD and Keith A. Johnson MD at Massachusetts General Hospital/Harvard Medical School in Boston, MA. Part of the data contained in this analysis were obtained under one of the following research grants from the National Institutes of Health to the Mayo Clinic Study of Aging (U01 AG06786, Ronald Petersen, PI) or the Mayo Alzheimer’s Disease Research Center (P50 AG16574, Ronald Petersen, PI). Part of the data were provided by OASIS-3: Longitudinal Multimodal Neuroimaging (Principal Investigators: T. Benzinger, D. Marcus, J. Morris). OASIS-3 was supported by the following funding sources: NIH P30 AG066444, P30 NS09857781, P01 AG026276, P01 AG003991, R01 AG043434, UL1 TR000448, R01 EB009352. AV-45 doses were provided by Avid Radiopharmaceuticals, a wholly owned subsidiary of Eli Lilly. Avid Radiopharmaceuticals, Inc., a wholly owned subsidiary of Eli Lilly and company, enabled use of the 18F-florbetapir tracer, but did not provide direct funding and was not involved in data analysis or interpretation. The Preclinical AD Consortium is supported by the National Institutes of Health (NIH), USA [grant number RF1-AG059869]. The individual studies in the consortium are funded, in part, by the following grants: U19-AG033655, P01-AG026276, RF1-AG027161 and the Australian Commonwealth Scientific Industrial Research Organization (CSIRO); as well as the National Institute on Aging Intramural Research Program. Footnotes ↵ * This research was supported in part by the Intramural Research Program of the National Institutes of Health (NIH). The contributions of the NIH authors are considered Works of the United States Government. The findings and conclusions presented in this paper are those of the authors and do not necessarily reflect the views of the NIH or the U.S. Department of Health and Human Services. ↵ † Data used in preparation of this article were obtained from the Alzheimer’s Disease Neuroimaging Initiative (ADNI) database (adni.loni.usc.edu). As such, the investigators within the ADNI contributed to the design and implementation of ADNI and/or provided data but did not participate in the analysis or writing of this report. A complete listing of ADNI investigators can be found at: http://adni.loni.usc.edu/wp-content/uploads/how_to_apply/ADNI_Acknowledgement_List.pdf - addition of nested model analysis - addition of study overview figure (Figure 1) - significant changes to Discussion section 11 References ↵ Abdelnour , C. , Agosta , F. , Bozzali , M. , Fougère , B. , Iwata , A. , Nilforooshan , R. , Takada , L.T. , Viñuela , F. , Traber , M. , 2022 . Perspectives and challenges in patient stratification in Alzheimer’s disease . Alzheimers Res. Ther . 14 , 112 . doi: 10.1186/s13195-022-01055-y OpenUrl CrossRef ↵ Albert , M. , Soldan , A. , Gottesman , R. , McKhann , G. , Sacktor , N. , Farrington , L. , Grega , M. , Turner , R. , Lu , Y. , Li , S. , Wang , M.-C. , Selnes , O. , 2014 . Cognitive changes preceding clinical symptom onset of mild cognitive impairment and relationship to ApoE genotype . Curr. Alzheimer Res . 11 , 773 – 784 . OpenUrl PubMed ↵ Ballard , C. , Atri , A. , Boneva , N. , Cummings , J.L. , Frölich , L. , Molinuevo , J.L. , Tariot , P.N. , Raket , L.L. , 2019 . Enrichment factors for clinical trials in mild-to-moderate Alzheimer’s disease . Alzheimers Dement. Transl. Res. Clin. Interv . 5 , 164 – 174 . doi: 10.1016/j.trci.2019.04.001 OpenUrl CrossRef PubMed ↵ Basaia , S. , Agosta , F. , Wagner , L. , Canu , E. , Magnani , G. , Santangelo , R. , Filippi , M. , 2019 . Automated classification of Alzheimer’s disease and mild cognitive impairment using a single MRI and deep neural networks . NeuroImage Clin . 21 , 101645 . doi: 10.1016/J.NICL.2018.101645 OpenUrl CrossRef PubMed ↵ Bejanin , A. , Schonhaut , D.R. , La Joie , R. , Kramer , J.H. , Baker , S.L. , Sosa , N. , Ayakta , N. , Cantwell , A. , Janabi , M. , Lauriola , M. , O’Neil , J.P. , Gorno-Tempini , M.L. , Miller , Z.A. , Rosen , H.J. , Miller , B.L. , Jagust , W.J. , Rabinovici , G.D. , 2017 . Tau pathology and neurodegeneration contribute to cognitive impairment in Alzheimer’s disease . Brain 140 , 3286 – 3300 . doi: 10.1093/brain/awx243 OpenUrl CrossRef PubMed ↵ Beta Amyloid Positron Emission Tomography in Dementia and Neurodegenerative Disease , 2023 . ↵ Birkenbihl , C. , de Jong , J. , Yalchyk , I. , Fröhlich , H. , for the Alzheimer’s Disease Neuroimaging Initiative , 2024 . Deep learning-based patient stratification for prognostic enrichment of clinical dementia trials . Brain Commun . 6 , fcae445. doi: 10.1093/braincomms/fcae445 OpenUrl CrossRef ↵ Choi , Y.S. , Ngam , P.I. , Lee , J.R. , Hwang , D. , Tan , E.-K. , for the Harvard Aging Brain Study , for the Australian Imaging Biomarkers and Lifestyle Study of Aging , for the Japanese Alzheimer’s Disease Neuroimaging Initiative , for the Alzheimer’s Disease Neuroimaging Initiative , 2024 . Deep learning-based amyloid PET harmonization to predict cognitive decline in non-demented elderly . Radiol. Adv . 1 , umae019. doi: 10.1093/radadv/umae019 OpenUrl CrossRef ↵ Coats , M. , Morris , J.C. , 2005 . Antecedent biomarkers of Alzheimer’s disease: The Adult Children Study . J. Geriatr. Psychiatry Neurol . 18 , 242 – 244 . doi: 10.1177/0891988705281881 OpenUrl CrossRef PubMed Web of Science ↵ Cummings , J. , Apostolova , L. , Rabinovici , G.D. , Atri , A. , Aisen , P. , Greenberg , S. , Hendrix , S. , Selkoe , D. , Weiner , M. , Petersen , R.C. , Salloway , S. , 2023 . Lecanemab: appropriate use recommendations . J. Prev. Alzheimers Dis . 10 , 362 – 377 . doi: 10.14283/jpad.2023.30 OpenUrl CrossRef PubMed ↵ Dagley , A. , LaPoint , M. , Huijbers , W. , Hedden , T. , McLaren , D.G. , Chatwal , J.P. , Papp , K.V. , Amariglio , R.E. , Blacker , D. , Rentz , D.M. , Johnson , K.A. , Sperling , R.A. , Schultz , A.P. , 2017 . Harvard Aging Brain Study: Dataset and accessibility. NeuroImage , Data Sharing Part II 144 , 255 – 258 . doi: 10.1016/j.neuroimage.2015.03.069 OpenUrl CrossRef ↵ Dansson , H.V. , Stempfle , L. , Egilsdóttir , H. , Schliep , A. , Portelius , E. , Blennow , K. , Zetterberg , H. , Johansson , F.D. , for the Alzheimer’s Disease Neuroimaging Initiative (ADNI) , 2021 . Predicting progression and cognitive decline in amyloid-positive patients with Alzheimer’s disease . Alzheimers Res. Ther . 13 , 151 . doi: 10.1186/s13195-021-00886-5 OpenUrl CrossRef ↵ Donohue , M.C. , Langford , O. , Insel , P.S. , van Dyck , C.H. , Petersen , R.C. , Craft , S. , Sethuraman , G. , Raman , R. , Aisen , P.S. , Initiative, F. the A.D.N. , 2023 . Natural cubic splines for the analysis of Alzheimer’s clinical trials . Pharm. Stat . 22 , 508 – 519 . doi: 10.1002/pst.2285 OpenUrl CrossRef PubMed ↵ Donohue , M.C. , Sperling , R.A. , Salmon , D.P. , Rentz , D.M. , Raman , R. , Thomas , R.G. , Weiner , M. , Aisen , P.S. , 2014 . The Preclinical Alzheimer Cognitive Composite: measuring amyloid-related decline . JAMA Neurol . 71 , 961 – 970 . doi: 10.1001/JAMANEUROL.2014.803 OpenUrl CrossRef PubMed ↵ Doshi , J. , Erus , G. , Ou , Y. , Resnick , S.M. , Gur , R.C. , Gur , R.E. , Satterthwaite , T.D. , Furth , S. , Davatzikos , C. , 2016 . MUSE: MUlti-atlas region Segmentation utilizing Ensembles of registration algorithms and parameters, and locally optimal atlas selection . NeuroImage 127 , 186 – 195 . doi: 10.1016/j.neuroimage.2015.11.073 OpenUrl CrossRef PubMed ↵ Dyck , C.H. van , Swanson , C.J. , Aisen , P. , Bateman , R.J. , Chen , C. , Gee , M. , Kanekiyo , M. , Li , D. , Reyderman , L. , Cohen , S. , Froelich , L. , Katayama , S. , Sabbagh , M. , Vellas , B. , Watson , D. , Dhadda , S. , Irizarry , M. , Kramer , L.D. , Iwatsubo , T. , 2023 . Lecanemab in early Alzheimer’s disease . N. Engl. J. Med . 388 , 9 – 21 . doi: 10.1056/NEJMoa2212948 OpenUrl CrossRef PubMed ↵ Ezzati , A. , Abdulkadir , A. , Jack , C.R. , Thompson , P.M. , Harvey , D.J. , Truelove-Hill , M. , Sreepada , L.P. , Davatzikos , C. , Lipton , R.B. , 2021 . Predictive value of ATN biomarker profiles in estimating disease progression in Alzheimer’s disease dementia . Alzheimers Dement . 17 , 1855 – 1867 . doi: 10.1002/ALZ.12491 OpenUrl CrossRef ↵ Fan , S. , Ponisio , M.R. , Xiao , P. , Ha , S.M. , Chakrabarty , S. , Lee , J.J. , Flores , S. , LaMontagne , P. , Gordon , B. , Raji , C.A. , Marcus , D.S. , Nazeri , A. , Ances , B.M. , Bateman , R.J. , Morris , J.C. , Benzinger , T.L.S. , Sotiras , A. , Haller , S. , Atzen , S. , 2024 . AmyloidPETNet: Classification of amyloid positivity in brain PET imaging using end-to-end deep learning . Radiology 311 , e231442 . doi: 10.1148/radiol.231442 OpenUrl CrossRef PubMed ↵ Farrell , M.E. , Kennedy , K.M. , Rodrigue , K.M. , Wig , G. , Bischof , G.N. , Rieck , J.R. , Chen , X. , Festini , S.B. , Devous , M.D. , Sr . , Park , D.C. , 2017 . Association of longitudinal cognitive decline with amyloid burden in middle-aged and older adults: evidence for a dose response relationship . JAMA Neurol . 74 , 830 – 838 . doi: 10.1001/jamaneurol.2017.0892 OpenUrl CrossRef PubMed ↵ Fowler , C. , Rainey-Smith , S.R. , Bird , S. , Bomke , J. , Bourgeat , P. , Brown , B.M. , Burnham , S.C. , Bush , A.I. , Chadunow , C. , Collins , S. , Doecke , J. , Doré , V. , Ellis , K.A. , Evered , L. , Fazlollahi , A. , Fripp , J. , Gardener , S.L. , Gibson , S. , Grenfell , R. , Harrison , E. , Head , R. , Jin , L. , Kamer , A. , Lamb , F. , Lautenschlager , N.T. , Laws , S.M. , Li , Q.-X. , Lim , L. , Lim , Y.Y. , Louey , A. , Macaulay , S.L. , Mackintosh , L. , Martins , R.N. , Maruff , P. , Masters , C.L. , McBride , S. , Milicic , L. , Peretti , M. , Pertile , K. , Porter , T. , Radler , M. , Rembach , A. , Robertson , J. , Rodrigues , M. , Rowe , C.C. , Rumble , R. , Salvado , O. , Savage , G. , Silbert , B. , Soh , M. , Sohrabi , H.R. , Taddei , K. , Taddei , T. , Thai , C. , Trounson , B. , Tyrrell , R. , Vacher , M. , Varghese , S. , Villemagne , V.L. , Weinborn , M. , Woodward , M. , Xia , Y. , Ames , D. , 2021 . Fifteen years of the Australian Imaging, Biomarkers and Lifestyle (AIBL) Study: progress and pbservations from 2,359 older adults spanning the spectrum from cognitive normality to Alzheimer’s disease . J. Alzheimers Dis. Rep . 5 , 443 – 468 . doi: 10.3233/ADR-210005 OpenUrl CrossRef ↵ Gladstein , S. , Yang , L. , Wooten , D. , Huang , X. , Comley , R. , Guo , Q. , Initiative, the A.D.N. , 2025 . Machine learning–enhanced screening funnel for clinical trials in Alzheimer’s disease . Alzheimers Dement. Transl. Res. Clin. Interv . 11 , e70084 . doi: 10.1002/trc2.70084 OpenUrl CrossRef ↵ Hanseeuw , B.J. , Betensky , R.A. , Mormino , E.C. , Schultz , A.P. , Sepulcre , J. , Becker , J.A. , Jacobs , H.I.L. , Buckley , R.F. , LaPoint , M.R. , Vannini , P. , Donovan , N.J. , Chhatwal , J.P. , Marshall , G.A. , Papp , K.V. , Amariglio , R.E. , Rentz , D.M. , Sperling , R.A. , Johnson , K.A. , Initiative, for the A.D.N. , Study , and the H.A.B. , 2018 . PET staging of amyloidosis using striatum . Alzheimers Dement . 14 , 1281 – 1292 . doi: 10.1016/j.jalz.2018.04.011 OpenUrl CrossRef ↵ Haufe , S. , Meinecke , F. , Görgen , K. , Dähne , S. , Haynes , J.-D. , Blankertz , B. , Bießmann , F. , 2014 . On the interpretation of weight vectors of linear models in multivariate neuroimaging . NeuroImage 87 , 96 – 110 . doi: 10.1016/j.neuroimage.2013.10.067 OpenUrl CrossRef PubMed Web of Science ↵ Huang , L.-K. , Chao , S.-P. , Hu , C.-J. , 2020 . Clinical trials of new drugs for Alzheimer disease . J. Biomed. Sci . 27 , 18 . doi: 10.1186/s12929-019-0609-7 OpenUrl CrossRef PubMed ↵ Jack , C.R. , Holtzman , D.M. , 2013 . Biomarker modeling of Alzheimer’s disease . Neuron 80 , 1347 – 1358 . doi: 10.1016/j.neuron.2013.12.003 OpenUrl CrossRef PubMed Web of Science ↵ Jack Jr. , C.R. , Andrews , J.S. , Beach , T.G. , Buracchio , T. , Dunn , B. , Graf , A. , Hansson , O. , Ho , C. , Jagust , W. , McDade , E. , Molinuevo , J.L. , Okonkwo , O.C. , Pani , L. , Rafii , M.S. , Scheltens , P. , Siemers , E. , Snyder , H.M. , Sperling , R. , Teunissen , C.E. , Carrillo , M.C. , 2024 . Revised criteria for diagnosis and staging of Alzheimer’s disease: Alzheimer’s Association Workgroup . Alzheimers Dement . 20 , 5143 – 5169 . doi: 10.1002/alz.13859 OpenUrl CrossRef PubMed ↵ Johnson , K.A. , Schultz , A. , Betensky , R.A. , Becker , J.A. , Sepulcre , J. , Rentz , D. , Mormino , E. , Chhatwal , J. , Amariglio , R. , Papp , K. , Marshall , G. , Albers , M. , Mauro , S. , Pepin , L. , Alverio , J. , Judge , K. , Philiossaint , M. , Shoup , T. , Yokell , D. , Dickerson , B. , Gomez-Isla , T. , Hyman , B. , Vasdev , N. , Sperling , R. , 2016 . Tau positron emission tomographic imaging in aging and early Alzheimer disease . Ann. Neurol . 79 , 110 – 119 . doi: 10.1002/ana.24546 OpenUrl CrossRef PubMed ↵ Johnson , S.C. , Koscik , R.L. , Jonaitis , E.M. , Clark , L.R. , Mueller , K.D. , Berman , S.E. , Bendlin , B.B. , Engelman , C.D. , Okonkwo , O.C. , Hogan , K.J. , Asthana , S. , Carlsson , C.M. , Hermann , B.P. , Sager , M.A. , 2018 . The Wisconsin Registry for Alzheimer’s Prevention: A review of findings and current directions . Alzheimers Dement. Diagn. Assess. Dis. Monit . 10 , 130 – 142 . doi: 10.1016/j.dadm.2017.11.007 OpenUrl CrossRef PubMed ↵ Jutten , R.J. , Sikkes , S.A.M. , Flier , W.M.V. der , Scheltens , P. , Visser , P.J. , Tijms , B.M. , Initiative, for the A.D.N. , 2021 . Finding treatment effects in Alzheimer trials in the face of disease progression heterogeneity . Neurology 96 , e2673 – e2684 . doi: 10.1212/WNL.0000000000012022 OpenUrl CrossRef PubMed ↵ Karaman , B.K. , Mormino , E.C. , Sabuncu , M.R. , Initiative, for the A.D.N. , 2022 . Machine learning based multi-modal prediction of future decline toward Alzheimer’s disease: An empirical study . PLOS ONE 17 , e0277322 . doi: 10.1371/journal.pone.0277322 OpenUrl CrossRef PubMed ↵ Kim , C.K. , Lee , Y.R. , Ong , L. , Gold , M. , Kalali , A. , Sarkar , J. , 2022 . Alzheimer’s disease: key insights from two decades of clinical trial failures . J. Alzheimer’s Dis . 87 , 83 – 100 . doi: 10.3233/JAD-215699 OpenUrl CrossRef ↵ Klunk , W.E. , Koeppe , R.A. , Price , J.C. , Benzinger , T.L. , Devous Sr. , M.D. , Jagust , W.J. , Johnson , K.A. , Mathis , C.A. , Minhas , D. , Pontecorvo , M.J. , Rowe , C.C. , Skovronsky , D.M. , Mintun , M.A. , 2015 . The Centiloid Project: Standardizing quantitative amyloid plaque estimation by PET . Alzheimers Dement . 11 , 1 – 15 .e4. doi: 10.1016/j.jalz.2014.07.003 OpenUrl CrossRef PubMed ↵ Laakso , M.P. , Soininen , H. , Partanen , K. , Helkala , E.-L. , Hartikainen , P. , Vainio , P. , Hallikainen , M. , Hänninen , T. , Riekkinen Sr , P.J. , 1995 . Volumes of hippocampus, amygdala and frontal lobes in the MRI-based diagnosis of early Alzheimer’s disease: Correlation with memory functions . J. Neural Transm. - Park. Dis. Dement. Sect . 9 , 73 – 86 . doi: 10.1007/BF02252964 OpenUrl CrossRef PubMed Web of Science ↵ LaMontagne , P.J. , Benzinger , T.LS. , Morris , J.C. , Keefe , S. , Hornbeck , R. , Xiong , C. , Grant , E. , Hassenstab , J. , Moulder , K. , Vlassenko , A.G. , Raichle , M.E. , Cruchaga , C. , Marcus , D. , 2019 . OASIS-3: longitudinal neuroimaging, clinical, and cognitive dataset for normal aging and Alzheimer disease . medRxiv 2019.12.13.19014902. doi: 10.1101/2019.12.13.19014902 OpenUrl Abstract / FREE Full Text ↵ Landau , S.M. , Horng , A. , Jagust , W.J. , For the Alzheimer’s Disease Neuroimaging Initiative , 2018 . Memory decline accompanies subthreshold amyloid accumulation . Neurology 90 , e1452 – e1460 . doi: 10.1212/WNL.0000000000005354 OpenUrl Abstract / FREE Full Text ↵ Landau , S.M. , Thomas , B.A. , Thurfjell , L. , Schmidt , M. , Margolin , R. , Mintun , M. , Pontecorvo , M. , Baker , S.L. , Jagust , W.J. , the Alzheimer’s Disease Neuroimaging Initiative , 2014 . Amyloid PET imaging in Alzheimer’s disease: a comparison of three radiotracers . Eur. J. Nucl. Med. Mol. Imaging 41 , 1398 – 1407 . doi: 10.1007/s00259-014-2753-3 OpenUrl CrossRef PubMed ↵ Leuzy , A. , Bollack , A. , Pellegrino , D. , Teunissen , C.E. , La Joie , R. , Rabinovici , G.D. , Franzmeier , N. , Johnson , K. , Barkhof , F. , Shaw , L.M. , Arkhipenko , A. , Schindler , S.E. , Honig , L.S. , Moscoso Rial , A. , Schöll , M. , Zetterberg , H. , Blennow , K. , Hansson , O. , Farrar , G. , 2025 . Considerations in the clinical use of amyloid PET and CSF biomarkers for Alzheimer’s disease . Alzheimers Dement . 21 , e14528 . doi: 10.1002/alz.14528 OpenUrl CrossRef PubMed ↵ Linn , K.A. , Gaonkar , B. , Satterthwaite , T.D. , Doshi , J. , Davatzikos , C. , Shinohara , R.T. , 2016 . Control-group feature normalization for multivariate pattern analysis of structural MRI data using the support vector machine . NeuroImage 132 , 157 – 166 . doi: 10.1016/J.NEUROIMAGE.2016.02.044 OpenUrl CrossRef PubMed ↵ Mathotaarachchi , S. , Pascoal , T.A. , Shin , M. , Benedet , A.L. , Kang , M.S. , Beaudry , T. , Fonov , V.S. , Gauthier , S. , Rosa-Neto , P. , 2017 . Identifying incipient dementia individuals using machine learning and amyloid imaging . Neurobiol. Aging 59 , 80 – 90 . doi: 10.1016/J.NEUROBIOLAGING.2017.06.027 OpenUrl CrossRef PubMed ↵ Mattsson , N. , Palmqvist , S. , Stomrud , E. , Vogel , J. , Hansson , O. , 2019 . Staging β-amyloid pathology with amyloid positron emission tomography . JAMA Neurol . 76 , 1319 – 1329 . doi: 10.1001/jamaneurol.2019.2214 OpenUrl CrossRef ↵ Mayblyum , D.V. , Becker , J.A. , Jacobs , H.I.L. , Buckley , R.F. , Schultz , A.P. , Sepulcre , J. , Sanchez , J.S. , Rubinstein , Z.B. , Katz , S.R. , Moody , K.A. , Vannini , P. , Papp , K.V. , Rentz , D.M. , Price , J.C. , Sperling , R.A. , Johnson , K.A. , Hanseeuw , B.J. , 2021 . Comparing PET and MRI biomarkers predicting cognitive decline in preclinical Alzheimer disease . Neurology 96 , e2933 – e2943 . doi: 10.1212/WNL.0000000000012108 OpenUrl Abstract / FREE Full Text ↵ Misra , C. , Fan , Y. , Davatzikos , C. , 2009 . Baseline and longitudinal patterns of brain atrophy in MCI patients, and their use in prediction of short-term conversion to AD: Results from ADNI . NeuroImage 44 , 1415 – 1422 . doi: 10.1016/j.neuroimage.2008.10.031 OpenUrl CrossRef PubMed Web of Science ↵ Morris , J.C. , 1997 . Clinical Dementia Rating: a reliable and valid diagnostic and staging measure for dementia of the Alzheimer type . Int. Psychogeriatr . 9 , 173 – 176 . doi: 10.1017/S1041610297004870 OpenUrl CrossRef PubMed ↵ Mungas , D. , Reed , B.R. , Jagust , W.J. , DeCarli , C. , Mack , W.J. , Kramer , J.H. , Weiner , M.W. , Schuff , N. , Chui , H.C. , 2002 . Volumetric MRI predicts rate of cognitive decline related to AD and cerebrovascular disease . Neurology 59 , 867 – 873 . doi: 10.1212/WNL.59.6.867 OpenUrl Abstract / FREE Full Text ↵ Nallapu , B.T. , Petersen , K.K. , Qian , T. , Demirsoy , I. , Ghanbarian , E. , Davatzikos , C. , Lipton , R.B. , Ezzati , A. , for the Alzheimer’s Disease Neuroimaging Initiative , 2025 . A machine learning approach to predict cognitive decline in Alzheimer disease clinical trials . Neurology 104 , e213490 . doi: 10.1212/WNL.0000000000213490 OpenUrl CrossRef PubMed ↵ Nestor , S.M. , Rupsingh , R. , Borrie , M. , Smith , M. , Accomazzi , V. , Wells , J.L. , Fogarty , J. , Bartha , R. , 2008 . Ventricular enlargement as a possible measure of Alzheimer’s disease progression validated using the Alzheimer’s disease neuroimaging initiative database . Brain 131 , 2443 – 2454 . doi: 10.1093/brain/awn146 OpenUrl CrossRef PubMed Web of Science ↵ Ossenkoppele , R. , Smith , R. , Mattsson-Carlgren , N. , Groot , C. , Leuzy , A. , Strandberg , O. , Palmqvist , S. , Olsson , T. , Jögi , J. , Stormrud , E. , Cho , H. , Ryu , Y.H. , Choi , J.Y. , Boxer , A.L. , Gorno-Tempini , M.L. , Miller , B.L. , Soleimani-Meigooni , D. , Iaccarino , L. , La Joie , R. , Baker , S. , Borroni , E. , Klein , G. , Pontecorvo , M.J. , Devous , M.D. , Sr . , Jagust , W.J. , Lyoo , C.H. , Rabinovici , G.D. , Hansson , O. , 2021 . Accuracy of tau positron emission tomography as a prognostic marker in preclinical and prodromal Alzheimer disease: a head-to-head comparison against amyloid positron emission tomography and magnetic resonance imaging . JAMA Neurol . 78 , 961 – 971 . doi: 10.1001/jamaneurol.2021.1858 OpenUrl CrossRef PubMed ↵ Parent , C. , Rousseau , L.-S. , Predovan , D. , Duchesne , S. , Hudon , C. , 2023 . Longitudinal association between ß-amyloid accumulation and cognitive decline in cognitively healthy older adults: A systematic review . Aging Brain 3 , 100074 . doi: 10.1016/j.nbas.2023.100074 OpenUrl CrossRef PubMed ↵ Pascoal , T.A. , Therriault , J. , Mathotaarachchi , S. , Kang , M.S. , Shin , M. , Benedet , A.L. , Chamoun , M. , Tissot , C. , Lussier , F. , Mohaddes , S. , Soucy , J.P. , Massarweh , G. , Gauthier , S. , Rosa-Neto , P. , 2020 . Topographical distribution of Aβ predicts progression to dementia in Aβ positive mild cognitive impairment . Alzheimers Dement. Diagn. Assess. Dis. Monit . 12 , e12037 . doi: 10.1002/DAD2.12037 OpenUrl CrossRef ↵ Pfeil , J. , Hoenig , M.C. , Doering , E. , van Eimeren , T. , Drzezga , A. , Bischof , G.N. , 2021 . Unique regional patterns of amyloid burden predict progression to prodromal and clinical stages of Alzheimer’s disease . Neurobiol. Aging 106 , 119 – 129 . doi: 10.1016/J.NEUROBIOLAGING.2021.06.014 OpenUrl CrossRef PubMed ↵ Price , J.L. , Morris , J.C. , 1999 . Tangles and plaques in nondemented aging and “preclinical” Alzheimer’s disease . Ann. Neurol . 45 , 358 – 368 . doi: 10.1002/1531-8249(199903)45:3%253C358::AID-ANA12%253E3.0.CO;2-X OpenUrl CrossRef PubMed Web of Science ↵ Rabinovici , G.D. , Knopman , D.S. , Arbizu , J. , Benzinger , T.L.S. , Donohoe , K.J. , Hansson , O. , Herscovitch , P. , Kuo , P.H. , Lingler , J.H. , Minoshima , S. , Murray , M.E. , Price , J.C. , Salloway , S.P. , Weber , C.J. , Carrillo , M.C. , Johnson , K.A. , 2025 . Updated appropriate use criteria for amyloid and tau PET: A report from the Alzheimer’s Association and Society for Nuclear Medicine and Molecular Imaging Workgroup . Alzheimers Dement . 21 , e14338 . doi: 10.1002/alz.14338 OpenUrl CrossRef PubMed ↵ Rafii , M.S. , Aisen , P.S. , 2023 . Detection and treatment of Alzheimer’s disease in its preclinical stage. Nat . Aging 3 , 520 – 531 . doi: 10.1038/s43587-023-00410-4 OpenUrl CrossRef PubMed ↵ Rafii , M.S. , Sperling , R.A. , Donohue , M.C. , Zhou , J. , Roberts , C. , Irizarry , M.C. , Dhadda , S. , Sethuraman , G. , Kramer , L.D. , Swanson , C.J. , Li , D. , Krause , S. , Rissman , R.A. , Walter , S. , Raman , R. , Johnson , K.A. , Aisen , P.S. , 2023 . The AHEAD 3–45 Study: Design of a prevention trial for Alzheimer’s disease . Alzheimers Dement. J. Alzheimers Assoc . 19 , 1227 – 1233 . doi: 10.1002/alz.12748 OpenUrl CrossRef PubMed ↵ Rathore , S. , Habes , M. , Iftikhar , M.A. , Shacklett , A. , Davatzikos , C. , 2017 . A review on neuroimaging-based classification studies and associated feature extraction methods for Alzheimer’s disease and its prodromal stages . NeuroImage 155 , 530 – 548 . doi: 10.1016/J.NEUROIMAGE.2017.03.057 OpenUrl CrossRef PubMed ↵ Resnick , S.M. , Goldszal , A.F. , Davatzikos , C. , Golski , S. , Kraut , M.A. , Metter , E.J. , Bryan , R.N. , Zonderman , A.B. , 2000 . One-year Age Changes in MRI Brain Volumes in Older Adults . Cereb. Cortex 10 , 464 – 472 . doi: 10.1093/cercor/10.5.464 OpenUrl CrossRef PubMed Web of Science ↵ Roberts , R.O. , Geda , Y.E. , Knopman , D.S. , Cha , R.H. , Pankratz , V.S. , Boeve , B.F. , Ivnik , R.J. , Tangalos , E.G. , Petersen , R.C. , Rocca , W.A. , 2008 . The Mayo Clinic Study of Aging: design and sampling, participation, baseline measures and sample characteristics . Neuroepidemiology 30 , 58 – 69 . doi: 10.1159/000115751 OpenUrl CrossRef PubMed Web of Science ↵ Samper-González , J. , Burgos , N. , Bottani , S. , Fontanella , S. , Lu , P. , Marcoux , A. , Routier , A. , Guillon , J. , Bacci , M. , Wen , J. , Bertrand , A. , Bertin , H. , Habert , M.O. , Durrleman , S. , Evgeniou , T. , Colliot , O. , 2018 . Reproducible evaluation of classification methods in Alzheimer’s disease: Framework and application to MRI and PET data . NeuroImage 183 , 504 – 521 . doi: 10.1016/J.NEUROIMAGE.2018.08.042 OpenUrl CrossRef PubMed ↵ Sims , J.R. , Zimmer , J.A. , Evans , C.D. , Lu , M. , Ardayfio , P. , Sparks , J. , Wessels , A.M. , Shcherbinin , S. , Wang , H. , Monkul Nery , E.S. , Collins , E.C. , Solomon , P. , Salloway , S. , Apostolova , L.G. , Hansson , O. , Ritchie , C. , Brooks , D.A. , Mintun , M. , Skovronsky , D.M. , TRAILBLAZER-ALZ 2 Investigators , 2023 . Donanemab in early symptomatic Alzheimer disease: the TRAILBLAZER-ALZ 2 randomized clinical trial . JAMA 330 , 512 – 527 . doi: 10.1001/jama.2023.13239 OpenUrl CrossRef PubMed ↵ Small , G.W. , Siddarth , P. , Kepe , V. , Ercoli , L.M. , Burggren , A.C. , Bookheimer , S.Y. , Miller , K.J. , Kim , J. , Lavretsky , H. , Huang , S.-C. , Barrio , J.R. , 2012 . Prediction of cognitive decline by positron emission tomography of brain amyloid and tau . Arch. Neurol . 69 , 215 – 222 . doi: 10.1001/archneurol.2011.559 OpenUrl CrossRef PubMed Web of Science ↵ Smith , S.M. , Jenkinson , M. , Woolrich , M.W. , Beckmann , C.F. , Behrens , T.E.J. , Johansen-Berg , H. , Bannister , P.R. , De Luca , M. , Drobnjak , I. , Flitney , D.E. , Niazy , R.K. , Saunders , J. , Vickers , J. , Zhang , Y. , De Stefano , N. , Brady , J.M. , Matthews , P.M. , 2004 . Advances in functional and structural MR image analysis and implementation as FSL. NeuroImage , Mathematics in Brain Imaging 23 , S208 – S219 . doi: 10.1016/j.neuroimage.2004.07.051 OpenUrl CrossRef ↵ Sperling , R.A. , Donohue , M.C. , Raman , R. , Rafii , M.S. , Johnson , K. , Masters , C.L. , Dyck , C.H. van , Iwatsubo , T. , Marshall , G.A. , Yaari , R. , Mancini , M. , Holdridge , K.C. , Case , M. , Sims , J.R. , Aisen , P.S. , 2023 . Trial of Solanezumab in preclinical Alzheimer’s disease . N. Engl. J. Med . 389 , 1096 – 1107 . doi: 10.1056/NEJMoa2305032 OpenUrl CrossRef PubMed ↵ Sperling , R.A. , Rentz , D.M. , Johnson , K.A. , Karlawish , J. , Donohue , M. , Salmon , D.P. , Aisen , P. , 2014 . The A4 study: Stopping AD before symptoms begin? Sci. Transl. Med . 6 . doi: 10.1126/SCITRANSLMED.3007941/ASSET/1A7D4501-F70E-47E3-B98C-C19B558DDE40/ASSETS/GRAPHIC/6228FS13-F1.JPEG OpenUrl CrossRef ↵ Strobl , C. , Boulesteix , A.-L. , Kneib , T. , Augustin , T. , Zeileis , A. , 2008 . Conditional variable importance for random forests . BMC Bioinformatics 9 , 307 . doi: 10.1186/1471-2105-9-307 OpenUrl CrossRef PubMed ↵ Su , Y. , Flores , S. , Wang , G. , Hornbeck , R.C. , Speidel , B. , Joseph-Mathurin , N. , Vlassenko , A.G. , Gordon , B.A. , Koeppe , R.A. , Klunk , W.E. , Jack Jr. , C.R. , Farlow , M.R. , Salloway , S. , Snider , B.J. , Berman , S.B. , Roberson , E.D. , Brosch , J. , Jimenez-Velazques , I. , van Dyck , C.H. , Galasko , D. , Yuan , S.H. , Jayadev , S. , Honig , L.S. , Gauthier , S. , Hsiung , G.-Y.R. , Masellis , M. , Brooks , W.S. , Fulham , M. , Clarnette , R. , Masters , C.L. , Wallon , D. , Hannequin , D. , Dubois , B. , Pariente , J. , Sanchez-Valle , R. , Mummery , C. , Ringman , J.M. , Bottlaender , M. , Klein , G. , Milosavljevic-Ristic , S. , McDade , E. , Xiong , C. , Morris , J.C. , Bateman , R.J. , Benzinger , T.L.S. , 2019 . Comparison of Pittsburgh compound B and florbetapir in cross-sectional and longitudinal studies . Alzheimers Dement. Diagn. Assess. Dis. Monit . 11 , 180 – 190 . doi: 10.1016/j.dadm.2018.12.008 OpenUrl CrossRef PubMed ↵ Swanson , C.J. , Zhang , Y. , Dhadda , S. , Wang , J. , Kaplow , J. , Lai , R.Y.K. , Lannfelt , L. , Bradley , H. , Rabe , M. , Koyama , A. , Reyderman , L. , Berry , D.A. , Berry , S. , Gordon , R. , Kramer , L.D. , Cummings , J.L. , 2021 . A randomized, double-blind, phase 2b proof-of-concept clinical trial in early Alzheimer’s disease with lecanemab, an anti-Aβ protofibril antibody . Alzheimers Res. Ther . 13 , 80 . doi: 10.1186/s13195-021-00813-8 OpenUrl CrossRef PubMed ↵ Tam , A. , Laurent , C. , Gauthier , S. , Dansereau , C. , 2022 . Prediction of cognitive decline for enrichment of Alzheimer’s disease clinical trials . J. Prev. Alzheimers Dis . 9 , 400 – 409 . doi: 10.14283/jpad.2022.49 OpenUrl CrossRef ↵ Thal , D.R. , Rüb , U. , Orantes , M. , Braak , H. , 2002 . Phases of Aβ-deposition in the human brain and its relevance for the development of AD . Neurology 58 , 1791 – 1800 . doi: 10.1212/WNL.58.12.1791 OpenUrl Abstract / FREE Full Text ↵ Tustison , N.J. , Avants , B.B. , Cook , P.A. , Zheng , Y. , Egan , A. , Yushkevich , P.A. , Gee , J.C. , 2010 . N4ITK: Improved N3 bias correction . IEEE Trans. Med. Imaging 29 , 1310 – 1320 . doi: 10.1109/TMI.2010.2046908 OpenUrl CrossRef PubMed Web of Science ↵ van der Kall , L.M. , Truong , T. , Burnham , S.C. , Doré , V. , Mulligan , R.S. , Bozinovski , S. , Lamb , F. , Bourgeat , P. , Fripp , J. , Schultz , S. , Lim , Y.Y. , Laws , S.M. , Ames , D. , Fowler , C. , Rainey-Smith , S.R. , Martins , R.N. , Salvado , O. , Robertson , J. , Maruff , P. , Masters , C.L. , Villemagne , V.L. , Rowe , C.C. , 2021 . Association of β-Amyloid level, clinical progression, and longitudinal cognitive change in normal older individuals . Neurology 96 , e662 – e670 . doi: 10.1212/WNL.0000000000011222 OpenUrl Abstract / FREE Full Text ↵ Villemagne , V.L. , Mulligan , R.S. , Pejoska , S. , Ong , K. , Jones , G. , O’Keefe , G. , Chan , J.G. , Young , K. , Tochon-Danguy , H. , Masters , C.L. , Rowe , C.C. , 2012 . Comparison of 11C-PiB and 18F-florbetaben for Aβ imaging in ageing and Alzheimer’s disease . Eur. J. Nucl. Med. Mol. Imaging 39 , 983 – 989 . doi: 10.1007/s00259-012-2088-x OpenUrl CrossRef PubMed ↵ Wang , C. , Tachimori , H. , Yamaguchi , H. , Sekiguchi , A. , Li , Y. , Yamashita , Y. , 2024 . A multimodal deep learning approach for the prediction of cognitive decline and its effectiveness in clinical trials for Alzheimer’s disease . Transl. Psychiatry 14 , 1 – 11 . doi: 10.1038/s41398-024-02819-w OpenUrl CrossRef PubMed ↵ Wolz , R. , Schwarz , A.J. , Gray , K.R. , Yu , P. , Hill , D.L.G. , For the Alzheimer’s Disease Neuroimaging Initiative , 2016 . Enrichment of clinical trials in MCI due to AD using markers of amyloid and neurodegeneration . Neurology 87 , 1235 – 1241 . doi: 10.1212/WNL.0000000000003126 OpenUrl Abstract / FREE Full Text ↵ Yala , A. , Mikhael , P.G. , Strand , F. , Lin , G. , Smith , K. , Wan , Y.-L. , Lamb , L. , Hughes , K. , Lehman , C. , Barzilay , R. , 2021 . Toward robust mammography-based models for breast cancer risk . Sci. Transl. Med . 13 , eaba4373. doi: 10.1126/scitranslmed.aba4373 OpenUrl Abstract / FREE Full Text View the discussion thread. Back to top Previous Next Posted March 16, 2026. Download PDF Supplementary Material Data/Code Email Thank you for your interest in spreading the word about medRxiv. NOTE: Your email address is requested solely to identify you as the sender of this article. Your Email * Your Name * Send To * Enter multiple addresses on separate lines or separate them with commas. You are going to email the following Predicting future cognitive impairment in preclinical Alzheimer’s disease using amyloid PET and MRI: a multisite machine learning study Message Subject (Your Name) has forwarded a page to you from medRxiv Message Body (Your Name) thought you would like to see this page from the medRxiv website. Your Personal Message CAPTCHA This question is for testing whether or not you are a human visitor and to prevent automated spam submissions. Share Predicting future cognitive impairment in preclinical Alzheimer’s disease using amyloid PET and MRI: a multisite machine learning study Braden Yang , Tom Earnest , Murat Bilgel , Marilyn S. Albert , Sterling C. Johnson , Christos Davatzikos , Guray Erus , Colin L. Masters , Susan M. Resnick , Michael I. Miller , Arnold Bakker , John C. Morris , Tammie L.S. Benzinger , Brian A. Gordon , Aristeidis Sotiras , the Alzheimer’s Disease Neuroimaging Initiative , the Preclinical Alzheimer’s Disease Consortium medRxiv 2025.10.15.25337507; doi: https://doi.org/10.1101/2025.10.15.25337507 Share This Article: Copy Citation Tools Predicting future cognitive impairment in preclinical Alzheimer’s disease using amyloid PET and MRI: a multisite machine learning study Braden Yang , Tom Earnest , Murat Bilgel , Marilyn S. Albert , Sterling C. Johnson , Christos Davatzikos , Guray Erus , Colin L. Masters , Susan M. Resnick , Michael I. Miller , Arnold Bakker , John C. Morris , Tammie L.S. Benzinger , Brian A. Gordon , Aristeidis Sotiras , the Alzheimer’s Disease Neuroimaging Initiative , the Preclinical Alzheimer’s Disease Consortium medRxiv 2025.10.15.25337507; doi: https://doi.org/10.1101/2025.10.15.25337507 Citation Manager Formats BibTeX Bookends EasyBib EndNote (tagged) EndNote 8 (xml) Medlars Mendeley Papers RefWorks Tagged Ref Manager RIS Zotero Tweet Widget Facebook Like Google Plus One Subject Area Radiology and Imaging Subject Areas All Articles Addiction Medicine (570) Allergy and Immunology (863) Anesthesia (301) Cardiovascular Medicine (4442) Dentistry and Oral Medicine (444) Dermatology (383) Emergency Medicine (609) Endocrinology (including Diabetes Mellitus and Metabolic Disease) (1511) Epidemiology (15231) Forensic Medicine (30) Gastroenterology (1126) Genetic and Genomic Medicine (6610) Geriatric Medicine (668) Health Economics (998) Health Informatics (4542) Health Policy (1370) Health Systems and Quality Improvement (1613) Hematology (543) HIV/AIDS (1266) Infectious Diseases (except HIV/AIDS) (15924) Intensive Care and Critical Care Medicine (1103) Medical Education (623) Medical Ethics (147) Nephrology (668) Neurology (6608) Nursing (346) Nutrition (999) Obstetrics and Gynecology (1146) Occupational and Environmental Health (957) Oncology (3338) Ophthalmology (974) Orthopedics (369) Otolaryngology (420) Pain Medicine (436) Palliative Medicine (130) Pathology (665) Pediatrics (1693) Pharmacology and Therapeutics (692) Primary Care Research (712) Psychiatry and Clinical Psychology (5449) Public and Global Health (9240) Radiology and Imaging (2203) Rehabilitation Medicine and Physical Therapy (1370) Respiratory Medicine (1196) Rheumatology (596) Sexual and Reproductive Health (714) Sports Medicine (530) Surgery (712) Toxicology (99) Transplantation (289) Urology (265) (function(){function c(){var b=a.contentDocument||a.contentWindow.document;if(b){var d=b.createElement('script');d.innerHTML="window.__CF$cv$params={r:'a0205b410d49ad07',t:'MTc3OTgzNjAxMQ=='};var a=document.createElement('script');a.src='/cdn-cgi/challenge-platform/scripts/jsd/main.js';document.getElementsByTagName('head')[0].appendChild(a);";b.getElementsByTagName('head')[0].appendChild(d)}}if(document.body){var a=document.createElement('iframe');a.height=1;a.width=1;a.style.position='absolute';a.style.top=0;a.style.left=0;a.style.border='none';a.style.visibility='hidden';document.body.appendChild(a);if('loading'!==document.readyState)c();else if(window.addEventListener)document.addEventListener('DOMContentLoaded',c);else{var e=document.onreadystatechange||function(){};document.onreadystatechange=function(b){e(b);'loading'!==document.readyState&&(document.onreadystatechange=e,c())}}}})();

Text is read by the "Ask this paper" AI Q&A widget below. Extraction quality varies by source — PMC NXML preserves structure cleanly, OA-HTML may include some navigation residue, and OA-PDF can have broken hyphenation. The publisher copy (via DOI) is the canonical version.

My notes (saved in your browser only)

⚙ Ask this paper AI returns verbatim quotes from the full text · source: preprint-html ⓘ

Answers must be backed by verbatim quotes from this paper's full text. Hallucinated quotes are dropped automatically; if no verbatim passage answers the question, we say so. How this works

Citation neighborhood (no data yet)

We don't have any in-corpus citations linked to this paper yet. This is a recent paper (2025) — citers typically take a year or two to land, and the OpenAlex reference graph may still be filling in.

Source provenance

europepmc: last seen: 2026-05-20T01:45:00.602351+00:00