BrainVAE: Exploring the role of white matter BOLD in preclinical Alzheimer’s disease classification

preprint OA: closed
📄 Open PDF Full text JSON View at publisher
Full text 46,867 characters · extracted from preprint-html · click to expand
BrainVAE: Exploring the role of white matter BOLD in preclinical Alzheimer’s disease classification | bioRxiv /* */ /* */ <!-- <!-- /*! * yepnope1.5.4 * (c) WTFPL, GPLv2 */ (function(a,b,c){function d(a){return"[object Function]"==o.call(a)}function e(a){return"string"==typeof a}function f(){}function g(a){return!a||"loaded"==a||"complete"==a||"uninitialized"==a}function h(){var a=p.shift();q=1,a?a.t?m(function(){("c"==a.t?B.injectCss:B.injectJs)(a.s,0,a.a,a.x,a.e,1)},0):(a(),h()):q=0}function i(a,c,d,e,f,i,j){function k(b){if(!o&&g(l.readyState)&&(u.r=o=1,!q&&h(),l.onload=l.onreadystatechange=null,b)){"img"!=a&&m(function(){t.removeChild(l)},50);for(var d in y[c])y[c].hasOwnProperty(d)&&y[c][d].onload()}}var j=j||B.errorTimeout,l=b.createElement(a),o=0,r=0,u={t:d,s:c,e:f,a:i,x:j};1===y[c]&&(r=1,y[c]=[]),"object"==a?l.data=c:(l.src=c,l.type=a),l.width=l.height="0",l.onerror=l.onload=l.onreadystatechange=function(){k.call(this,r)},p.splice(e,0,u),"img"!=a&&(r||2===y[c]?(t.insertBefore(l,s?null:n),m(k,j)):y[c].push(l))}function j(a,b,c,d,f){return q=0,b=b||"j",e(a)?i("c"==b?v:u,a,b,this.i++,c,d,f):(p.splice(this.i++,0,a),1==p.length&&h()),this}function k(){var a=B;return a.loader={load:j,i:0},a}var l=b.documentElement,m=a.setTimeout,n=b.getElementsByTagName("script")[0],o={}.toString,p=[],q=0,r="MozAppearance"in l.style,s=r&&!!b.createRange().compareNode,t=s?l:n.parentNode,l=a.opera&&"[object Opera]"==o.call(a.opera),l=!!b.attachEvent&&!l,u=r?"object":l?"script":"img",v=l?"script":u,w=Array.isArray||function(a){return"[object Array]"==o.call(a)},x=[],y={},z={timeout:function(a,b){return b.length&&(a.timeout=b[0]),a}},A,B;B=function(a){function b(a){var a=a.split("!"),b=x.length,c=a.pop(),d=a.length,c={url:c,origUrl:c,prefixes:a},e,f,g;for(f=0;f<d;f++)g=a[f].split("="),(e=z[g.shift()])&&(c=e(c,g));for(f=0;f<b;f++)c=x[f](c);return c}function g(a,e,f,g,h){var i=b(a),j=i.autoCallback;i.url.split(".").pop().split("?").shift(),i.bypass||(e&&(e=d(e)?e:e[a]||e[g]||e[a.split("/").pop().split("?")[0]]),i.instead?i.instead(a,e,f,g,h):(y[i.url]?i.noexec=!0:y[i.url]=1,f.load(i.url,i.forceCSS||!i.forceJS&&"css"==i.url.split(".").pop().split("?").shift()?"c":c,i.noexec,i.attrs,i.timeout),(d(e)||d(j))&&f.load(function(){k(),e&&e(i.origUrl,h,g),j&&j(i.origUrl,h,g),y[i.url]=2})))}function h(a,b){function c(a,c){if(a){if(e(a))c||(j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}),g(a,j,b,0,h);else if(Object(a)===a)for(n in m=function(){var b=0,c;for(c in a)a.hasOwnProperty(c)&&b++;return b}(),a)a.hasOwnProperty(n)&&(!c&&!--m&&(d(j)?j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}:j[n]=function(a){return function(){var b=[].slice.call(arguments);a&&a.apply(this,b),l()}}(k[n])),g(a[n],j,b,n,h))}else!c&&l()}var h=!!a.test,i=a.load||a.both,j=a.callback||f,k=j,l=a.complete||f,m,n;c(h?a.yep:a.nope,!!i),i&&c(i)}var i,j,l=this.yepnope.loader;if(e(a))g(a,0,l,0);else if(w(a))for(i=0;i (function(w,d,s,l,i){w[l]=w[l]||[];w[l].push({'gtm.start':new Date().getTime(),event:'gtm.js'});var f=d.getElementsByTagName(s)[0];var j=d.createElement(s);var dl=l!='dataLayer'?'&l='+l:'';j.src='//www.googletagmanager.com/gtm.js?id='+i+dl;j.type='text/javascript';j.async=true;f.parentNode.insertBefore(j,f);})(window,document,'script','dataLayer','GTM-M677548'); Skip to main content Home About Submit ALERTS / RSS Search for this keyword Advanced Search New Results BrainVAE: Exploring the role of white matter BOLD in preclinical Alzheimer’s disease classification Yikang Li , Lyuan Xu , Lianrui Zuo , Yukie Chang , Zhaohua Ding , Adam W. Anderson , View ORCID Profile Kurt G. Schilling , John C. Gore , Yurui Gao , the Alzheimer’s Disease Neuroimaging Initiative doi: https://doi.org/10.1101/2025.05.07.652697 Yikang Li 1 Vanderbilt University Institute of Imaging Science, Vanderbilt University Medical Center , Nashville, TN, United States 4 Department of Biomedical Engineering, Vanderbilt University , Nashville, TN, United State Find this author on Google Scholar Find this author on PubMed Search for this author on this site Lyuan Xu 1 Vanderbilt University Institute of Imaging Science, Vanderbilt University Medical Center , Nashville, TN, United States 2 Department of Electrical and Computer Engineering, Vanderbilt University , Nashville, TN, United States Find this author on Google Scholar Find this author on PubMed Search for this author on this site Lianrui Zuo 2 Department of Electrical and Computer Engineering, Vanderbilt University , Nashville, TN, United States Find this author on Google Scholar Find this author on PubMed Search for this author on this site Yukie Chang 5 Department of Computer Science, Pomona College , Claremont, CA, United States Find this author on Google Scholar Find this author on PubMed Search for this author on this site Zhaohua Ding 1 Vanderbilt University Institute of Imaging Science, Vanderbilt University Medical Center , Nashville, TN, United States 2 Department of Electrical and Computer Engineering, Vanderbilt University , Nashville, TN, United States Find this author on Google Scholar Find this author on PubMed Search for this author on this site Adam W. Anderson 1 Vanderbilt University Institute of Imaging Science, Vanderbilt University Medical Center , Nashville, TN, United States 3 Department of Radiology and Radiological Sciences, Vanderbilt University Medical Center , Nashville, TN, United States 4 Department of Biomedical Engineering, Vanderbilt University , Nashville, TN, United State Find this author on Google Scholar Find this author on PubMed Search for this author on this site Kurt G. Schilling 1 Vanderbilt University Institute of Imaging Science, Vanderbilt University Medical Center , Nashville, TN, United States 3 Department of Radiology and Radiological Sciences, Vanderbilt University Medical Center , Nashville, TN, United States Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Kurt G. Schilling John C. Gore 1 Vanderbilt University Institute of Imaging Science, Vanderbilt University Medical Center , Nashville, TN, United States 3 Department of Radiology and Radiological Sciences, Vanderbilt University Medical Center , Nashville, TN, United States 4 Department of Biomedical Engineering, Vanderbilt University , Nashville, TN, United State Find this author on Google Scholar Find this author on PubMed Search for this author on this site Yurui Gao 1 Vanderbilt University Institute of Imaging Science, Vanderbilt University Medical Center , Nashville, TN, United States 4 Department of Biomedical Engineering, Vanderbilt University , Nashville, TN, United State Find this author on Google Scholar Find this author on PubMed Search for this author on this site For correspondence: yurui.gao{at}vanderbilt.edu Abstract Full Text Info/History Metrics Preview PDF Abstract INTRODUCTION Like gray matter (GM), white matter (WM) BOLD functional signals change in preclinical AD. However, the potential of WM BOLD for identifying preclinical AD remains underexplored. METHODS We developed BrainVAE, a transformer-based variational autoencoder with interpretability, to classify preclinical AD and normal controls using resting-state fMRI data. We benchmarked BrainVAE against nine alternative models under three input configurations: WM-only, GM-only, and combined WM+GM. Interpretability analysis was also performed to investigate each brain region’s contribution to the classification task. RESULTS BrainVAE outperformed other models and performed well (accuracy = 83.42%, F1-score = 91.62%, AUC = 64.50%) using the combined input compared to WM-only and GM-only. Specific WM bundles--including corpus callosum, fornix, and corticospinal tract—were among the most influential features contributing to the classification. DISCUSSION Incorporating WM BOLD signals improves the distinction of preclinical AD from controls, underscoring the potential role of WM BOLD features for detecting early-stage AD. Highlights BrainVAE integrates white and gray matter BOLD signals for classification of pre-AD and controls. BrainVAE achieves high accuracy (83.42%) and F1-score (91.62%) in identifying pre-AD. Models using combined WM+GM inputs outperform those using WM-only or GM-only inputs. WM regions, such as corpus callosum and fornix, contribute significantly to model predictions. Results suggest WM BOLD signals are informative markers for early AD detection. 1. Background Alzheimer’s disease (AD) is a progressive neurodegenerative disorder characterized by the accumulation of amyloid-beta (Aβ) plaques and hyperphosphorylated tau proteins, leading to widespread neuronal dysfunction and ultimately cognitive decline 1 . Functional alterations may begin years or even decades before the onset of clinical symptoms, involving both gray matter (GM) and white matter (WM) networks. 2 This prolonged preclinical phase offers a critical window for early detection of AD. Resting state functional MRI (fMRI) has emerged as a promising tool for detecting early functional disturbances in the brain. 2 , 3 However, most prior fMRI research has focused on GM signals, often discarding signals in WM as nuisance variables. 4 , 5 Recent evidence suggests that WM BOLD fluctuations—although weaker—are reliably detectable and associated with brain activity. Importantly, our work has demonstrated that fMRI measures in WM are altered not only in mild cognitive impairment and AD dementia 6 but also during the preclinical AD period 7 , suggesting their potential for early disease classification. Despite these promising observations, it remains unclear whether WM fMRI signals provide additional diagnostic power beyond traditional GM fMRI features alone. We hypothesized that adding WM functional information to GM would enhance performance in identifying preclinical AD. However, testing this hypothesis using traditional methods poses several critical challenges. First, WM BOLD signals inherently possess lower signal-to-noise ratios than GM 8 , 9 , while the functional parcellation of WM remains less mature compared to GM, making it challenging to compute robust and reproducible metrics of functional connectivity. Second, functional connectivity matrices in preclinical AD are characterized by subtle, small-magnitude changes that are distributed across many ROI pairs, requiring models capable of detecting weak and spatially diffuse inter-regional dependencies. 10 , 11 Third, the relatively small number of preclinical AD datasets leads to class imbalance, increasing the risk of overfitting, particularly for standard supervised learning approaches. In addition, recent developments in deep learning provide interpretable attention mechanisms that enable the quantitative assessment of each white matter bundle’s contribution to classification outcomes 12 . To address these challenges, we propose Brain Variational AutoEncoder (BrainVAE) , a novel deep learning model designed to integrate WM and GM fMRI measures for the classification of preclinical AD and controls. First, we employ deep neural networks capable of extracting robust and biologically relevant features from fMRI data with low signal-to-noise ratios and anatomical variability, particularly within WM. Second, we use a transformer-based encoder architecture, whose self-attention mechanism effectively captures subtle and spatially diffuse inter-regional dependencies between brain regions. 13 , 14 , 15 This approach enhances the model’s generalizability while maintaining biological interpretability, enabling accurate identification of preclinical AD based on integrated WM and GM functional connectivities. BrainVAE extends beyond conventional classification models by integrating interpretability directly into its architecture. Through the transformer-based encoder, BrainVAE systematically assigns attention weights to individual GM parcels and WM bundles, enabling identification of brain regions, which is most critical for distinguishing preclinical AD from normal aging. To validate the effectiveness of our approach, we benchmarked BrainVAE against a diverse range of machine learning and deep learning models. Each model was evaluated using three types of input datasets: GM-only, WM-only, and combined GM-WM functional connectivity matrices. This experimental design allowed us to assess both the overall classification performance and the added diagnostic value of incorporating WM signals. Overall, BrainVAE demonstrated robust generalization across input types while providing insights into the functional relevance of WM networks in early AD diagnosis. 2. Methods 2.1 Data and Participants The dataset for primary classification was sourced from the Alzheimer’s Disease Neuroimaging Initiative (ADNI), comprising resting state fMRI and T1-weighted images of 78 participants with preclinical AD (pre-AD) (64% female; 77.0 ± 6.8 years) and 217 normal controls (NC) (56% female; 75.2 ± 7.4 years). All these participants were clinically unimpaired, defined by a Clinical Dementia Rating (CDR) of 0 and a Mini-Mental State Examination (MMSE) score between 24 and 30. Pre-AD participants were Aβ-positive, meeting at least one of the following criteria: cerebrospinal fluid (CSF) Aβ 1.22 17 , Pittsburgh compound B (PiB) PET SUVR > 1.42 18 , or Florbetaben (FBB) PET SUVR > 1.478 19 . In contrast, NC participants were Aβ-negative across all available modalities. For pretraining purposes, fMRI and T1-weighted data from 1953 cognitively normal older participants (55% female; 70.8 ± 7.2 years) were obtained from the Baltimore Longitudinal Study of Aging (BLSA) 20 and the Open Access Series of Imaging Studies (OASIS) 21 . These datasets have comparable spatial resolution, repetition time and number of time points. Detailed cohort characteristics, including demographic information and clinical measures, are summarized in Table 1 . View this table: View inline View popup Table 1. Characteristics of the Study Cohort including classification datasets and pretrain datasets. Note: a Uncorrected P < .05 b FDR-corrected P < .05 2.2 Data Processing Data processing includes image preprocessing and evaluation of FC matrices, briefly stated as below (see ref 7 for more details). The fMRI images were first corrected for slice timing and head motion; participants with head rotation > 2° or head translation > 2mm were excluded. Twenty-four motion parameters and the mean signal from CSF were regressed out 22 . Each time series was detrended and bandpass filtered (0.01– 0.1□Hz). These preprocessing steps were executed using the Data Processing Assistant for Resting-State fMRI toolbox 23 . Meanwhile, tissue probability maps (TPMs) for brain-wide GM, WM, and CSF were generated by segmenting the T1-weighted images using the Computational Anatomy Toolbox (CAT12) 24 . Both the filtered fMRI data and TPMs were normalized to MNI space. To prevent partial volume effects at the WM-GM interface, spatial smoothing was intentionally omitted. GM and deep WM were parcellated into 200 cortical parcels and 48 WM bundles, based on the Schaefer atlas 25 and the JHU’s Eve atlas 26 , respectively, resulting in a total of 248 regions ( Fig. 1a ). Regional time series were extracted by averaging the z-scored time series within each region. FC was computed using Pearson’s correlation between the time series of each pair of regions, yielding a 248□×□248 FC matrix for each participant. To curb the spurious correlations arising from noise alone, FC values below 0.1 were set to zero. Download figure Open in new tab Figure 1. The overall pipeline of BrainVAE consists of three stages: pretraining, supervised-learning and joint finetuning. The first datasets on the upper left are the large healthy datasets that are used for pretraining stage. The labeled datasets were used in the supervised-learning and joint finetuning stages. Download figure Open in new tab Figure 2. The main architecture of the Transformer-based encoder in the BrainVAE model. 2.3 BrainVAE Model FC matrices are derived from datasets with significant class imbalance, as the number of preclinical AD scans is substantially lower relative to cognitively normal controls. Under these circumstances a discriminative neural network is prone to over□fitting the minority class and to ignoring subtle but physiologically meaningful signals between-group difference. We therefore adopt a variational auto□encoder framework, which first learns—without labels—a low□dimensional, smooth manifold representing normal GM and WM connectivity. Supervised classification is performed only in that compressed latent space; these yields strong regularization, an explicit probabilistic measure of abnormality via the latent Kullback–Leibler (KL) term, and a principled way to combine unsupervised information from 1,953 healthy controls with the limited labelled cohort. The neural network, shown in Figure 1 , comprises a transformer□based encoder that converts a 248□×□248 correlation matrix,□ X , into latent mean µ and log-variance log ( σ 2 ), a decoder that reconstructs x from a stochastic latent vector z , and a multilayer perceptron classifier that maps s ∈ ℝ 2 . To stabilize learning under class imbalance (78□pre-AD vs 217□CN), network parameters are optimized in three successive stages described in Section 2.3.3 . 2.3.1 Pretrained Variational AutoEncoder In this study, the input to the VAE is the correlation matrix derived from each participant’s resting-state fMRI signals. For each participant we observe a symmetric correlation matrix: The goal is to encode the matrix into a latent vector z ∈ ℝ d , d = 64, distributed according to the Gaussian prior p ( z ) = N(0, I), and then decode z back into a reconstructed correlation matrix with the least difference compared to X . During the pretraining, the network is optimized so that the reconstructed output is close to the original input, but with additional constraints that ensure the latent space remains well-organized and continuous. The encoder portion of the VAE applies several learnable transformations to the correlation matrix. The encoder parameterized by ϕ approximates the posterior distribution: where µ ϕ and log are learned functions mapping the input FC matrix X ∈ ℝ N × N to a d-dimensional latent space, representing the mean and variance of the Gaussian distribution, respectively. Instead of directly sampling z from these learned distributions (which would break the computational graph), a reparameterization step is introduced. In this step, the network draws random noise ϵ from a standard normal distribution and constructs so that the backpropagation algorithm can still update all parameters. The decoder p ψ ( X | z ) receives z and attempts to reconstruct the correlation matrix Since the reconstruction target is correlation coefficient, which has values between -1 to 1, we used a hyperbolic tangent as the final activation layer to enforce this data range. Reconstruction fidelity is measured with a mean-squared error (MSE) or similar criterion, ensuring that reconstructed matrices approximate the actual functional connectivity patterns in the training dataset. To keep the latent variables from collapsing onto arbitrary points, an additional penalty term known as the Kullback– Leibler (KL) divergence is included. The KL term forces the learned distribution N ( µ, σ 2 ) to remain close to a chosen prior (typically N (0, I )). Thus, the overall training objective for stage 1 can be written as: where B is the mini batch size, and α = 1. The first term encourages accurate reconstruction; the KL term constrains the latent distribution to remain close to the unit Gaussian, preventing “holes” where the decoder has never been trained and thus enforcing a smooth, informative latent manifold. 2.3.2 Transformer-based Autoencoder Traditional multilayer perceptron (MLP) encoders treat each input as an independent feature and rely on fully connected layers to capture relationships across regions, which can be inefficient or ineffective for modeling complex inter-regional dependencies in brain connectivity data. To better capture the structured relationships inherent in functional connectivity (FC) matrices, we adopted a transformer-based encoder architecture. Transformers are suited for this task due to their self-attention mechanism, which explicitly models pairwise interactions between all regions of interest (ROIs), regardless of spatial proximity or ordering. By treating each row of the FC matrix (i.e., each ROI’s connectivity profile) as a token, the transformer can learn contextualized representations that reflect both local and global connectivity patterns. This structure-aware encoding is especially valuable in the context of preclinical AD, where subtle but distributed alterations in connectivity may serve as early biomarkers. The transformer encoder was used for both the unsupervised pretraining phase and the downstream classification task. The inputs for the transformer-based encoder are the rows of X interpreted as 248 ordered tokens { x 1 , x 2 , …, x N }∈ ℝ N . Each token is linearly embedded , where W emb ∈ ℝ d × N , d is the dimensionality of each query or key, followed by batch normalization across tokens. Then two identical self-attention blocks (dropout□0.3) are stacked. For a set of token features H ∈ ℝ d × N , each attention head h computes , with learnable projections where queries: , keys: and values: . Our transformer based encoder has four heads, which run in parallel; their outputs are concatenated, passed through a 256-unit feed-forward network, and combined with residual connections and layer-norm—this constitutes one transformer block, yielding a depth sufficient to model higher-order connectivity patterns while avoiding over-fitting. Our transformer-based encoder enables the latent representation z to encode not only the overall covariance structure but also specific region-to-region dependencies that may be highly relevant for distinguishing preclinical AD from normal aging. In the final classification step, the network extracts z and feeds it into a supervised head (a series of fully connected layers) trained to categorize each participant as either cognitively normal or pre-AD. 2.3.3 Three □ stage training protocol The main architecture of BrainVAE leverages the strengths of both unsupervised representation learning and attention-driven encoding. In this case, to maximize the strength of representation learning and avoid the classic label imbalance problems, we stated the three stages training protocol within the BrainVAE model. The first stage is unsupervised pre-training the transformer-based encoder and decoder. During the process, parameters ( ϕ, ϕ ) are learned by minimizing ℒ VAE on 2□000 healthy controls. Weights yielding the lowest validation loss are retained. In the second stage, the classifier is trained on the labeled classification datasets while the encoder and decoder are frozen. The supervised loss is defined as the combination of a class-balanced Focal term 26 ℒ CB − Focal and the differentiable AUROC surrogate 27 ℒ AUC : In the third stage, all parameters of encoder, decoder and classifier are trained in a joint loss function for fine tuning. The composite loss is defined as: where λ KL =10 −3 and , β max =0.3, and T is the number of epochs. 2.4 Benchmark Models and Performance Assessments To validate the effectiveness of the proposed model, a comprehensive set of benchmark models was implemented for comparisons, including classic machine learning algorithms, convolution neural networks (CNN)-based models, and graph neural networks (GNN)-based models ( Fig. 3 ). Specifically, the machine learning models included support vector machines (SVM) 30 , multilayer perceptron (MLP) 31 , and random forests 32 , all of which used regional time series as input. The CNN-based models included BrainNetCNN 33 , Transformer 34 and Brain Network Transformer 14 , using FC matrices as input. The GNN-based models included BrainGNN 35 , interpretable GNN (IBGNN) 36 and its variant IBGNN+. These models operate on graph representations, where nodes represent brain regions and edge weights encode inter-regional functional connectivity. Download figure Open in new tab Figure 3. The benchmarked models across different types of data and different approaches. Model performance was assessed using five-fold cross-validation. with accuracy, F1-score, and receiver operating characteristic curve (AUC) as assessment metrics. Each model was evaluated on three input configurations: one with only GM parcels, one with only WM bundles, and one combining both. This experimental design aimed to assess whether adding WM features improved classification performance. 2.5 Interpretability Analysis The BrainVAE framework incorporates a transformer-based attention encoder, which not only boosts classification accuracy but also provides interpretability by highlighting the most informative brain regions across the cohort. Specifically, the attention mechanism learned to assign higher attention weights to brain regions—either GM parcels or WM bundles—that contribute more to the classification of preclinical AD and NC. The regional importance scores were extracted by averaging the attention weights across all self-attention heads. Higher importance score indicated a larger contribution to the classification. In the combined configuration (WM+GM), attention scores were specifically examined to quantify how integral WM bundles were to the network’s understanding of emerging pathology. The presence of WM bundles among the top-ranked features provided evidence supporting the critical role of WM signals in early disease detection. 3. Results 3.1 BrainVAE benchmarking BrainVAE achieved averaged classification accuracies of 0.7763, 0.8271, and 0.8342 for the WM-only, GM-only and combined WM+GM configurations, respectively, outperforming all nine benchmark models ( Table 2 ). It also yielded the highest average F1-scores for all three configurations: 0.873 (WM-only), 0.904 (GM-only) and 0.916 (WM+GM). In terms of AUC, BrainVAE ranked first for the WM-only and WM+GM configurations, and among the top three for GM-only. Collectively, these results suggest that BrainVAE model provides superior overall classification performance ( Table 2 ). View this table: View inline View popup Download powerpoint Table 2. The performance comparison between BrainVAE and other models with different types of data input. Using only WM BOLD features, BrainVAE achieved a 6% higher AUC, 6% lower accuracy and 3% lower F1-score compared to the GM-only inputs, suggesting that WM BOLD carries at least comparable information to conventional GM BOLD for classification. Notably, all benchmark models showed lower or almost the same AUCs when using WM-only versus GM-only input ( Table 2 ), indicating BrainVAE may be uniquely more sensitive to WM BOLD information. 3.2 Classification with combined WM and GM features Across nearly all models, performance was improved when using combined WM+GM features as input, compared to using either WM-only or GM-only input alone. The combined input consistently produced the highest accuracy, F1-score, and AUC for most models. Full comparisons across models and input types are presented in Table 2 (and illustrated in Fig. 4 ). Download figure Open in new tab Figure 4. Visualization of classification performance (Accuracy, AUC, and F1-score) for BrainVAE and baseline models across three input conditions: white matter only, gray matter only, and combined matter. 3.3 Interpretability Analysis Results Figure 5A presents the resulting attention score matrix for the combined WM+GM input, where rows and columns correspond to 248 ROIs (200 GM, 48 WM). Download figure Open in new tab Figure 5. A. Correlation attention scores across combined gray and white matter ROIs, indicating network-level contributions to classification. B. Ranked importance scores for each ROI, with gray matter (orange) and white matter (blue), highlighting the top five white matter ROIs. C. Top five important white matter ROIs identified by BrainVAE’s attention mechanism for pre-clinical Alzheimer’s disease classification. To evaluate the importance of each ROI, we summed the attention weights across each row in the matrix. The resulting importance distribution is shown in Figure 5B , with GM and WM regions color-coded in orange and blue, respectively. Several WM bundles ranked among the highest in attention score, with some exceeding all GM parcels. The top-ranked WM regions were further visualized in Figure 5C , including left tapetum, splenium of corpus callosum, body of corpus callosum, fornix, and right corticospinal tract. 4. Discussion The main goal of this study is to investigate whether incorporating WM functional signals, alongside the more commonly studied GM connectivity patterns, could enhance the classification of individuals with pre-AD versus normal controls. Leveraging a novel transformer-based variational autoencoder, BrainVAE, we systematically evaluated classification performance across multiple input configurations and model types. Three key findings emerged: (1) BrainVAE consistently outperformed all benchmark models in distinguishing pre-AD from cognitively normal controls; (2) combining WM+GM input led to improved classification accuracy across a range of models; and (3) attention-based interpretability revealed that several WM bundles were among the most influential regions contributing to model predictions. 4.1 Overall Performance of BrainVAE BrainVAE achieved the highest performance in distinguishing preclinical AD from normal controls, demonstrating its ability to extract informative functional features for classification even if no between-group differences were observed in clinical cognitive scores ( Table 1 ). Classification accuracy remained consistent across different input conditions, including WM-only (0.7763), GM-only (0.8271), and combined WM+GM (0.8342), with relatively small performance gap. This suggests that BrainVAE is capable of effectively leveraging information from WM connectivity, even in face of its lower signal-to-noise ratio and less mature functional parcellation. In addition, the model produced stable results across cross-validation folds, as reflected by the small standard deviations reported in Table 2 , indicating robustness to class imbalance and limited sample sizes in the pre-AD group. Across all benchmark models, BrainVAE consistently achieved the highest classification performance under each input condition, including WM-only, GM-only, and combined GM-WM connectivity. This suggests that its transformer-based encoder and variational autoencoder structure provided stronger representational capacity for capturing informative features in the functional connectivity data. 4.2 Value of WM BOLD signals Not only BrainVAE, but also nearly all benchmark models demonstrated improved classification performance when using combined WM+GM input compared to GM-only or WM-only, regardless of model architecture. While GM-only inputs generally outperformed WM-only, the combined input consistently yielded the highest accuracy, F1-score, and AUC across all model categories. These findings highlight the added diagnostic value of incorporating WM BOLD features and suggest that its contribution is robust across both classic machine learning and deep learning frameworks. 4.3 Interpretability Analysis The interpretability results revealed that BrainVAE does not distribute predictive attention uniformly across all brain regions, but instead concentrates it on a selective subset of regions, spanning both WM bundles and GM parcels. The distribution of attention weights exhibited a non-random, asymmetric pattern, where a small number of regions—particularly within WM—received disproportionately high scores. This indicates that the model identifies localized functional features as critical for classification, rather than treating all regions as equally informative or relying on uniform global patterns. The consistent presence of WM bundles among the top-ranked attention regions suggests that the model considers functional interactions within WM as directly informative, rather than as secondary or supporting input. At the same time, known GM regions associated with early-stage AD also received relatively high attention scores, reflecting BrainVAE’s integration of complementary contributions from both tissue types for decision-making. Together, these findings demonstrate that BrainVAE’s architecture provides a selective focus on functionally meaningful connections and support a regionally specific decision-making strategy that spans both WM and GM domains. 4.4 Biological Relevance The WM bundles identified as critical to BrainVAE’s classification decisions—including the left tapetum, splenium of the corpus callosum, and fornix—are anatomically positioned to support long-range connectivity between cortical regions. The fornix and tapetum are involved in limbic and memory-related processing, while the corpus callosum facilitates interhemispheric information transfer. These tracts contribute to large-scale networks that subserve episodic memory, attention, and executive function—domains known to be subtly affected in the preclinical stage of AD 37 . The elevated attention weights assigned to these tracts align with accumulating evidence that WM abnormalities may precede or co-occur with cortical atrophy in AD. Myelin loss and axonal disruption in these regions have been linked to Aβ accumulation, particularly during the asymptomatic stage 38 , 39 . Moreover, alterations in the posterior callosal regions and corticospinal tract have been associated with early functional impairment in motor-related systems, which may reflect broader network disintegration that extends beyond cognitive circuits 40 . These findings support a growing body of work indicating that functional connectivity in WM is not merely epiphenomenal but may provide early biomarkers for AD detection. Functional MRI studies have shown that BOLD signals in WM are both detectable and behaviorally meaningful, particularly when analyzed in the context of WM–GM integration 41 , 42 . The identification of high-attention WM bundles by BrainVAE suggests that these regions may capture subtle disruptions in long-range communication that are difficult to detect with GM features alone. Taken together, these results reinforce a network-based perspective of AD pathology, in which early dysfunction involves distributed alterations across both WM and GM structures, potentially mediated by molecular and structural degeneration within WM tracts. 5. Conclusion In conclusion, this work demonstrates that accounting for WM BOLD features (time series, FC, and graphs) substantially enhanced the detection of preclinical AD. The synergy between WM and GM features underscores the network-centric character of early AD pathology, offering an expanded view beyond cortical atrophy alone. By elucidating which parcels and bundles particularly contribute to classification, the BrainVAE model provides a framework for future efforts in refining early biomarkers and improving disease characterization. Acknowledgements This work was supported by NIH grants RF1MH123201 (Gore and Landman), R01NS113832 (Gore), R21AG083915 (Gao), K01EB032898 (Schilling), I would like to thank my supervisors, Dr. John Gore, Dr. Kurt Schilling and Dr. Yurui Gao for their guidance and support throughout this project. Funder Information Declared NIH , RF1MH123201 , R01NS113832 , R21AG083915 , K01EB032898 Footnotes ↵ a Data used in preparation of this article were obtained from the Alzheimer’s Disease Neuroimaging Initiative (ADNI) database (adni.loni.usc.edu). As such, the investigators within the ADNI contributed to the design and implementation of ADNI and/or provided data but did not participate in analysis or writing of this report. A complete listing of ADNI investigators can be found at: http://adni.loni.usc.edu/wp-content/uploads/how_to_apply/ADNI_Acknowledgement_List.pdf . References 1. ↵ Jack Jr. , C. R. et al. NIA-AA Research Framework: Toward a biological definition of Alzheimer’s disease . Alzheimer’s & Dementia 14 , 535 – 562 ( 2018 ). OpenUrl CrossRef 2. ↵ Wang , L. et al. Cerebrospinal fluid Aβ42, phosphorylated Tau181, and resting-state functional connectivity . JAMA Neurol 70 , 1242 – 1248 ( 2013 ). OpenUrl PubMed 3. ↵ Wang , K. et al. Altered functional connectivity in early Alzheimer’s disease: a resting-state fMRI study . Hum Brain Mapp 28 , 967 – 978 ( 2007 ). OpenUrl CrossRef PubMed Web of Science 4. ↵ Gore , J. C. et al. Functional MRI and resting state connectivity in white matter - a mini-review . Magn Reson Imaging 63 , 1 – 11 ( 2019 ). OpenUrl CrossRef PubMed 5. ↵ Ding , Z. et al. Detection of synchronous brain activity in white matter tracts at rest and under functional loading . Proc Natl Acad Sci U S A 115 , 595 – 600 ( 2018 ). OpenUrl Abstract / FREE Full Text 6. ↵ Gao , Y. et al. Functional connectivity of white matter as a biomarker of cognitive decline in Alzheimer’s disease . PLoS One 15 , e0240513 ( 2020 ). OpenUrl CrossRef PubMed 7. ↵ Xu , L. et al. Reductions in the white-gray functional connectome in preclinical Alzheimer’s disease and their associations with amyloid and cognition . Alzheimers Dement 20 , 8317 – 8330 ( 2024 ). OpenUrl CrossRef PubMed 8. ↵ Grajauskas , L. A. , Frizzell , T. , Song , X. & D’Arcy , R. C. N. White Matter fMRI Activation Cannot Be Treated as a Nuisance Regressor: Overcoming a Historical Blind Spot . Front. Neurosci . 13 , ( 2019 ). 9. ↵ Frontiers | Functional MRI activation in white matter during the Symbol Digit Modalities Test . https://www.frontiersin.org/journals/human-neuroscience/articles/10.3389/fnhum.2014.00589/full . 10. ↵ Sui , J. , Jiang , R. , Bustillo , J. & Calhoun , V. Neuroimaging-based Individualized Prediction of Cognition and Behavior for Mental Disorders and Health: Methods and Promises . Biological Psychiatry 88 , 818 – 828 ( 2020 ). OpenUrl CrossRef PubMed 11. ↵ Sohn , W. S. , Yoo , K. , Na , D. L. & Jeong , Y. Progressive Changes in Hippocampal Resting-state Connectivity Across Cognitive Impairment: A Cross-sectional Study From Normal to Alzheimer Disease . Alzheimer Disease & Associated Disorders 28 , 239 ( 2014 ). OpenUrl CrossRef PubMed 12. ↵ Qiu , S. et al. Development and validation of an interpretable deep learning framework for Alzheimer’s disease classification . Brain 143 , 1920 – 1933 ( 2020 ). OpenUrl CrossRef PubMed 13. ↵ Dosovitskiy , A. et al. An Image is Worth 16×16 Words: Transformers for Image Recognition at Scale. in ( 2020 ). 14. ↵ Kan , X. et al. Brain Network Transformer . Advances in Neural Information Processing Systems 35 , 25586 – 25599 ( 2022 ). OpenUrl 15. ↵ Kingma , D. P. & Welling , M. An Introduction to Variational Autoencoders . MAL 12 , 307 – 392 ( 2019 ). OpenUrl 16. ↵ Vos , S. J. et al. Preclinical Alzheimer’s disease and its outcome: a longitudinal cohort study . Lancet Neurol 12 , 957 – 965 ( 2013 ). OpenUrl CrossRef PubMed Web of Science 17. ↵ Mishra , S. et al. AV-1451 PET imaging of tau pathology in preclinical Alzheimer disease: Defining a summary measure . Neuroimage 161 , 171 – 178 ( 2017 ). OpenUrl CrossRef PubMed 18. ↵ Vlassenko , A. G. et al. Imaging and cerebrospinal fluid biomarkers in early preclinical alzheimer disease . Ann Neurol 80 , 379 – 387 ( 2016 ). OpenUrl CrossRef PubMed 19. ↵ Sabri , O. et al. Florbetaben PET imaging to detect amyloid beta plaques in Alzheimer’s disease: phase 3 study . Alzheimers Dement 11 , 964 – 974 ( 2015 ). OpenUrl CrossRef PubMed 20. ↵ Resnick , S. M. et al. One-year age changes in MRI brain volumes in older adults . Cereb Cortex 10 , 464 – 472 ( 2000 ). OpenUrl CrossRef PubMed Web of Science 21. ↵ Marcus , D. S. et al. Open Access Series of Imaging Studies (OASIS): cross-sectional MRI data in young, middle aged, nondemented, and demented older adults . J Cogn Neurosci 19 , 1498 – 1507 ( 2007 ). OpenUrl CrossRef PubMed Web of Science 22. ↵ Friston , K. J. , Williams , S. , Howard , R. , Frackowiak , R. S. & Turner , R. Movement-related effects in fMRI time-series . Magn Reson Med 35 , 346 – 355 ( 1996 ). OpenUrl CrossRef PubMed Web of Science 23. ↵ Yan , C.-G. , Wang , X.-D. , Zuo , X.-N. & Zang , Y.-F. DPABI: Data Processing & Analysis for (Resting-State) Brain Imaging . Neuroinformatics 14 , 339 – 351 ( 2016 ). OpenUrl CrossRef PubMed 24. ↵ Gaser , C. et al. CAT: a computational anatomy toolbox for the analysis of structural MRI data . Gigascience 13 , giae049 ( 2024 ). OpenUrl CrossRef PubMed 25. ↵ Kong , R. et al. Individual-Specific Areal-Level Parcellations Improve Functional Connectivity Prediction of Behavior . Cereb Cortex 31 , 4477 – 4500 ( 2021 ). OpenUrl CrossRef PubMed 26. ↵ Mori , S. et al. Stereotaxic white matter atlas based on diffusion tensor imaging in an ICBM template . Neuroimage 40 , 570 – 582 ( 2008 ). OpenUrl CrossRef PubMed Web of Science 27. ↵ Vaswani , A. et al. Attention Is All You Need. Preprint at doi: 10.48550/arXiv.1706.03762 ( 2023 ). OpenUrl CrossRef 28. Lin , T.-Y. , Goyal , P. , Girshick , R. , He , K. & Dollar , P. Focal Loss for Dense Object Detection . IEEE Trans Pattern Anal Mach Intell 42 , 318 – 327 ( 2020 ). OpenUrl CrossRef PubMed 29. Cui , Y. , Jia , M. , Lin , T.-Y. , Song , Y. & Belongie , S. Class-Balanced Loss Based on Effective Number of Samples. in 9268 – 9277 ( 2019 ). 30. ↵ Hearst , M. A. , Dumais , S. T. , Osuna , E. , Platt , J. & Scholkopf , B. Support vector machines . IEEE Intelligent Systems and their Applications 13 , 18 – 28 ( 1998 ). OpenUrl CrossRef 31. ↵ Gardner , M. W. & Dorling , S. R. Artificial neural networks (the multilayer perceptron)—a review of applications in the atmospheric sciences . Atmospheric Environment 32 , 2627 – 2636 ( 1998 ). OpenUrl CrossRef Web of Science 32. ↵ Breiman , L. Random Forests . Machine Learning 45 , 5 – 32 ( 2001 ). OpenUrl CrossRef 33. ↵ Kawahara , J. et al. BrainNetCNN: Convolutional neural networks for brain networks; towards predicting neurodevelopment . NeuroImage 146 , 1038 – 1049 ( 2017 ). OpenUrl CrossRef PubMed 34. ↵ Khan , S. et al. Transformers in Vision: A Survey . ACM Comput. Surv . 54 , 200:1-200: 41 ( 2022 ). OpenUrl 35. ↵ Li , X. et al. BrainGNN: Interpretable Brain Graph Neural Network for fMRI Analysis . Medical Image Analysis 74 , 102233 ( 2021 ). OpenUrl CrossRef PubMed 36. ↵ Wang , L. , Dou , Q. , Fletcher , P. T. , Speidel , S. & Li , S. Cui , H. et al. /person-group>. Interpretable Graph Neural Networks for Connectome-Based Brain Disorder Analysis . in Medical Image Computing and Computer Assisted Intervention – MICCAI 2022 (eds. Wang , L. , Dou , Q. , Fletcher , P. T. , Speidel , S. & Li , S. ) 375 – 385 ( Springer Nature Switzerland, Cham , 2022 ). doi: 10.1007/978-3-031-16452-1_36 . OpenUrl CrossRef 37. ↵ Pereira , J. B. et al. Abnormal Structural Brain Connectome in Individuals with Preclinical Alzheimer’s Disease . Cereb Cortex 28 , 3638 – 3649 ( 2018 ). OpenUrl CrossRef PubMed 38. ↵ Dean , D. C. , III . et al. Association of Amyloid Pathology With Myelin Alteration in Preclinical Alzheimer Disease . JAMA Neurology 74 , 41 – 49 ( 2017 ). OpenUrl CrossRef PubMed 39. ↵ Roher , A. E. et al. Increased A beta peptides and reduced cholesterol and myelin proteins characterize white matter degeneration in Alzheimer’s disease . Biochemistry 41 , 11080 – 11090 ( 2002 ). OpenUrl CrossRef PubMed Web of Science 40. ↵ Silbert , L. C. , Nelson , C. , Howieson , D. B. , Moore , M. M. & Kaye , J. A. Impact of white matter hyperintensity volume progression on rate of cognitive and motor decline . Neurology 71 , 108 – 113 ( 2008 ). OpenUrl CrossRef PubMed 41. ↵ Marussich , L. , Lu , K.-H. , Wen , H. & Liu , Z. Mapping white-matter functional organization at rest and during naturalistic visual perception . NeuroImage 146 , 1128 – 1141 ( 2017 ). OpenUrl CrossRef PubMed 42. ↵ Li , M. , Newton , A. T. , Anderson , A. W. , Ding , Z. & Gore , J. C. Characterization of the hemodynamic response function in white matter tracts for event-related fMRI . Nat Commun 10 , 1140 ( 2019 ). OpenUrl CrossRef PubMed View the discussion thread. Back to top Previous Next Posted May 13, 2025. Download PDF Email Thank you for your interest in spreading the word about bioRxiv. NOTE: Your email address is requested solely to identify you as the sender of this article. Your Email * Your Name * Send To * Enter multiple addresses on separate lines or separate them with commas. You are going to email the following BrainVAE: Exploring the role of white matter BOLD in preclinical Alzheimer’s disease classification Message Subject (Your Name) has forwarded a page to you from bioRxiv Message Body (Your Name) thought you would like to see this page from the bioRxiv website. Your Personal Message CAPTCHA This question is for testing whether or not you are a human visitor and to prevent automated spam submissions. Share BrainVAE: Exploring the role of white matter BOLD in preclinical Alzheimer’s disease classification Yikang Li , Lyuan Xu , Lianrui Zuo , Yukie Chang , Zhaohua Ding , Adam W. Anderson , Kurt G. Schilling , John C. Gore , Yurui Gao , the Alzheimer’s Disease Neuroimaging Initiative bioRxiv 2025.05.07.652697; doi: https://doi.org/10.1101/2025.05.07.652697 Share This Article: Copy Citation Tools BrainVAE: Exploring the role of white matter BOLD in preclinical Alzheimer’s disease classification Yikang Li , Lyuan Xu , Lianrui Zuo , Yukie Chang , Zhaohua Ding , Adam W. Anderson , Kurt G. Schilling , John C. Gore , Yurui Gao , the Alzheimer’s Disease Neuroimaging Initiative bioRxiv 2025.05.07.652697; doi: https://doi.org/10.1101/2025.05.07.652697 Citation Manager Formats BibTeX Bookends EasyBib EndNote (tagged) EndNote 8 (xml) Medlars Mendeley Papers RefWorks Tagged Ref Manager RIS Zotero Tweet Widget Facebook Like Google Plus One Subject Area Neuroscience Subject Areas All Articles Animal Behavior and Cognition (7629) Biochemistry (17660) Bioengineering (13881) Bioinformatics (41911) Biophysics (21436) Cancer Biology (18578) Cell Biology (25482) Clinical Trials (138) Developmental Biology (13371) Ecology (19887) Epidemiology (2067) Evolutionary Biology (24302) Genetics (15599) Genomics (22483) Immunology (17728) Microbiology (40364) Molecular Biology (17163) Neuroscience (88537) Paleontology (666) Pathology (2830) Pharmacology and Toxicology (4821) Physiology (7637) Plant Biology (15129) Scientific Communication and Education (2045) Synthetic Biology (4290) Systems Biology (9817) Zoology (2269)

Text is read by the "Ask this paper" AI Q&A widget below. Extraction quality varies by source — PMC NXML preserves structure cleanly, OA-HTML may include some navigation residue, and OA-PDF can have broken hyphenation. The publisher copy (via DOI) is the canonical version.

My notes (saved in your browser only)

Ask this paper AI returns verbatim quotes from the full text · source: preprint-html

Answers must be backed by verbatim quotes from this paper's full text. Hallucinated quotes are dropped automatically; if no verbatim passage answers the question, we say so. How this works

Citation neighborhood (no data yet)

We don't have any in-corpus citations linked to this paper yet. This is a recent paper (2025) — citers typically take a year or two to land, and the OpenAlex reference graph may still be filling in.

Source provenance

europepmc
last seen: 2026-05-20T01:45:00.602351+00:00