Quantum-Enhanced Transfer Learning for MS Lesion Detection in MRI: A Hybrid Classical-Quantum Framework

doi:10.1101/2025.11.16.25340339

Quantum-Enhanced Transfer Learning for MS Lesion Detection in MRI: A Hybrid Classical-Quantum Framework

2025 · doi:10.1101/2025.11.16.25340339

preprint OA: closed

📄 Open PDF Full text JSON View at publisher

Full text 73,383 characters · extracted from preprint-html · click to expand

Quantum-Enhanced Transfer Learning for MS Lesion Detection in MRI: A Hybrid Classical-Quantum Framework | medRxiv /* */ /* */ <!-- <!-- /*! * yepnope1.5.4 * (c) WTFPL, GPLv2 */ (function(a,b,c){function d(a){return"[object Function]"==o.call(a)}function e(a){return"string"==typeof a}function f(){}function g(a){return!a||"loaded"==a||"complete"==a||"uninitialized"==a}function h(){var a=p.shift();q=1,a?a.t?m(function(){("c"==a.t?B.injectCss:B.injectJs)(a.s,0,a.a,a.x,a.e,1)},0):(a(),h()):q=0}function i(a,c,d,e,f,i,j){function k(b){if(!o&&g(l.readyState)&&(u.r=o=1,!q&&h(),l.onload=l.onreadystatechange=null,b)){"img"!=a&&m(function(){t.removeChild(l)},50);for(var d in y[c])y[c].hasOwnProperty(d)&&y[c][d].onload()}}var j=j||B.errorTimeout,l=b.createElement(a),o=0,r=0,u={t:d,s:c,e:f,a:i,x:j};1===y[c]&&(r=1,y[c]=[]),"object"==a?l.data=c:(l.src=c,l.type=a),l.width=l.height="0",l.onerror=l.onload=l.onreadystatechange=function(){k.call(this,r)},p.splice(e,0,u),"img"!=a&&(r||2===y[c]?(t.insertBefore(l,s?null:n),m(k,j)):y[c].push(l))}function j(a,b,c,d,f){return q=0,b=b||"j",e(a)?i("c"==b?v:u,a,b,this.i++,c,d,f):(p.splice(this.i++,0,a),1==p.length&&h()),this}function k(){var a=B;return a.loader={load:j,i:0},a}var l=b.documentElement,m=a.setTimeout,n=b.getElementsByTagName("script")[0],o={}.toString,p=[],q=0,r="MozAppearance"in l.style,s=r&&!!b.createRange().compareNode,t=s?l:n.parentNode,l=a.opera&&"[object Opera]"==o.call(a.opera),l=!!b.attachEvent&&!l,u=r?"object":l?"script":"img",v=l?"script":u,w=Array.isArray||function(a){return"[object Array]"==o.call(a)},x=[],y={},z={timeout:function(a,b){return b.length&&(a.timeout=b[0]),a}},A,B;B=function(a){function b(a){var a=a.split("!"),b=x.length,c=a.pop(),d=a.length,c={url:c,origUrl:c,prefixes:a},e,f,g;for(f=0;f<d;f++)g=a[f].split("="),(e=z[g.shift()])&&(c=e(c,g));for(f=0;f<b;f++)c=x[f](c);return c}function g(a,e,f,g,h){var i=b(a),j=i.autoCallback;i.url.split(".").pop().split("?").shift(),i.bypass||(e&&(e=d(e)?e:e[a]||e[g]||e[a.split("/").pop().split("?")[0]]),i.instead?i.instead(a,e,f,g,h):(y[i.url]?i.noexec=!0:y[i.url]=1,f.load(i.url,i.forceCSS||!i.forceJS&&"css"==i.url.split(".").pop().split("?").shift()?"c":c,i.noexec,i.attrs,i.timeout),(d(e)||d(j))&&f.load(function(){k(),e&&e(i.origUrl,h,g),j&&j(i.origUrl,h,g),y[i.url]=2})))}function h(a,b){function c(a,c){if(a){if(e(a))c||(j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}),g(a,j,b,0,h);else if(Object(a)===a)for(n in m=function(){var b=0,c;for(c in a)a.hasOwnProperty(c)&&b++;return b}(),a)a.hasOwnProperty(n)&&(!c&&!--m&&(d(j)?j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}:j[n]=function(a){return function(){var b=[].slice.call(arguments);a&&a.apply(this,b),l()}}(k[n])),g(a[n],j,b,n,h))}else!c&&l()}var h=!!a.test,i=a.load||a.both,j=a.callback||f,k=j,l=a.complete||f,m,n;c(h?a.yep:a.nope,!!i),i&&c(i)}var i,j,l=this.yepnope.loader;if(e(a))g(a,0,l,0);else if(w(a))for(i=0;i (function(w,d,s,l,i){w[l]=w[l]||[];w[l].push({'gtm.start':new Date().getTime(),event:'gtm.js'});var f=d.getElementsByTagName(s)[0];var j=d.createElement(s);var dl=l!='dataLayer'?'&l='+l:'';j.src='//www.googletagmanager.com/gtm.js?id='+i+dl;j.type='text/javascript';j.async=true;f.parentNode.insertBefore(j,f);})(window,document,'script','dataLayer','GTM-P4HH5NV'); Skip to main content Home About Submit ALERTS / RSS Search for this keyword Advanced Search Quantum-Enhanced Transfer Learning for MS Lesion Detection in MRI: A Hybrid Classical-Quantum Framework View ORCID Profile Mohadeseh Zarei Ghobadi , View ORCID Profile Elaheh Afsaneh doi: https://doi.org/10.1101/2025.11.16.25340339 Mohadeseh Zarei Ghobadi 1 Independent Researcher , Tehran, Iran Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Mohadeseh Zarei Ghobadi For correspondence: mohadesehzaree{at}gmail.com Elaheh Afsaneh 1 Independent Researcher , Tehran, Iran Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Elaheh Afsaneh Abstract Full Text Info/History Metrics Data/Code Preview PDF Abstract Accurate detection of multiple sclerosis (MS) lesions in magnetic resonance imaging (MRI) requires robust deep learning models to capture subtle spatial and textural features. We introduce hybrid quantum-classical transfer learning algorithms for MS classification using axial and sagittal MRI scans, combining classical convolutional neural networks (CNNs) including EfficientNetB3, ResNet50, DenseNet121 with parameterized quantum circuits to enhance feature representation via entanglement and quantum-specific non-linearities. Quantum layers are trained end-to-end with classical backbones via backpropagation, enabling seamless integration of quantum-enhanced features. For axial MRI, QResNet50 achieved a high accuracy of 97.58% and AUC of 99.31%, while QDenseNet121 reached 97.28% accuracy and 99.13% AUC. For sagittal MRI, classical ResNet50 excelled with 99.15% accuracy and 99.93% AUC, while QEfficientNetB3 improved accuracy (97.46% to 98.30%) but reduced AUC (99.51% to 99.32%), and QDenseNet121 achieved 98.87% accuracy and 99.83% AUC. Hybrid models showed mixed results, with QCNN underperforming, suggesting quantum benefits are architecture-dependent. Despite simulated quantum circuits mitigating hardware limitations, our results demonstrate the potential to enhance diagnostic performance in specific architectures. This work clarifies a foundational step toward quantum-enhanced deep learning for clinical applications, opening research directions in quantum-aware transfer learning and error mitigation for biomedical imaging. 1 Introduction Quantum machine learning (QML), which lies at the intersection of quantum computing and classical machine learning, has undergone significant advancements in recent years due to the unique strengths of quantum technology in enhancing data processing and model training ( 1 ). However, current hardware limitations, such as limited qubit counts and error rate, continue to pose challenges for the full realization and scalability of quantum models ( 2 , 3 ). Quantum neural networks (QNNs), a key component of QML, have demonstrated promising results across various domains by utilizing quantum phenomena like superposition and entanglement to improve learning performance. Among the various quantum neural network architectures, Quantum Convolutional Neural Networks (QCNNs) have emerged as a powerful hybrid quantum-classical approaches ( 4 ). QCNNs utilize the potential of quantum computing inspired by classical convolutional neural networks to reduce dimensionality and tackle complex high-dimensional problems. This approach is especially valuable in healthcare applications and medical diagnostics, particularly for the early detection of Multiple Sclerosis (MS), where timely and accurate diagnosis is critical. Multiple Sclerosis is a chronic inflammatory disorder of the central nervous system characterized by damage to the myelin sheath and nerve fibers ( 5 ). The myelin sheath is a fatty-protein coating that insulates nerve cells in the brain and spinal cord, enabling rapid transmission of electrical impulses ( 6 ). Damage to this protective layer disrupts nerve signal conduction and leads to the formation of scar tissue, known as plaques or sclerosis. The number of people suffering from this disease is estimated to be approximately 2-3 million worldwide ( 7 ). Multiple sclerosis is more commonly observed in young to middle-aged females, although this has not always been the case ( 8 ). The etiology of MS remains unclear, but it is widely recognized as a multifactorial disease influenced by genetic and environmental risk factors ( 9 , 10 ). The pathology of MS is highly heterogeneous, posing challenges in accurately diagnosing the disease in its early stages, measuring progression, and evaluating treatment efficacy ( 8 ). Its diagnosis remains difficult due to the absence of specific symptoms, physical findings, or laboratory tests that can definitively confirm the condition ( 11 ). Consequently, physicians rely on a combination of diagnostic methods, including thorough review of the patient’s medical history, neurological examinations, magnetic resonance imaging (MRI), cerebrospinal fluid analysis, and blood tests ( 10 , 12 – 15 ) to exclude other conditions that present with similar symptoms. Among these, MRI modalities are considered the most effective non-invasive tool for detecting MS lesions, providing crucial information about brain structure and tissue abnormalities. MRI biomarker, such as lesion count, evolution over time, and brain volume measurements (including grey matter and white matter) are valuable indicators for disease prognosis and treatment response ( 16 – 19 ). To enhance diagnostic accuracy, boost efficiency, and minimize manual errors, artificial intelligence (AI)-powered computer-aided diagnosis systems have been integrated with conventional MRI technology. Recent advancements in AI, particularly deep learning (DL) methods like convolutional neural networks (CNNs), has significantly enhanced the accuracy and efficiency of diagnosing MS through MRI data analysis ( 20 , 21 ). In a study, multiple sclerosis patients were categorized based on their disability level using a deep learning model incorporating convolutional neural networks ( 22 ). The model outperformed traditional methods by effectively extracting optimal MRI features. Attention-map analysis showed the frontotemporal cortex and cerebellum play crucial roles in predicting disability and also indicated that MS progression involves a complex distribution of neural damage across the central nervous system. In another study, a four-layer deep belief network was used to extract latent features from normal-appearing white and gray matter image patches, selected via voxel-wise t-tests and excluding lesion-overlapping areas ( 23 ). These features were then undergone LASSO-based selection to reduce overfitting and are used to train a random forest classifier to distinguish multiple sclerosis patients from healthy controls. The integration of multimodal myelin and T1-weighted features enhanced classification accuracy compared to single-modality approaches, highlighting the advantage of joint feature learning in improving predictive performance. To improve the accuracy of multiple sclerosis diagnosis using MRI scans, a model was developed that integrates a multi-view ResNet architecture with novel attention mechanisms-the View Space Attention Block (VSAB) and View Channel Attention Block (VCAB)-to extract detailed features from 2D brain images. Additionally, the Quantum RIME (QRIME) algorithm was introduced, combining RIME with Quantum Behaved Particle Swarm Optimization (QPSO) to perform efficient dimensionality reduction, thereby enhancing both diagnostic accuracy and computational efficiency ( 24 ). The results showed the potential of AI applications in improving the early detection of neurodegenerative diseases. In another study, disability progression prediction in MS patients was investigated using a time-dependent deep learning model based on sequential medical imaging data ( 25 ). The study captured temporal relationships across multiple MRI timepoints and demonstrated that quantum models achieved competitive performance compared to classical neural network architectures in binary classification of MS disability. In this study. we explored the application of classical and hybrid quantum-classical deep learning models for the detection of MS lesions in axial and sagittal brain MRI scans. Given the heterogeneous spatial distribution and textural characteristics of MS lesions, the ability of these models to adapt to such variability plays a crucial role in achieving reliable and robust diagnostic performance. Leveraging transfer learning techniques with architectures such as ResNet50, EfficientNetB3, and DenseNet121, we established a classical baseline before integrating parameterized quantum circuits to form hybrid quantum-classical models. A comparative evaluation across imaging planes revealed distinct performance trends, showing both the promise and current limitations of quantum-enhanced deep learning in the context of medical image analysis. This study is systematically organized to investigate hybrid quantum-classical approaches for MS detection. The Introduction highlights the clinical importance of MS diagnosis and reviews the application of deep learning methods in improving diagnostic accuracy using MRI data. The Methods section provides a rigorous technical exposition of: (i) classical CNN architectures (CNN, DenseNet121, ResNet50, EfficientNetB3) and their quantum hybrid variants, (ii) quantum circuit design principles including amplitude/angle embedding strategies, and (iii) the experimental framework encompassing data preprocessing and hyperparameter optimization. The Results section presents a comprehensive performance analysis across axial and sagittal MRI planes, with quantitative evaluation through accuracy, precision, recall, F1-score, and AUC metrics. The Discussion explains these findings within current literature, examines the differences between quantum and classical performance, and addresses practical implementation constraints. Finally, the Conclusion synthesizes key insights regarding quantum-enhanced feature learning while outlining future research directions in quantum medical imaging. 2 Theoretical Background 2.1 Quantum Computing In this section, we provide a brief background and introduce fundamental quantum computing concepts. These preliminaries will be used to describe the QCNN algorithms in the following sections. Quantum bit (qubit) A qubit is mathematically described as a vector in a two-dimensional Hilbert space, with the computational basis states |0⟩ and |1⟩ forming its foundation ( 26 ). Unlike classical bits, qubits can exist in a superposition state, meaning they can simultaneously represent a linear combination of these basis states weighted by complex probability amplitudes. This property enables quantum entanglement, where the states of several qubits become connected so that the state of each qubit depends on the others, no matter how far apart they are. When one qubit in an entangled system is measured, its state collapses and immediately determines the states of the others. These extraordinary features allow entangled qubits to encode and process information in ways that far exceed the capabilities of classical bits, giving quantum computers the potential to solve certain complex problems much more efficiently than traditional computers. Quantum gates Quantum gates are mathematical operations that act on one or more qubits to change their quantum states ( 27 ). The most commonly used gates include the Hadamard, CNOT, Rotation, and Pauli gates. The Hadamard gate creates superposition by transforming a qubit from a definite state into a combination of |0⟩ and |1⟩ states, while the CNOT gate as a two-qubit gate generates entanglement between qubits. Rotation gates perform parameterized rotations around the X . Y . or Z axes of the Bloch sphere, and Pauli gates ( X . Y . and Z ) are used for controlled bit and phase flips. Quantum circuits Quantum circuits consist of sequences of quantum gates arranged according to quantum algorithms to manipulate qubits ( 28 ). These circuits generate superposition and entanglement, which serve as fundamental resources for quantum computation. Quantum gates and circuits form the foundational elements in designing quantum computing models. Within a quantum circuit, measurement gates convert quantum states into classical information by collapsing them. Typically, several measurements are conducted, and their results are aggregated to estimate observable values and make predictions ( 29 ). 2.2 Quantum neural network (QNN) A quantum neural network in contrast to a classical convolutional neural network, consists of quantum layers that typically include three main components: embedding (data encoding), quantum circuits (often variational circuits with parameterized gates and entanglement), and measurement ( 30 ). Initially, classical data is encoded into a quantum state via a state preparation routine or feature map, which is usually designed to enhance model performance ( 31 ). Following encoding, a variational quantum circuit with parameterized gates is applied and optimized for a specific task through loss function minimization ( 32 ). The output of the quantum model is then obtained by measuring the quantum state and applying classical post-processing to the measurement outcomes. This framework allows QNNs to leverage quantum phenomena to potentially improve computational efficiency and representational capacity compared to classical neural networks. 2.3 Quantum Encoding Quantum machine learning relies on embedding classical data into quantum states using quantum principles ( 33 ). This process involves mapping data vectors into parameters that define quantum circuits, thereby generating quantum feature representations in Hilbert space. Two common encoding methods are amplitude encoding and angle encoding. Amplitude encoding In amplitude encoding, classical data is embedded into the probability amplitudes of a quantum state. By exploiting quantum superposition, the encoded information is accessed by measuring the quantum state’s amplitudes ( 34 ). A key advantage is its efficiency in representing large datasets using relatively few qubits. Specifically, encoding a classical dataset with M data points and N features per point requires n = log 2 ( NM ) qubits. To perform amplitude encoding, classical data vectors x = ( x 1 . x 2 . …. x N ) are mapped to quantum states as: where | i ⟩ denotes the computational basis states and x i represents the i -th component of the classical data. The quantum system is initially prepared in the all-zero state |0⟩ ⊗ n . where n is the number of qubits determined by the dataset size. A sequence of unitary operations, such as rotations and controlled gates, is then applied to transform this initial state into the desired encoded quantum state. Angle encoding Angle encoding embeds classical data into quantum states via parameterized rotations around the X . Y . or Z axes, with angles corresponding to data values. For example, a classical data vector x = ( x 1 . x 2 . …. x N ) can be encoded using rotations around the Y -axis as: Angle encoding maps each feature to the rotation angle of a single qubit, requiring one qubit per feature. This method uses relatively fewer quantum gates, enhancing its compatibility with existing quantum hardware. Generally, encoding a dataset with n features requires exactly n qubits. For datasets with a large number of features, amplitude encoding requires fewer qubits per data point but demands a higher number of quantum gates to prepare the corresponding quantum state. In contrast, angle encoding is simpler and more resilient to noise on current quantum devices, making it more practical given existing hardware limitations. However, angle encoding is less efficient when handling high-dimensional data. Each method offers distinct advantages and trade-offs, where the choice between amplitude and angle encoding depends on the available quantum hardware capabilities and the specific requirements of the machine learning task ( 35 ). 2.4 Circuit Design The circuit design defines the sequence and types of quantum gates applied to the qubits after data encoding ( 36 ). Typically, this involves a combination of parameterized rotation gates and entangling gates applied to neighboring qubits. Entangling gates create quantum correlations across adjacent qubits, enabling the circuit to exploit quantum phenomena such as superposition and interference. This enhanced representational power enables quantum convolutional layers to capture more complex features from imaging data. During training, the parameters of the rotation gates are optimized to minimize a loss function, tailoring the quantum circuit to the specific learning task. 2.5 Measurement and Output Features After processing through the quantum convolutional layer, measurements are performed on the qubits to extract expectation values of specific observables. These quantum-derived features constitute the output of the quantum layer and can be fed into subsequent layers-either quantum or classical-enabling hybrid quantum-classical architectures. 3 Methods 3.1 Dataset details and preprocessing We utilized a dataset comprising 1441 axial and 2016 sagittal FLAIR MRI brain images exhibiting visible MS lesions, alongside 2016 axial and sagittal image slices depicting normal brain appearance without white matter lesions ( 37 ). The images prospectively collected from 72 patients diagnosed with MS and 59 healthy control subjects. Fig. 1 presents ten representative samples, with randomly selected axial images from the MS and healthy groups shown in Fig. 1a and Fig. 1b , respectively, and sagittal images from the MS and healthy groups displayed in Fig. 1c and Fig. 1d , respectively. Download figure Open in new tab Fig. 1. Representative MRI samples from MS and healthy groups. Randomly selected axial images from (a) MS and (b) healthy groups; Randomly selected sagittal images from (c) MS and (d) healthy groups. We divided the dataset into training, validation, and test subsets to ensure robust model evaluation. Initially, the entire dataset was split into a combined training-validation set and a separate test set, with 20% of the data reserved for testing. This division employed stratified sampling to preserve the original class distribution across the subsets, thereby preventing class imbalance issues ( 38 ). Subsequently, the combined training-validation set was further split into distinct training and validation subsets, allocating 20% of the data for validation. Both splitting steps were conducted using a fixed random seed to ensure reproducibility of the data partitions. For training data, augmentation was performed using Kornia, a PyTorch-based computer vision library ( 39 ). Fig. 2a and Fig. 2b depict the size of the training image data before augmentation for axial and sagittal images, respectively, while Fig. 2c illustrates the size of the training image data following augmentation. Download figure Open in new tab Fig. 2. Training image dataset sizes before and after augmentation. (a) Number of axial training images before augmentation. (b) Number of sagittal training images before augmentation. (c) Number of training images after augmentation. To standardize input dimensions for the mode, all images were resized to 224 × 224 pixels. We normalized pixel intensities to the [0.1] range by dividing by the maximum 8-bit value (255), ensuring consistent input scaling throughout the dataset. 3.2 Classical deep learning algorithms 3.2.1 Convolutional neural network Among DL models. convolutional neural networks are particularly prominent and widely applied in tasks such as object detection, speech recognition, image classification, and biomarker detection ( 40 , 41 ). CNNs employ multi-layered architectures to learn hierarchical data representations, where each layer extracts increasingly complex features ( 42 ). This structure integrates feature extraction and classification into a single efficient framework that requires minimal preprocessing. As a result, CNNs can automatically learn and identify patterns directly from raw data without manual intervention. The core components of CNNs include convolutional layers, activation functions, pooling layers, and fully connected layers ( 41 ). Convolutional layers These layers extract distinctive features from input data through multiple convolution operations using learnable kernels ( 43 ). This process preserves spatial structure while reducing parameters through local connectivity and parameter sharing, enabling hierarchical feature learning. The output of a convolutional layer is a set of feature maps that highlight specific patterns in the data. Activation functions These functions are applied directly to the output of convolutional layers to introduce non-linearity into the model ( 44 ). This non-linearity allows CNNs to capture and represent complex, non-linear relationships within data. It enables the network to solve tasks beyond simple linear classification or regression and to effectively model intricate real-world patterns. Common activation functions include the Rectified Linear Unit (ReLU), sigmoid, and hyperbolic tangent (tanh). Pooling layers These layers usually follow convolutional and activation layers and reduce the number of network connections by downsampling and reducing the dimensionality of the input data ( 45 ). This reduction in data size lowers computational demands and aids in minimizing overfitting. Fully connected (FC) layer The FC layer is typically positioned at the end of a CNN to connect every neuron to all neurons in the preceding layer ( 46 ). It receives input from the last convolutional or pooling layer and acts as a classifier to enable the network to make predictions. In this study, we implement a classical CNN architecture composed of a fixed convolutional base followed by a configurable dense classifier. The convolutional base includes two blocks: each consists of a Conv2d layer with ReLU activation and max pooling. Specifically, the first block applies 32 filters of size 3×3 with unit padding to the input, followed by ReLU and 2×2 max pooling with stride 2. The second block increases the number of filters to 64 while maintaining the same kernel and padding configuration. After feature extraction, spatial dimensions are flattened into a vector whose size is determined dynamically during initialization via a dummy forward pass. The classifier module is then constructed based on this inferred input size and consists of a variable number of fully connected layers, each followed by ReLU activation and dropout regularization. The final dense layer outputs logits for two classes. Formally, given an input tensor x ∈ℝ 3×B× H × W , the network computes: where x flat is the resulting flattened feature vector with shape B × d in . B represents the batch size (number of input samples processed together), d in denotes the flattened feature dimension output by the convolutional base. d prev and d units represent the input and output dimensions of each linear transformation, respectively. This modular design supports flexible experimentation with network depth and regularization strength while maintaining a simple and interpretable baseline CNN structure. 3.2.2 DenseNet121 Architecture DenseNet (Densely Connected Convolutional Network) is a convolutional neural network architecture designed to improve feature reuse and gradient flow by establishing direct connections between all layers within a dense block ( 47 ). DenseNet121, a 121-layer variant, achieves high parameter efficiency and strong performance in image classification tasks, making it well-suitable for medical imaging applications ( 48 ). Unlike traditional CNNs, where layers receive input only from the immediately preceding layer, DenseNet121 connects each layer to every preceding layers in the same dense block by concatenating their feature maps. Formally, the output of layer ℓ is defined as: Where, [ x 0 . x 1 . …. x l −1 ] denotes the concatenation of feature maps from all previous layers, and H ℓ is a composite function comprising batch normalization ( BN ), ReLU activation, and a 3×3 convolution (Conv 3×3 ). To improve computational efficiency, a 1×1 convolution (bottleneck layer. Conv 1×1 ) precedes H l to reduce channel dimensionality and to improve computational efficiency: Each layer in a dense block produces k feature maps, where k is the growth rate (commonly 32), resulting an output channel count after l layers: In our implementation, we used the pretrained DenseNet121 backbone from torchvision, modified to freeze the initial stem layer and the first dense block to prevent overfitting on small datasets. The final classifier layer is replaced with a configurable stack of FC layers, including ReLU activations and dropout regularization. Specifically: The output of the DenseNet121 backbone is passed through an adaptive average pooling layer, reducing spatial dimensions to 1×1. The resulting tensor is flattened into a 1024-dimensional feature vector. A variable number of FC layers follow, each with configurable width and dropout rate. The final linear layer outputs logits for two classes. 3.2.3 ResNet50 Architecture Residual Networks (ResNet) address the vanishing gradient problem by introducing residual connections that facilitate the training of deeper convolutional neural networks ( 49 ). These skip connections allow gradients to flow more directly through the network, simplifying optimization and improving learning stability. While residual connections help mitigate vanishing gradients, batch normalization and ReLU activation also play critical roles in ensuring stable and efficient training. ResNet50, a 50-layer variant, achieves strong performance in image classification and is widely adopted in various applications due to its balance between accuracy and computational efficiency ( 50 ). The architecture begins with a stem comprising a 7×7 convolution, batch normalization, ReLU activation, and a 3×3 max-pooling layer, which transforms input images into feature maps of size 64 channels. This is followed by four stages of residual bottleneck blocks. Each block expands, transforms, and reduces channel dimensions using three convolutional layers: two 1×1 convolutions and one 3×3 convolution: Where, Conv 1×1 expand expands channels, Conv 3×3 applies a 3×3 convolution, and Conv 1×1 reduce reduces channels to the output dimension C out . A skip connection adds the input x to the output. with a 1×1 convolution applied to x if channel dimensions differ. For an input of size 224×224, the final stage of four outputs feature maps of size 7×7×2048, which are spatially reduced via an adaptive average pooling layer to a 2048-dimensional vector: The classifier consists of a configurable stack of fully connected layers, each with ReLU activation and dropout, culminating in a final linear layer that produces class logits: Where, Flatten converts the pooled features into a vector of size 2048 ( 51 ). To leverage transfer learning, we initialize the ResNet50 backbone using pretrained weights from a specified path. The stem and the first residual stage— including the initial convolution, batch normalization, activation, max pooling, and first residual block — were frozen to preserve low-level features learned on large-scale datasets. Later layers and the newly defined dense classifier were fine-tuned during training. 3.2.4 EfficientNet-B3 Architecture EfficientNet is a family of convolutional neural networks that optimize accuracy and efficiency by uniformly scaling network depth, width, and input resolution using a compound scaling factor ( 52 , 53 ). EfficientNet-B3, a mid-sized variant, balances computational cost and performance, making it suitable for image classification tasks. The architecture is composed of a stem layer followed by a sequence of mobile inverted bottleneck convolution (MBConv) blocks augmented with squeeze-and-excitation (SE) modules ( 54 ). Each MBConv block processes input feature maps x ∈ℝ H × W × C in through the following operations: Here, Conv 1×1 expand increases channel dimensionality, Conv k × k depthwise applies a depthwise convolution, and Conv reduce reduces channels. A residual skip connection adds the input x to the output when their dimensions’ match. The SE feature maps via global average pooling and two fully connected layers: Where, GlobalAvgPool reduces spatial dimensions. FC 1 and FC 2 are fully connected layers and σ is the sigmoid function. The EfficientNet-B3 backbone outputs feature maps of size 1536 channels for standard 224×224 RGB inputs. These feature maps are spatially reduced via global average pooling, resulting in a 1536-dimensional feature vector. The final classifier includes a configurable stack of FC layers with ReLU activation and dropout regularization, culminating in a linear output layer producing class logits: Where, flatten reshapes pooled features into a vector of size 1536. To leverage transfer learning, we initialized the EfficientNet-B3 backbone using pretrained weights. Early layers—including the stem and initial MBConv blocks (up to block 4)—were frozen to retain pretrained features and reduced overfitting on small datasets. Later layers and the newly defined dense classifier were fine-tuned during training. 3.3 Hybrid classical-quantum model In this study, we introduced hybrid classical-quantum models including QCNN, QDenseNet121, QResNet50, and QEfficientNet-B3 that integrate classical convolutional feature extraction with a variational quantum circuit to construct a quantum-enhanced classifier. The architecture is composed of three main components: (i) a classical convolutional base for spatial feature learning, (ii) a dimensionality reduction layer that maps classical features into a quantum-compatible latent space, and (iii) a parametrized quantum circuit followed by a flexible dense classifier. Fig. 3 shows the schematic flowchart of hybrid classical-quantum models architectures that are explained in further sections. Overall details of each architecture are also shown in Fig. 4 . Download figure Open in new tab Fig. 3. Schematic representation of the hybrid classical-quantum architectures. Download figure Open in new tab Fig. 4. Overall details of hybrid classic-quantum architecture. 3.3.1 QCNN Architecture The QCNN model begins with a standard convolutional neural network comprising two blocks of Conv2d-ReLU-MaxPool operations. Each convolutional layer preserves spatial resolution through unit padding while increasing channel depth, followed by 2×2 max pooling that reduces spatial dimensions. This feature extraction stage ensures that the model captures hierarchical spatial patterns before transitioning to quantum processing. The output is then flattened and projected via a linear layer into a latent vector of size n qubits , matching the number of qubits in the subsequent quantum layer. The quantum component is implemented as a parameterized quantum circuit executed on a simulated device using PennyLane ( 55 ). Each qubit undergoes an RX rotation based on the corresponding classical input, followed by multiple layers of entangling CNOT gates and trainable Z-axis rotations. Expectation values of Pauli-Z observables across all qubits are returned as the final measurement and fed into a configurable stack of dense layers. These dense layers consist of fully connected layers, each followed by ReLU activation and dropout regularization, except the final output layer which maps to 2 class logits. The model processes input images through the following stages: Convolutional Feature Extraction: Where, ConvNet consists of two Conv2d-ReLU-MaxPool blocks, reducing spatial dimensions. Flattening and Dimensionality Reduction: Where, σ denotes the sigmoid function, ensuring inputs fall within the valid range for quantum encoding and x talent is obtained through a linear transformation projects the high-dimensional flattened features into a lower-dimensional space with size matching the number of qubits in the quantum circuit Quantum Circuit Layer: The encoded vector x encoded is fed into a variational quantum circuit. Each batch element is processed independently on a simulated quantum device with n q qubits. The circuit performs input encoding: followed by entangling CNOT gates and RZ rotations across layers. Final measurements are taken as: Final Classification: The classifier consists of a customizable sequence of fully connected layers, each followed by ReLU activation and dropout regularization, ending with a final linear layer that outputs the class logits. 3.3.2 QDensenet121/QResNet50 Architecture 1. Classical Feature Extraction The backbone of QDenseNet121 or QResNet50 extract high-level feature vectors z ∈ ℝ 1024 and z∈ ℝ 2048 , respectively, via adaptive average pooling of convolutional feature maps. These vectors are further processed by n dense fully connected layers with ReLU activations and dropout regularization: where ℎ 0 = z . W i ∈ ℝ udense × uin . b i ∈ ℝ udense . u in is the input dimension for the first dense layer, and u dense is the number of units in each classical dense layer, thereafter. The final dense layer projects to a vector of size 2 nqubits : Where, σ is the sigmoid function, ensuring the quantum circuit input parameters lie within [0, π], W q and b q are weight matrix and bias vector projecting the final dense layer output to the quantum circuit input size 2 nqubits . 2. Quantum Circuit Encoding and Variational Layers The vector q is normalized and encoded into a quantum state via amplitude embedding on an n qubits -qubit system: Here, ∣ ψ 0 ⟩ ∈ ℂ 2 is a normalized quantum state. The variational quantum circuit consists of n layers layers, each applying parameterized single-qubit U Rot (θ k.j .0 . θ k.j .1 . θ k.j .2 ) = R z (θ k.j .2 ). R z (θ k.j .1 ). R z (θ k.j .0 ) rotations on qubit j , followed by entangling CNOT gates between adjacent qubits: in which, I denotes identiy matrix and X indicates X rotation. The output is a vector of expectation values: Where, σ x j and σ z j are Pauli operators. 3. Classical Post-Processing and Classification The quantum output e is fed into a classical classifier comprising two fully connected layers with ReLU activation and dropout: Where W i ∈ ℝ udense × uin , b i ∈ ℝ udense , W 2 ∈ ℝ 2× uclassical , y ∈ ℝ 2 represents binary class logits. 3.3.3 QEfficientNetB3-quantum architecture 1. Classical Feature Processing The EfficientNet-B3 backbone extracts a feature vector z∈ℝ 1536 via global average pooling of its final convolutional output. This vector is processed through fully connected layers with ReLU activation and dropout regularization: for i = 1. …. n dense − 1, ℎ 0 = z , W i ∈ ℝ udense × uin , b i ∈ ℝ udense , and u in = 1536 for the first layer and u dense (subsequent layers). The final layer projects to n qubits dimensions (one feature per qubit) and scales to [0,π] via a sigmoid: ensuring rotation angles ∈ [0. π] for quantum encoding. 2. Quantum Circuit Design The circuit employs angle embedding to map classical features to qubit rotations, reducing computational overhead compared to amplitude embedding: 3. Variational Quantum Layers The circuit applies n layers layers of trainable rotations and entangling gates: Rotational Gates: Each layer k applies R x .R Y .R Z rotations parameterized by weights θ k . j.m : Where, j indexes qubits and m indexes rotation axes. Entanglement: CNOT gates create a ring topology (qubit j entangled with ( j +1) mod n qubits ): 4. Measurement and Classical Classifier The circuit measures Pauli-Z expectations on all qubits: A classical fully connected network processes e to produce logits: Where, W2∈R 2×dclassical . 3.3.4 Optimization The hybrid quantum-classical models were trained using a combination of cross-entropy loss and L2 regularization to prevent overfitting and improve generalization: Where t i ∈ {0.1} 2 is the true label, y i = softmax(z i ) is the predicted probability, and || W || 2 is the Frobenius norm of weight matrices, using learning rate η. To further enhance training efficiency and avoid overfitting, we implemented an early stopping mechanism that monitors validation loss during training. This ensures optimal use of computational resources while retaining the most effective model state observed throughout training. Hyperparameter tuning was carried out using Optuna, a powerful framework for automated hyperparameter optimization ( 56 ). Over 50 trials were executed across a predefined search space encompassing both classical and quantum parameters. For each trial, Optuna evaluated model performance based on validation metrics, iteratively refining its search strategy to identify the most promising configurations. The final optimal set of hyperparameters was selected based on overall performance across training, validation, and test sets. All experiments were conducted on the Leonardo supercomputer, part of the European high-performance computing infrastructure hosted by the CINECA interuniversity consortium ( 57 ). We utilized the “boost_usr_prod” SLURM partition, which provides access to NVIDIA A100 GPUs through the Leonardo Booster environment for accelerated deep learning computations. Additionally, a subset of algorithms was tested using an NVIDIA A100 GPU from a paid Google Colab Pro account to ensure development flexibility and reproducibility across environments. 4 Results The performance metrics highlight the potential of hybrid classical-quantum models for enhancing MS detection, particularly in capturing complex lesion patterns. The optimized hyperparameters for each method are detailed in Table 1 . Improvements in AUC, a critical metric for distinguishing MS lesions from normal tissue, were observed in QDenseNet121 and QResNet50 for axial MRI, suggesting quantum layers can enhance discriminative power in certain architectures. However, inconsistent benefits across models indicate that quantum integration is context-specific, influenced by classical model complexity and quantum circuit design. Performance declines in QCNN and QEfficientNetB3 further reveal the need for careful architectural design to maximize quantum contributions. View this table: View inline View popup Table 1. The optimized hyperparameters for each method. 4.1 Evaluation of Classic and Hybrid Classic-Quantum DL Models for Axial MRI The metrics including accuracy, precision, recall, F1-score, and AUC offer insights into the models’ effectiveness in identifying MS-related features in axial MRI images ( Table 2 ). The results reveal both the strengths of classic DL models and the potential of quantum-enhanced approaches with implications for advancing MS diagnostics. View this table: View inline View popup Download powerpoint Table 2. Performance metrics of classic and hybrid classic-quantum algorithms for axial MRI images. Among the classic DL models, EfficientNetB3 achieved the highest performance, with an accuracy of 98.18%, precision of 98.20%, recall of 98.18%, F1-score of 98.18%, and an AUC of 99.02%. This performance is likely due to EfficientNetB3’s compound scaling approach, which optimizes network architecture to capture the subtle and heterogeneous patterns of MS lesions. ResNet50 and DenseNet121 also performed robustly, with accuracies of 96.97% and 95.77%, respectively, and AUC values above 98%, indicating strong discriminative ability for MS-related features. In contrast, the CNN model showed the lowest performance (accuracy of 93.95%. AUC of 97.81%), suggesting that simpler architectures may struggle to model the complex characteristics of MS lesions. The hybrid classic-quantum models demonstrate varied performance relative to their classic counterparts. Notably, QDenseNet121 showed a significant improvement, with an accuracy increasing from 95.77% to 97.28% and AUC from 98.66% to 99.13%. Similarly, QResNet50 improved accuracy versus classical counterpart (from 96.97% to 97.58%) and AUC (from 98.69% to 99.31%), indicating that quantum circuits may enhance the model’s ability to capture residual features critical for identifying MS-specific patterns. However, the QCNN model exhibited a slight performance decline (accuracy drops from 93.95% to 93.05%. AUC from 97.81% to 96.85%), possibly due to the limited capacity of the CNN architecture to leverage quantum enhancements effectively. Intriguingly, EfficientNetB3’s hybrid model shows no improvement in accuracy (98.18%) and a slight AUC decrease (from 99.02% to 98.14%), suggesting that its highly optimized classic architecture may already be near the performance, leaving little room for quantum contributions. 4.2 Evaluation of Classic and Hybrid Classic-Quantum DL Models for Sagittal MRI For sagittal MRI images, the classic DL models demonstrated exceptional performance, with ResNet50 achieving the highest metrics accuracy, precision, recall, and F1-score all at 99.15%, and an AUC of 99.93% ( Table 3 ). This performance likely reflects ResNet50’s ability to capture deep residual features, which are critical for identifying MS lesions in the sagittal plane, where lesions may appear as irregularly shaped hyperintensities, particularly in the spinal cord or periventricular regions. View this table: View inline View popup Download powerpoint Table 3. Performance metrics of classic and hybrid classic-quantum algorithms for sagittal MRI images. DenseNet121 has the next position, with an accuracy of 98.87%, precision of 98.89%, recall of 98.87%, F1-score of 98.87%, and an AUC of 99.83%, demonstrating its strength in leveraging dense connectivity to model complex lesion patterns. EfficientNetB3, while still highly effective, showed slightly lower performance (accuracy of 97.46% and AUC of 99.51%), possibly due to its scaling strategy being less optimized for the specific spatial characteristics of sagittal images. The CNN model lags behind, with an accuracy of 93.80% and an AUC of 98.31%, indicating that simpler architectures struggle to capture the nuanced features of MS lesions in this plane. The hybrid classic-quantum models showed mixed results compared to their classic counterparts. QDenseNet121 model slightly underperformed, with accuracy decreasing from 98.87% to 98.30% and AUC slightly increasing from 99.83% to 99.88%. This suggests that quantum enhancements may not significantly improve DenseNet121’s already strong performance. However, the AUC of QDenseNet121 (99.83%) was slightly better than classical counterpart (99.88%), indicating potential for better discriminative power. QEfficientNetB3 model showed a notable improvement in accuracy (from 97.46% to 98.30%) but a slight AUC decrease (from 99.51% to 99.32%), suggesting that quantum layers enhance overall classification, but may slightly reduce the model’s ability to rank positive cases. QResNet50 exhibited a performance decrease across all metrics (accuracy from 99.15% to 98.59% and AUC from 99.93% to 99.61%), indicating that quantum integration may disrupt the model’s finely tuned residual learning for sagittal images. The QCNN model also performed worse (accuracy drops from 93.80% to 92.95% and AUC from 98.31% to 97.82%), reinforcing that simpler architectures may not benefit from quantum enhancements, possibly due to limited quantum circuit complexity. 5 Discussion In this study, we investigated the detection of multiple sclerosis lesions in axial and sagittal MRI scans using classical and hybrid quantum-classical deep learning models. Given the diverse spatial and textural patterns of MS lesions, the adaptability of these models to such variations is critical for accurate diagnosis. Our comparative analysis reveals distinct performance trends across architectures and imaging planes, highlighting the potential and limitations of quantum-enhanced DL in medical imaging. Recent advances in deep learning have significantly improved the classification of MS using MRI data, with numerous studies reporting high-performance metrics ( Table 4 ). View this table: View inline View popup Table 4. Comparative overview of previous studies. Macin et al. achieved an accuracy exceeding 98.37% for axial and 97.75% for sagittal MRI images using ExMPLPQ, a method that integrates exemplar-based multi-parametric Local Phase Quantization (LPQ) features with a k-nearest neighbors (kNN) classifier ( 37 ). This method affirmed the enduring effectiveness of handcrafted feature extraction in MS diagnosis. In another study, Tatli et al. developed MSNet, a hybrid MS classification model that innovatively merges deep learning (DenseNet201 and ResNet50) with feature engineering (NCA, ReliefF, and Chi2) and ensemble learning (SVM/kNN + majority voting) ( 58 ). By extracting and refining deep features through transfer learning and iterative voting, the model achieved 97.13% accuracy, demonstrating the advantages of combining deep neural networks with classical machine learning techniques for medical image analysis. Further improvements were observed in studies utilizing CNNs with innovative pooling strategies, such as Wang et al. ( 20 ) and Alijamaat et al. ( 21 ), who reported accuracies of 95.82% and 98.92%, respectively, reinforcing the effectiveness of convolutional architectures in MS classification. Haggag et al. employed a D-CNN model based on Inception V3 across four datasets containing MRI scans from MS patients and healthy controls, achieving mean average precision (mAP) values of 86.20%, 93.77%, 94.18%, and 90.46% for various datasets ( 59 ). Meanwhile. Ekmekyapar and Tascı utilized a hybrid approach combining Exemplar MobileNetv2 with IMrMr feature selection and kNN, attaining accuracy 99.76% on axial images and 99.48% on sagittal images ( 60 ). In our study, EfficientNetB3 achieved the highest performance among classical models for axial MRI images, with an accuracy of 98.18% and an AUC of 99.02%. This considerable performance is attributed to EfficientNetB3’s compound scaling approach, which systematically optimizes network depth, width, and resolution to capture subtle and heterogeneous MS lesion patterns ( 61 ). ResNet50 and DenseNet121 also demonstrated robust performance, with accuracies of 96.97% and 95.77%, respectively, and AUC values exceeding 98%. Their success can be attributed to residual learning and dense feature reuse, which enhance hierarchical feature extraction ( 49 , 53 ). In contrast, the simpler CNN architecture shows the lowest performance, reflecting its limited capacity to model the complex lesion patterns. For sagittal MRI, ResNet50 excelled with near-perfect metrics (accuracy: 99.15% and AUC: 99.93%). DenseNet121 followed closely with an accuracy of 98.87% and an AUC of 99.83%, leveraging dense connectivity to integrate multi-scale features. EfficientNetB3, while still highly effective, showed slightly lower performance (accuracy 97.46% and AUC 99.51%), suggesting its scaling strategy may be less optimal for sagittal-specific features. The CNN again underperformed, reinforcing the need for deeper architectures in MS lesion detection. The hybrid classic-quantum models introduce additional complexity to traditional deep learning architectures, resulting in varied performance across MRI planes and models, dependent on the classical backbone and imaging plane. For axial MRI, QDenseNet121 improved accuracy by 1.51% (95.77% → 97.28%) and AUC by 0.47% (98.66% → 99.13%), likely due to quantum-enhanced feature disentanglement via amplitude embedding. The variational quantum circuit’s non-linear transformations may refine high-dimensional features, improving lesion separability. QResNet50 showed a 0.61% accuracy gain (96.97% → 97.58%) and a 0.62% AUC improvement (98.69% → 99.31%), suggesting quantum entanglement enhances discriminative power for residual features. QEfficientNetB3 exhibited no accuracy improvement (98.18%) and a slight AUC drop (99.02% → 98.14%), indicating its classical optimization may saturate performance. The QCNN model experienced a modest performance decline, with accuracy dropping from 93.95% to 93.05% and AUC decreasing from 97.81% to 96.85%, suggesting that simpler classical backbones may lack the representational capacity to fully leverage quantum augmentation. For Sagittal MRI, QEfficientNetB3 improved accuracy by 0.84% (97.46% → 98.30%) but slightly reduced AUC (99.51% → 99.32%), suggesting a trade-off between classification and ranking performance. QResNet50 and QDenseNet121 showed modest, possibly due to interference with pre-trained residual/dense features critical for sagittal lesions. QCNN model also underperformed in sagittal MRI, reinforcing the notion that simpler architectures struggle to benefit from quantum enhancements, possibly due to limited quantum circuit complexity and classical representational power. The hybrid models employed two primary quantum feature encoding strategies. First, amplitude embedding used in QDenseNet121 and QResNet50. maps classical feature vectors q∈ ℝ nqubits to a normalized quantum state ∣ψ 0 ⟩= q∥(q∥) 2 . Theoretical analyses show that amplitude embedding can exponentially compress high-dimensional data into quantum states; however, it requires O(2 n ) classical preprocessing, which limits scalability ( 62 ). Second, angle embedding, utilized in QEfficientNetB3, encodes n features as qubit rotations nqubits −1 (i)|0⟩, offering better scalability with complexity O(n), but it may lose some global correlations present in the data ( 63 ). The quantum circuits incorporate parametrized rotation gates, which are optimized via backpropagation. These gates introduce quantum-specific non-linear transformations, potentially enhancing feature extraction, as seen in QDenseNet121’s AUC improvement for axial MRI. CNOT gates in a ring topology create entanglement between adjacent qubits, enabling quantum correlations that may capture long-range dependencies across distant image regions, relevant for MS detection due to lesions’ heterogeneous spatial distributions. This mechanism could contribute to QResNet50’s AUC gain, though QEfficientNetB3’s AUC drop suggests context-specific benefits limited by circuit design (e.g., qubit count, entanglement scope). Measurement of the quantum states is performed via Pauli observables ⟨σ x ⟩ and ⟨σ z ⟩. The ⟨σ z ⟩ observable encodes local qubit polarization, which is sensitive to lesion intensity variations, while ⟨σ x ⟩ captures coherence between lesions and healthy tissue. The classical fully connected layers then map the measured quantum features to output predictions, with quantum noise such as shot noise being regularized through dropout techniques. Despite these promising results, several challenges limit the clinical applicability of hybrid classical-quantum models. Current quantum hardware constraints restrict the number of qubits. impacting the dimensionality of the feature space that can be encoded. Additionally, clinical MRI data often contain artifacts. such as motion blur and partial volume effects, which can degrade quantum coherence and computational fidelity. Future work should prioritize error mitigation strategies. such as dynamical decoupling and probabilistic error cancellation, to enhance robustness under noisy conditions. Furthermore. the theoretical framework for quantum advantage in medical imaging remains underdeveloped, with rigorous performance bounds yet to be established. Future research should focus on deriving rigorous mathematical frameworks to quantify the conditions under which quantum enhancements provide measurable improvements over classical approaches. Addressing these challenges will be essential for translating quantum-based diagnostic tools from theoretical constructs into clinically viable solutions. Conclusion This study demonstrates that classical deep learning architectures achieve robust performance in MS lesion detection across different MRI planes, with residual and densely connected networks showing particular effectiveness. Hybrid quantum-classical models provide improvements, enhancing certain architectures through quantum-enabled feature refinement while offering no advantage for simpler networks. The benefits of quantum integration prove highly dependent on both the base model’s design and the specific imaging plane being analyzed. While quantum circuits show promise for medical image analysis through their unique feature encoding and transformation capabilities, their current utility remains constrained by fundamental limitations in scalability and noise susceptibility. Future progress in this emerging field will depend on co-designed quantum-classical systems. Declarations Human Ethics and Consent to Participate Not applicable. Competing interests I declare that the authors have no competing interests as defined by Springer, or other interests that might be perceived to influence the results and/or discussion reported in this paper. Funding No funding. Availability of data and materials All data generated or analysed during this study are included in this published article [and its supplementary information files]. Authors’ contributions M-ZG implemented and executed all deep learning code, interpreted and visualized the results, drafted the manuscript, and supervised the project. EA investigated the project and contributed to writing the manuscript. All authors reviewed and approved the final version of the manuscript. Data Availability All data generated or analysed during this study are included in this published article [and its supplementary information files]. Acknowledgements I would like to acknowledge support from the ICTP through the Associates Programs (2023–2028). References 1. ↵ Lee C , Araujo IF , Kim D , Lee J , Park S , Ryu J-Y , et al. Optimizing quantum convolutional neural network architectures for arbitrary data dimension . Frontiers in Physics . 2025 ; 13 : 1529188 . 2. ↵ Preskill J . Quantum computing in the NISQ era and beyond . Quantum . 2018 ; 2 : 79 . 3. ↵ Bharti K , Cervera-Lierta A , Kyaw TH , Haug T , Alperin-Lea S , Anand A , et al. Noisy intermediate-scale quantum algorithms . Reviews of Modern Physics . 2022 ; 94 ( 1 ): 015004 . OpenUrl CrossRef 4. ↵ Cong I , Choi S , Lukin MD . Quantum convolutional neural networks . Nature Physics . 2019 ; 15 ( 12 ): 1273 – 8 . OpenUrl 5. ↵ Goldenberg MM . Multiple sclerosis review . Pharmacy and therapeutics . 2012 ; 37 ( 3 ): 175 . OpenUrl 6. ↵ Kister A , Kister I . Overview of myelin, major myelin lipids, and myelin-associated proteins . Frontiers in chemistry . 2023 ; 10 : 1041961 . 7. ↵ Khan G , Hashim MJ . Epidemiology of Multiple Sclerosis: Global, Regional, National and Sub-National-Level Estimates and Future Projections . Journal of Epidemiology and Global Health . 2025 ; 15 ( 1 ): 21 . OpenUrl CrossRef 8. ↵ Dobson R , Giovannoni G . Multiple sclerosis–a review . European journal of neurology . 2019 ; 26 ( 1 ): 27 – 40 . OpenUrl CrossRef PubMed 9. ↵ Haki M , Al-Biati HA , Al-Tameemi ZS , Ali IS , Al-Hussaniy HA . Review of multiple sclerosis: Epidemiology, etiology, pathophysiology, and treatment . Medicine . 2024 ; 103 ( 8 ): e37297 . OpenUrl CrossRef PubMed 10. ↵ Ghadirian P , Dadgostar B , Azani R , Maisonneuve P . A case-control study of the association between socio-demographic, lifestyle and medical history factors and multiple sclerosis . Canadian journal of public health . 2001 ; 92 : 281 – 5 . OpenUrl PubMed Web of Science 11. ↵ Shoeibi A , Khodatars M , Jafari M , Moridian P , Rezaei M , Alizadehsani R , et al. Applications of deep learning techniques for automated multiple sclerosis detection using magnetic resonance imaging: A review . Computers in Biology and Medicine . 2021 ; 136 : 104697 . 12. ↵ Høgestøl EA , Kaufmann T , Nygaard GO , Beyer MK , Sowa P , Nordvik JE , et al. Cross-sectional and longitudinal MRI brain scans reveal accelerated brain aging in multiple sclerosis . Frontiers in neurology . 2019 ; 10 : 450 . 13. Lo Sasso B , Agnello L , Bivona G , Bellia C , Ciaccio M . Cerebrospinal fluid analysis in multiple sclerosis diagnosis: an update . Medicina . 2019 ; 55 ( 6 ): 245 . OpenUrl 14. Coles A. A blood test to predict prognosis in multiple sclerosis?: Oxford University Press UK ; 2024 . p. 3969 -. 15. ↵ Teymoori-Rad M , Mozhgani SH , Zarei-Ghobadi M , Sahraian MA , Nejati A , Amiri MM , et al. Integrational analysis of miRNAs data sets as a plausible missing linker between Epstein-Barr virus and vitamin D in relapsing remitting MS patients . Gene . 2019 ; 689 : 1 – 10 . OpenUrl PubMed 16. ↵ Ge Y . Multiple sclerosis: the role of MR imaging . American Journal of Neuroradiology . 2006 ; 27 ( 6 ): 1165 – 76 . OpenUrl PubMed Web of Science 17. Shiee N , Bazin P-L , Ozturk A , Reich DS , Calabresi PA , Pham DL . A topology-preserving approach to the segmentation of brain images with multiple sclerosis lesions . NeuroImage . 2010 ; 49 ( 2 ): 1524 – 35 . OpenUrl CrossRef PubMed Web of Science 18. Cabezas M , Oliver A , Lladó X , Freixenet J , Cuadra MB . A review of atlas-based segmentation for magnetic resonance brain images . Computer methods and programs in biomedicine . 2011 ; 104 ( 3 ): e158 – 77 . OpenUrl CrossRef PubMed 19. ↵ Tiu VE , Enache I , Panea CA , Tiu C , Popescu BO . Predictive MRI Biomarkers in MS—A Critical Review . Medicina [Internet ]. 2022 ; 58 ( 3 ). 20. ↵ Wang J , Lima D . Multiple sclerosis detection via 6-layer stochastic pooling convolutional neural network and multiple-way data augmentation . STEMedicine . 2021 ; 2 ( 8 ): e101 -e. OpenUrl 21. ↵ Alijamaat A , NikravanShalmani AR , Bayat P . Diagnosis of multiple sclerosis disease in brain MRI images using convolutional neural networks based on wavelet pooling . Journal of AI and Data Mining . 2021 ; 9 ( 2 ): 161 – 8 . OpenUrl 22. ↵ Coll L , Pareto D , Carbonell-Mirabent P , Cobo-Calvo Á , Arrambide G , Vidal-Jordana Á , et al. Deciphering multiple sclerosis disability with deep learning attention maps on clinical MRI . NeuroImage Clinical . 2023 ; 38 : 103376 . 23. ↵ Yoo Y , Tang LYW , Brosch T , Li DKB , Kolind S , Vavasour I , et al. Deep learning of joint myelin and T1w MRI features in normal-appearing brain tissue to distinguish between multiple sclerosis patients and healthy controls . NeuroImage: Clinical . 2018 ; 17 : 169 – 78 . OpenUrl PubMed 24. ↵ Khattap MG , Sallah M , Dahou A , Elaziz MA , Elgarayhi A , Aseeri AO , et al. Advancing multiple sclerosis diagnosis through an innovative hybrid AI framework incorporating Multi-view ResNet and quantum RIME-inspired metaheuristics . Ain Shams Engineering Journal . 2025 ; 16 ( 2 ): 103241 . OpenUrl 25. ↵ Mayfield J , Naqa IE . Evaluation of VQC-LSTM for disability forecasting in multiple sclerosis using sequential multisequence MRI . Quantum Machine Intelligence . 2024 ; 6 ( 2 ): 41 . OpenUrl 26. ↵ Nielsen MA , Chuang IL . Quantum Computation and Quantum Information: 10th Anniversary Edition . Cambridge : Cambridge University Press ; 2010 . 27. ↵ Hughes C , Isaacson J , Perry A , Sun RF , Turner J. Quantum Gates. In: Hughes C, Isaacson J, Perry A, Sun RF, Turner J, editors. Quantum Computing for the Quantum Curious. Cham: Springer International Publishing ; 2021 . p. 49 – 57 . 28. ↵ Shafique MA , Munir A , Latif I. Quantum Computing: Circuits, Algorithms, and Applications . IEEE Access . 2024 ; 12 : 22296 – 314 . OpenUrl 29. ↵ Schuld M , Sweke R , Meyer JJ . Effect of data encoding on the expressive power of variational quantum-machine-learning models . Physical Review A . 2021 ; 103 ( 3 ): 032430 . OpenUrl 30. ↵ Hur T , Kim L , Park DK . Quantum convolutional neural network for classical data classification . Quantum Machine Intelligence . 2022 ; 4 ( 1 ): 3 . OpenUrl 31. ↵ Abbas A , Sutter D , Zoufal C , Lucchi A , Figalli A , Woerner S . The power of quantum neural networks . Nature Computational Science . 2021 ; 1 ( 6 ): 403 – 9 . OpenUrl PubMed 32. ↵ Benedetti M , Lloyd E , Sack S , Fiorentini M . Parameterized quantum circuits as machine learning models . Quantum Science and Technology . 2019 ; 4 ( 4 ): 043001 . OpenUrl CrossRef 33. ↵ Banchi L , Pereira J , Pirandola S . Generalization in Quantum Machine Learning: A Quantum Information Standpoint . PRX Quantum . 2021 ; 2 ( 4 ): 040321 . OpenUrl 34. ↵ Schuld M , Petruccione F. Supervised Learning with Quantum Computers. 1st ed. 2018. ed. Cham: Springer International Publishing ; 2018 . 35. ↵ Rath M , Date H . Quantum data encoding: a comparative analysis of classical-to-quantum mapping techniques and their impact on machine learning accuracy . EPJ Quantum Technology . 2024 ; 11 ( 1 ): 72 . OpenUrl 36. ↵ Weigold M , Barzen J , Leymann F , Salm M . Encoding patterns for quantum algorithms . IET Quantum Communication . 2021 ; 2 ( 4 ): 141 – 52 . OpenUrl 37. ↵ Macin G , Tasci B , Tasci I , Faust O , Barua PD , Dogan S , et al. An accurate multiple sclerosis detection model based on exemplar multiple parameters local phase quantization: ExMPLPQ . Applied Sciences . 2022 ; 12 ( 10 ): 4920 . OpenUrl 38. ↵ Sadaiyandi J , Arumugam P , Sangaiah AK , Zhang CJE. Stratified sampling-based deep learning approach to increase prediction accuracy of unbalanced dataset . 2023 ;12( 21 ): 4423 . 39. ↵ Castellano G , Lella E , Longo V , Placidi G , Polsinelli M , Vessio G , editors. Combining Unsupervised and Supervised Deep Learning for Alzheimer’s Disease Detection by Fractional Anisotropy Imaging 2023 : IEEE. 40. ↵ Dua S , Kumar SS , Albagory Y , Ramalingam R , Dumka A , Singh R , et al. Developing a Speech Recognition System for Recognizing Tonal Speech Signals Using a Convolutional Neural Network . Applied Sciences [Internet ]. 2022 ; 12 ( 12 ). 41. ↵ Afsaneh E , Sharifdini A , Ghazzaghi H , Ghobadi MZ . Recent applications of machine learning and deep learning models in the prediction, diagnosis, and management of diabetes: a comprehensive review . Diabetology & Metabolic Syndrome . 2022 ; 14 ( 1 ): 196 . OpenUrl PubMed 42. ↵ Alem A , and Kumar S . End-to-End Convolutional Neural Network Feature Extraction for Remote Sensed Images Classification . Applied Artificial Intelligence . 2022 ; 36 ( 1 ): 2137650 . OpenUrl 43. ↵ Yamashita R , Nishio M , Do RKG , Togashi K . Convolutional neural networks: an overview and application in radiology . Insights into Imaging . 2018 ; 9 ( 4 ): 611 – 29 . OpenUrl PubMed 44. ↵ Dubey SR , Singh SK , Chaudhuri BB . Activation functions in deep learning: A comprehensive survey and benchmark . Neurocomputing . 2022 ; 503 : 92 – 108 . OpenUrl CrossRef 45. ↵ Zafar A , Aamir M , Mohd Nawi N , Arshad A , Riaz S , Alruban A , et al. A Comparison of Pooling Methods for Convolutional Neural Networks . Applied Sciences [Internet ]. 2022 ; 12 ( 17 ). 46. ↵ Tripathy S , Singh R , editors. Convolutional Neural Network: An Overview and Application in Image Classification. Proceedings of Third International Conference on Sustainable Computing ; 2022 2022//; Singapore: Springer Nature Singapore. 47. ↵ Huang G , Liu Z , Van Der Maaten L , Weinberger KQ , editors. Densely connected convolutional networks 2017 . 48. ↵ Chuenchit C , Bunjaroj K , Larpsongsuk S , Nuntasomboon V , editors. Classification of Six Nail Conditions Using Deep Learning 2024 : IEEE. 49. ↵ He K , Zhang X , Ren S , Sun J , editors. Deep residual learning for image recognition 2016 . 50. ↵ Ali RR , Yaacob NM , Alqaryouti MH , Sadeq AE , Doheir M , Iqtait M , et al. Learning Architecture for Brain Tumor Classification Based on Deep Convolutional Neural Network: Classic and ResNet50 . Diagnostics . 2025 ; 15 ( 5 ): 624 . OpenUrl PubMed 51. ↵ Yan H , Mubonanyikuzo V , Komolafe TE , Zhou L , Wu T , Wang N . Hybrid-RViT: Hybridizing ResNet-50 and Vision Transformer for Enhanced Alzheimer’s disease detection . PloS one . 2025 ; 20 ( 2 ): e0318998 . OpenUrl PubMed 52. ↵ Mohan A. Enhanced Multiple Dense Layer EfficientNet: Purdue University ; 2024 . 53. ↵ Tan M , Le Q , editors. Efficientnet: Rethinking model scaling for convolutional neural networks 2019 : PMLR. 54. ↵ Hu J , Shen L , Sun G , editors. Squeeze-and-Excitation Networks. 2018 IEEE/CVF Conference on Computer Vision and Pattern Recognition ; 2018 18-23 June 2018. 55. ↵ Bergholm V , Izaac J , Schuld M , Gogolin C , Ahmed S , Ajith V , et al. Pennylane: Automatic differentiation of hybrid quantum-classical computations . arXiv preprint arXiv : 181104968 . 2018 . 56. ↵ Akiba T , Sano S , Yanase T , Ohta T , Koyama M , editors. Optuna: A next-generation hyperparameter optimization framework 2019 . 57. ↵ Turisini M , Amati G , Cestari M . Leonardo: A pan-european pre-exascale supercomputer for HPC and AI applications . arXiv preprint arXiv : 230716885 . 2023 . 58. ↵ Tatli S , Macin G , Tasci I , Tasci B , Barua PD , Baygin M , et al. Transfer-transfer model with MSNet: An automated accurate multiple sclerosis and myelitis detection system . Expert Systems with Applications . 2024 ; 236 : 121314 . 59. ↵ Haggag RM , Ali EM , Khalifa ME , Taha M . Multiple sclerosis diagnosis with brain MRI retrieval: A deep learning approach . Results in Control and Optimization . 2025 ; 18 : 100533 . 60. ↵ Ekmekyapar T , Taşcı B . Exemplar MobileNetV2-Based Artificial Intelligence for Robust and Accurate Diagnosis of Multiple Sclerosis . Diagnostics [Internet ]. 2023 ; 13 ( 19 ). 61. ↵ Naeeni Davarani M , Arian Darestani A , Guillen Cañas V , Azimi H , Havadaragh SH , Hashemi H , et al. Efficient segmentation of active and inactive plaques in FLAIR-images using DeepLabV3Plus SE with efficientnetb0 backbone in multiple sclerosis . Scientific Reports . 2024 ; 14 ( 1 ): 16304 . OpenUrl PubMed 62. ↵ Ranga D , Rana A , Prajapat S , Kumar P , Kumar K , Vasilakos AV. Quantum Machine Learning: Exploring the Role of Data Encoding Techniques, Challenges, and Future Directions . Mathematics [Internet] . 2024 ; 12 ( 21 ). 63. ↵ Khan MA , Aman MN , Sikdar B . Beyond bits: A review of quantum embedding techniques for efficient information processing . IEEE access . 2024 . View the discussion thread. Back to top Previous Next Posted November 17, 2025. Download PDF Data/Code Email Thank you for your interest in spreading the word about medRxiv. NOTE: Your email address is requested solely to identify you as the sender of this article. Your Email * Your Name * Send To * Enter multiple addresses on separate lines or separate them with commas. You are going to email the following Quantum-Enhanced Transfer Learning for MS Lesion Detection in MRI: A Hybrid Classical-Quantum Framework Message Subject (Your Name) has forwarded a page to you from medRxiv Message Body (Your Name) thought you would like to see this page from the medRxiv website. Your Personal Message CAPTCHA This question is for testing whether or not you are a human visitor and to prevent automated spam submissions. Share Quantum-Enhanced Transfer Learning for MS Lesion Detection in MRI: A Hybrid Classical-Quantum Framework Mohadeseh Zarei Ghobadi , Elaheh Afsaneh medRxiv 2025.11.16.25340339; doi: https://doi.org/10.1101/2025.11.16.25340339 Share This Article: Copy Citation Tools Quantum-Enhanced Transfer Learning for MS Lesion Detection in MRI: A Hybrid Classical-Quantum Framework Mohadeseh Zarei Ghobadi , Elaheh Afsaneh medRxiv 2025.11.16.25340339; doi: https://doi.org/10.1101/2025.11.16.25340339 Citation Manager Formats BibTeX Bookends EasyBib EndNote (tagged) EndNote 8 (xml) Medlars Mendeley Papers RefWorks Tagged Ref Manager RIS Zotero Tweet Widget Facebook Like Google Plus One Subject Area Neurology Subject Areas All Articles Addiction Medicine (568) Allergy and Immunology (863) Anesthesia (300) Cardiovascular Medicine (4440) Dentistry and Oral Medicine (444) Dermatology (383) Emergency Medicine (608) Endocrinology (including Diabetes Mellitus and Metabolic Disease) (1510) Epidemiology (15229) Forensic Medicine (30) Gastroenterology (1126) Genetic and Genomic Medicine (6605) Geriatric Medicine (668) Health Economics (998) Health Informatics (4541) Health Policy (1369) Health Systems and Quality Improvement (1613) Hematology (543) HIV/AIDS (1265) Infectious Diseases (except HIV/AIDS) (15923) Intensive Care and Critical Care Medicine (1103) Medical Education (623) Medical Ethics (147) Nephrology (668) Neurology (6604) Nursing (346) Nutrition (998) Obstetrics and Gynecology (1145) Occupational and Environmental Health (957) Oncology (3334) Ophthalmology (974) Orthopedics (369) Otolaryngology (420) Pain Medicine (436) Palliative Medicine (130) Pathology (663) Pediatrics (1693) Pharmacology and Therapeutics (692) Primary Care Research (711) Psychiatry and Clinical Psychology (5448) Public and Global Health (9235) Radiology and Imaging (2199) Rehabilitation Medicine and Physical Therapy (1370) Respiratory Medicine (1196) Rheumatology (594) Sexual and Reproductive Health (712) Sports Medicine (530) Surgery (712) Toxicology (99) Transplantation (289) Urology (265) (function(){function c(){var b=a.contentDocument||a.contentWindow.document;if(b){var d=b.createElement('script');d.innerHTML="window.__CF$cv$params={r:'a0162662ce3273e8',t:'MTc3OTcyODk4OA=='};var a=document.createElement('script');a.src='/cdn-cgi/challenge-platform/scripts/jsd/main.js';document.getElementsByTagName('head')[0].appendChild(a);";b.getElementsByTagName('head')[0].appendChild(d)}}if(document.body){var a=document.createElement('iframe');a.height=1;a.width=1;a.style.position='absolute';a.style.top=0;a.style.left=0;a.style.border='none';a.style.visibility='hidden';document.body.appendChild(a);if('loading'!==document.readyState)c();else if(window.addEventListener)document.addEventListener('DOMContentLoaded',c);else{var e=document.onreadystatechange||function(){};document.onreadystatechange=function(b){e(b);'loading'!==document.readyState&&(document.onreadystatechange=e,c())}}}})();

Text is read by the "Ask this paper" AI Q&A widget below. Extraction quality varies by source — PMC NXML preserves structure cleanly, OA-HTML may include some navigation residue, and OA-PDF can have broken hyphenation. The publisher copy (via DOI) is the canonical version.

My notes (saved in your browser only)

⚙ Ask this paper AI returns verbatim quotes from the full text · source: preprint-html ⓘ

Answers must be backed by verbatim quotes from this paper's full text. Hallucinated quotes are dropped automatically; if no verbatim passage answers the question, we say so. How this works

Citation neighborhood (no data yet)

We don't have any in-corpus citations linked to this paper yet. This is a recent paper (2025) — citers typically take a year or two to land, and the OpenAlex reference graph may still be filling in.

Source provenance

europepmc: last seen: 2026-05-20T01:45:00.602351+00:00