Automated Detection of Lacunes in Brain MR Images Using SAM with Robust Prompts via Self-Distillation and Anatomy-Informed Priors

preprint OA: gold CC-BY-NC-ND-4.0
📄 Open PDF Full text JSON View at publisher
Full text 82,572 characters · extracted from preprint-html · click to expand
Automated Detection of Lacunes in Brain MR Images Using SAM with Robust Prompts via Self-Distillation and Anatomy-Informed Priors | medRxiv /* */ /* */ <!-- <!-- /*! * yepnope1.5.4 * (c) WTFPL, GPLv2 */ (function(a,b,c){function d(a){return"[object Function]"==o.call(a)}function e(a){return"string"==typeof a}function f(){}function g(a){return!a||"loaded"==a||"complete"==a||"uninitialized"==a}function h(){var a=p.shift();q=1,a?a.t?m(function(){("c"==a.t?B.injectCss:B.injectJs)(a.s,0,a.a,a.x,a.e,1)},0):(a(),h()):q=0}function i(a,c,d,e,f,i,j){function k(b){if(!o&&g(l.readyState)&&(u.r=o=1,!q&&h(),l.onload=l.onreadystatechange=null,b)){"img"!=a&&m(function(){t.removeChild(l)},50);for(var d in y[c])y[c].hasOwnProperty(d)&&y[c][d].onload()}}var j=j||B.errorTimeout,l=b.createElement(a),o=0,r=0,u={t:d,s:c,e:f,a:i,x:j};1===y[c]&&(r=1,y[c]=[]),"object"==a?l.data=c:(l.src=c,l.type=a),l.width=l.height="0",l.onerror=l.onload=l.onreadystatechange=function(){k.call(this,r)},p.splice(e,0,u),"img"!=a&&(r||2===y[c]?(t.insertBefore(l,s?null:n),m(k,j)):y[c].push(l))}function j(a,b,c,d,f){return q=0,b=b||"j",e(a)?i("c"==b?v:u,a,b,this.i++,c,d,f):(p.splice(this.i++,0,a),1==p.length&&h()),this}function k(){var a=B;return a.loader={load:j,i:0},a}var l=b.documentElement,m=a.setTimeout,n=b.getElementsByTagName("script")[0],o={}.toString,p=[],q=0,r="MozAppearance"in l.style,s=r&&!!b.createRange().compareNode,t=s?l:n.parentNode,l=a.opera&&"[object Opera]"==o.call(a.opera),l=!!b.attachEvent&&!l,u=r?"object":l?"script":"img",v=l?"script":u,w=Array.isArray||function(a){return"[object Array]"==o.call(a)},x=[],y={},z={timeout:function(a,b){return b.length&&(a.timeout=b[0]),a}},A,B;B=function(a){function b(a){var a=a.split("!"),b=x.length,c=a.pop(),d=a.length,c={url:c,origUrl:c,prefixes:a},e,f,g;for(f=0;f<d;f++)g=a[f].split("="),(e=z[g.shift()])&&(c=e(c,g));for(f=0;f<b;f++)c=x[f](c);return c}function g(a,e,f,g,h){var i=b(a),j=i.autoCallback;i.url.split(".").pop().split("?").shift(),i.bypass||(e&&(e=d(e)?e:e[a]||e[g]||e[a.split("/").pop().split("?")[0]]),i.instead?i.instead(a,e,f,g,h):(y[i.url]?i.noexec=!0:y[i.url]=1,f.load(i.url,i.forceCSS||!i.forceJS&&"css"==i.url.split(".").pop().split("?").shift()?"c":c,i.noexec,i.attrs,i.timeout),(d(e)||d(j))&&f.load(function(){k(),e&&e(i.origUrl,h,g),j&&j(i.origUrl,h,g),y[i.url]=2})))}function h(a,b){function c(a,c){if(a){if(e(a))c||(j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}),g(a,j,b,0,h);else if(Object(a)===a)for(n in m=function(){var b=0,c;for(c in a)a.hasOwnProperty(c)&&b++;return b}(),a)a.hasOwnProperty(n)&&(!c&&!--m&&(d(j)?j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}:j[n]=function(a){return function(){var b=[].slice.call(arguments);a&&a.apply(this,b),l()}}(k[n])),g(a[n],j,b,n,h))}else!c&&l()}var h=!!a.test,i=a.load||a.both,j=a.callback||f,k=j,l=a.complete||f,m,n;c(h?a.yep:a.nope,!!i),i&&c(i)}var i,j,l=this.yepnope.loader;if(e(a))g(a,0,l,0);else if(w(a))for(i=0;i (function(w,d,s,l,i){w[l]=w[l]||[];w[l].push({'gtm.start':new Date().getTime(),event:'gtm.js'});var f=d.getElementsByTagName(s)[0];var j=d.createElement(s);var dl=l!='dataLayer'?'&l='+l:'';j.src='//www.googletagmanager.com/gtm.js?id='+i+dl;j.type='text/javascript';j.async=true;f.parentNode.insertBefore(j,f);})(window,document,'script','dataLayer','GTM-P4HH5NV'); Skip to main content Home About Submit ALERTS / RSS Search for this keyword Advanced Search Automated Detection of Lacunes in Brain MR Images Using SAM with Robust Prompts via Self-Distillation and Anatomy-Informed Priors Pon Deepika , Gouri Shanker , Ramanujam Narayanan , View ORCID Profile Vaanathi Sundaresan doi: https://doi.org/10.1101/2025.07.09.25331177 Pon Deepika 1 Department of Computational and Data Sciences, Indian Institute of Science , Bengaluru, Karnataka 560012, India Find this author on Google Scholar Find this author on PubMed Search for this author on this site Gouri Shanker 1 Department of Computational and Data Sciences, Indian Institute of Science , Bengaluru, Karnataka 560012, India Find this author on Google Scholar Find this author on PubMed Search for this author on this site Ramanujam Narayanan 1 Department of Computational and Data Sciences, Indian Institute of Science , Bengaluru, Karnataka 560012, India Find this author on Google Scholar Find this author on PubMed Search for this author on this site Vaanathi Sundaresan 1 Department of Computational and Data Sciences, Indian Institute of Science , Bengaluru, Karnataka 560012, India Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Vaanathi Sundaresan For correspondence: vaanathi{at}iisc.ac.in Abstract Full Text Info/History Metrics Data/Code Preview PDF Abstract Lacunes, which are small fluid-filled cavities in the brain, are signs of cerebral small vessel disease and have been clinically associated with various neurodegenerative and cerebrovascular diseases. Hence, accurate detection of lacunes is crucial and is one of the initial steps for the precise diagnosis of these diseases. However, developing a robust and consistently reliable method for detecting lacunes is challenging because of the heterogeneity in their appearance, contrast, shape, and size. To address the above challenges, in this study, we propose a lacune detection method using the Segment Anything Model (SAM), guided by point prompts from a candidate prompt generator. The prompt generator initially detects potential lacunes with a high sensitivity using a composite loss function. The SAM model selects true lacunes by delineating their characteristics from mimics such as the sulcus and enlarged perivascular spaces, imitating the clinicians’ strategy of examining the potential lacunes along all three axes. False positives were further reduced by adaptive thresholds based on the region-wise prevalence of lacunes. We evaluated our method on two diverse, multi-centric MRI datasets, VALDO and ISLES, comprising only FLAIR sequences. Despite diverse imaging conditions and significant variations in slice thickness (0.5–6 mm), our method achieved sensitivities of 84% and 92%, with average false positive rates of 0.05 and 0.06 per slice in ISLES and VALDO datasets respectively. The proposed method outperformed the state-of-the-art methods, demonstrating its effectiveness in lacune detection and quantification. 1 Introduction Lacunes of presumed vascular origin appear as round or ovoid subcortical fluid-filled cavities, between 3 and approximately 15 mm in diameter, as defined by the STandards for ReportIng Vascular changes on nEuroimaging (STRIVE) criteria ( Wardlaw et al., 2013 ; Duering et al., 2023 ). Although lacunes are frequently observed in older adults and are often asymptomatic ( Wardlaw, 2008 ), they have been associated with stroke, dementia, cognitive decline, and gait impairments ( Jokinen et al., 2011 ; Vermeer et al., 2003 ; Chen et al., 2020 ). Accurate detection and quantification of lacunes are essential for patient risk stratification, enabling the precise diagnosis of cerebrovascular and neurodegenerative diseases and ensuring timely treatment. In FLAIR sequences, lacunes generally appear as round or ovoid hypointense regions, similar to the CSF (indicating fluid-filled cavities), surrounded by an irregular hyperintense rim ( Duering et al., 2023 ). However, this characteristic rim can also be partially or completely absent, depending on various factors, such as the extent of gliosis, the age of the lesion, and its location ( Duering et al., 2023 , 2013 ). This contributes to the significant diversity in the appearance of lacunes, as shown in Figure 1 , making visual assessment a challenging and time-consuming task for radiologists. The accurate detection of lacunes is further complicated by the presence of mimics, including anatomical structures (e.g., sulci, cerebral ventricle) and other imaging biomarkers of cerebral small vessel disease (CSVD), such as enlarged perivascular spaces (EPVS) ( Duering et al., 2023 ; Uchiyama et al., 2007a ). In particular, EPVS are fluid-filled spaces that typically follow the course of the vessel, exhibiting a signal similar to CSF, and appear round or ovoid when imaged perpendicular to the vessel’s course. This makes them indistinguishable from lacunes when located within white matter hyperintensities and exceeds 3 mm in size ( Duering et al., 2023 ). Download figure Open in new tab Figure 1: Heterogeneity in the appearance of lacunes on fluid-attenuated inversion recovery (FLAIR) sequence. The first two rows show the diversity in lacunes (indicated by green box), while the third row illustrates non-lacune mimics (indicated by red box). Given the inherent complexities in lacune detection, manual lacune labelling is highly time intensive, expensive for larger datasets, and requires a high level of expertise. Additionally, labelling may be prone to high inter-rater variability. Hence, there is a growing need for computer-aided methods to detect lacunes efficiently. While a few semi-automated and automated methods have been proposed, as detailed in Section 1.1 , existing approaches often require human intervention (in the case of semi-supervised methods), provide suboptimal performance due to false detections of mimics, or lack generalisability across multiple resolutions. To address these limitations, we propose a novel fully automated framework for effectively identifying lacunes in brain MRI scans across different image resolutions. The proposed method involves a modular approach comprising lacune candidate detection, identification of lacunes from mimics using representative prompts, and further reduction of false positives using adaptive thresholding. The key contributions of our method include: Developing a Candidate Prompt Generator (CPG), a deep learning module that employs a combination of loss functions to differentiate between tissue characteristics and generate precise lacune candidate prompts to guide the SAM detection process. Leveraging the Segment Anything Model (SAM) to identify true lacunes by analysing the candidate regions along all three anatomical planes, replicating the decision making process of clinical experts. Utilising the prior knowledge of regional lacune distribution at population-level to determine adaptive thresholds for false positive reduction, ensuring high detection accuracy. Implementing a self-distillation approach to significantly enhance lacune detection performance on a smaller dataset. Lacune identification often requires a method that functions robustly at various image resolutions. Hence, we evaluated the effectiveness of our method using two datasets consisting of MRI volumes from four different centres with slice thicknesses ranging from 0.5 to 6 mm. We also conducted ablation studies to evaluate the influence of different components of loss functions and the effect of using simulated lesions in the training data on effective candidate detection. In addition, we performed ablation studies to examine the contribution of different modules to the detection of lacunes. We also compared our results with existing state-of-the-art methods for lacune detection. 1.1 Related Work Several semi-automated and automated methods have been proposed to address the challenges associated with lacune detection. For example, Al-Masni et al . ( Al-Masni et al., 2021 ) proposed a semi-supervised method consisting of a candidate discriminator based on a 3D multiscale residual network to distinguish true lacunes from lacune mimics identified by neuroradiologists. However, manual intervention was required for candidate detection, which was challenging for a wide range of mimics. Early work on automated methods for lacune detection by Yokoyama et al . ( Yokoyama et al., 2007 ) involved a comprehensive method that combined multiphase binarisation, morphological operations, and feature-based classification. Given the challenges of the accurate detection of lacunes, researchers have often adopted multi-stage approaches consisting of potential candidate identification, followed by systematic refinement. In this context, Uchiyama et al . investigated various techniques for false positive reduction by employing rule-based algorithms ( Uchiyama et al., 2007a ), support vector machines ( Uchiyama et al., 2012 ), neural network classifiers ( Uchiyama et al., 2007b , 2008 ), and eigen-template matching ( Uchiyama et al., 2015 ). Furthermore, using conventional methods, Wang et al . ( Wang et al., 2012 ) introduced a multistage framework for segmenting white matter hyperintensities, cortical infarcts, and lacunar infarcts, relying on a rule-based approach driven by absolute voxel intensities. However, these conventional methods face significant challenges in learning robust representations of lacunes, particularly because lacunes are small and their appearance varies with slice thickness, imaging protocols, and the age of the lesion, as evidenced by the high false positive rates of these studies (e.g., 0.47 false positives per slice reported in With advancements in computational capabilities, various deep learning-based methods have recently been explored for detecting lacunes, demonstrating promising performance compared to conventional techniques ( Sudre et al., 2019 ; Al-Masni et al., 2021 ; Ghafoorian et al., 2017 ). In particular, Ghafoorian et al . ( Ghafoorian et al., 2017 ) developed a two-stage deep learning approach to detect potential lacunes, where the initial extraction of candidates was performed using a patch-based 2D CNN segmentation model. To address false positives from the candidate extractor and differentiate lacunes from mimics, several studies, including Ghafoorian et al. ( Ghafoorian et al., 2017 ) have investigated multi-scale 3D patch analysis ( Ghafoorian et al., 2017 ; Al-Masni et al., 2021 ). However, their evaluation was limited to uniform resolution volumes, leaving the effectiveness of the method on multi-resolution data unexplored. Other deep learning-based frameworks explored for lacune detection included U-Net ( Duan et al., 2020 ) and adaptations of the RCNN network for 3D data ( Sudre et al., 2019 ). Despite these advancements, the accurate detection of lacunes remains a significant challenge owing to their diverse appearance, size, and presence of mimics. These factors frequently contribute to high false positive rates, with the lowest reported rate being 0.13 per slice ( Ghafoorian et al., 2017 ). The VAscular Lesions DetectiOn and Segmentation Challenge (VALDO 2021) ( Sudre et al., 2024 ), held in conjunction with MICCAI 2021, the largest platform organised so far for accurate lacune detection, invited research groups to develop automated solutions for detecting and segmenting subtle signs of CSVD, including lacunes. Various methods have been developed for VALDO 2021, including versions of UNet, MaskRCNN, and MaskRetinanet, with different loss functions, such as Dice, blob, binary cross-entropy, focal, or mean absolute error. The top-ranking team employed a 3D UNet model with Dice loss based on the nnUNet framework. Their method achieved a median F1 score of 28.57, indicating the scope for improvement with the need for more advanced deep learning techniques. A major challenge in the development of supervised automated methods for lacune detection is the time-consuming process of annotating small lesions. This is further complicated by the limited availability of training data in various datasets, which affects model generalisation. Recent advances in foundation models, such as the Segment Anything Model (SAM) ( Kirillov et al., 2023 ) and its variants, have been explored to address challenges related to limited data and model generalisability by harnessing their zero-shot segmentation capabilities. SAM has shown promising performance in segmenting various lesions and organs using multiple imaging modalities, including CT, MRI, ultrasound, and PET, using appropriate prompts without requiring additional training ( Mazurowski et al., 2023 ). However, the utility of SAM in detecting smaller lesions such as lacunes remains largely unexplored. Similarly, techniques, such as adversarial learning and feature alignment strategies, have been widely explored ( Singhal et al., 2023 ) to overcome training data scarcity and shifts across datasets. Among these, knowledge distillation has provided improved performance for various tasks, including multi-organ segmentation ( Kim et al., 2024 ), vertebrae detection ( Serrador et al., 2024 ), brain tumour analysis ( Choi et al., 2023 ), white matter hyperintensity segmentation ( Orbes-Arteainst et al., 2019 ), microbleed detection ( Sundaresan et al., 2023 ), and retinal disease classification ( Paluru et al., 2023 ), illustrating its effectiveness in improving model generalisability, even with limited target training data. Hence, given the challenges in lacune detection, as highlighted by prior works ( Al-Masni et al., 2021 ; Ghafoorian et al., 2017 ), there is a need for specialised modular frameworks using foundation models such as SAM with accurate prompts. Additionally, it would be desirable to address challenges such as wide appearance heterogeneity, multi-centre variability, and limited data availability, using techniques such as knowledge distillation, for accurate and generalisable detection of lacunes. 2 Materials and methods In the proposed lacune detection workflow, we initially preprocessed the MRI volumes ( Section 2.1 ) and identified potential lacune candidates using the candidate prompt generator (CPG) ( Section 2.2 ). The aim of the CPG module was to provide precise prompts for SAM. We later performed a systematic detection of true lacunes among the candidates from the CPG module by analysing these prompts across all three anatomical planes using SAM ( Section 2.3 ). Finally, we further improved the lacune-detection accuracy using an adaptive region-aware thresholding (ART) module ( Section 2.4 ). Figure 2 illustrates the workflow of the proposed lacunar detection method. Download figure Open in new tab Figure 2: Workflow of the proposed lacune detection method. The initial lacune candidates that are detected by Candidate Prompt Generator (CPG) are used to extract point prompts for Segment Anything Model (SAM) model for lacune detection from mimics. The Adaptive Region-aware thresholding (ART) module is applied on the SAM output to further reduce the false detections. The CPG module is trained using real-world lacunes and synthetic lacune lesions generated by the Synthetic Lesion Simulator (SLS) module (used only for CPG training) as indicated by the dotted box. 2.1 Data preprocessing We skull-stripped the FLAIR volumes using FSL BET ( Smith, 2002 ), and subsequently corrected them for bias field inhomogeneities using FSL FAST ( Zhang et al., 2001 ). Finally, we cropped the images closer to the edges of the brain to create a tight field of view. 2.2 Candidate prompt generator As a first step towards accurate detection of lacunes, the aim of the CPG module was to identify potential lacune candidates on brain MRI volumes with high sensitivity, and later remove the false positives in the subsequent steps. In the CPG module, we developed a deep learning model that focused on segmenting lacunes from 2D axial slices. We chose to use a 2D model because of the high interslice variation of lacunes across various datasets. Axial slices were used for the 2D model because the spatial resolution was generally optimal in axial slices across the datasets for detecting lacunes. All 2D axial slices were z-score normalised for the CPG. We selected the U 2 Net ( Qin et al., 2020 ) architecture in the CPG module to segment the initial lacune candidates. U 2 Net uses Residual U-Blocks (described in ( Qin et al., 2020 )) to efficiently capture features at multiple scales. This design enabled the model to learn more complex patterns of lacunes, as shown in Figure 1 . U 2 Net provided better sensitivity for the detection of lacune candidates than the other architectures, as described in Section 4.1 . We utilised a composite loss function, that integrated Tversky ( Salehi et al., 2017 ), focal ( Ross and Dollár, 2017 ), and pixel-wise contrastive losses ( Khosla et al., 2020 ) for precise pixel-wise learning of lacune characteristics. First, to maximise recall by detecting as many true lacunes as possible, we used the Tversky loss ( L tver ) given in Equation 1 with a high penalty for false negatives. where p ni and p li are the predicted probabilities of pixel i being a non-lacune and lacune, respectively. The indicator variables g ni and g li are 1 for non-lacune and lacune pixels, respectively, and 0 otherwise. Second, to overcome the class imbalance between lacunes and the background in lacune candidate segmentation, we added focal loss ( L foc ) ( Eqn. 2 ) to help the model focus more on challenging borderline pixels, further enhancing performance. where p t is the predicted probability of the target class, α is the weighting factor for class imbalance, and γ is the focusing parameter that adjusts the rate at which easy samples are downweighted. Finally, to further improve the model’s ability to better discriminate between lacunes and mimics, we incorporated a pixel-wise supervised contrastive loss ( L sup ). The contrastive learning approach aims to bring the pixel embeddings of the same semantic class (lacunes) closer together while pushing apart the embeddings of different classes (lacunes vs. mimics/background). Therefore, we added a projection head after the penultimate layer of the U 2 Net decoder and applied pixel-wise supervised contrastive loss ( Khosla et al., 2020 ) ( Eqn. 3 ) to the embeddings produced by this projection head. where is the projected latent vector corresponding to the pixel x ℓ , τ ∈ ℛ + is a scalar temperature parameter, I represents indices of all sampled pixels in the batch, the index i is the current anchor, A ( i ) represents all the indices except i , out of which P ( i ) represents the indices of positive pixels distinct from i , the · denotes the inner (dot) product and | P ( i )| represents the cardinality of P ( i ). During training, for the first N epochs, negative pixels were randomly sampled from non-lacune pixels within the brain mask. After N epochs, when the model sufficiently learned the patterns, negative pixels were sampled from the false positives of the previous epoch. This approach motivated the model to focus on reducing false positives while improving the recall value. The total loss function for training the CPG module is given by, 2.2.1 Synthetic lesion simulation for robust training The diverse appearance-based characteristics of lacunes, coupled with variations in scan parameters across multi-centre datasets (slice thicknesses ranging from 0.68 to 6 mm) and limited data, affected the sensitivity of the CPG module. To overcome this challenge, in addition to the composite loss function, we augmented our training data with simulated lacunes produced by a Synthetic Lesion Simulator (SLS). The pipeline used to simulate lacune-like lesions using SLS is shown in Figure 3 . In SLS, synthetic lesions were first generated on lacune-free slices of the dataset using the method proposed in our previous work, MedLesSynth-LD ( Narayanan and Sundaresan, 2024 ). In line with emulating the shape and contrast variations of various lesions in MedLesSynth-LD, we created artificial lesions that emulated the structural, shape, and contrast characteristics of the lacunes in the simulation process. Synthetic lacunes were generated as localised structural perturbations of healthy brain tissue and constrained within randomly generated shape priors (formed using a set of ellipsoids). To preserve the inherent noise characteristics in the perturbed lesion textures in MRI, we used the Rician distribution (the underlying noise model for MRI ( Narayanan and Sundaresan, 2024 )) for the perturbation of healthy tissue. Next, to create a shape prior, we used a composite of ellipsoids to capture the shapes of both gliosis and cavitation in the lacunes. Finally, to match the sharp intensity difference observed between hyperintense gliosis and hypointense cavitation, we added perturbations within the two structures by varying the contrast parameters. These created lesions provided good priors, as they mimicked the structure, noise, and intensities of actual lesions. The computational overhead attached to MedLesSynth-LD is negligible because it does not require the training of deep learning models. To render the synthetic lesion much closer to the real lacunes (owing to their small size and variability between datasets), we translated the simulated lesions using cycleGAN ( Zhu et al., 2017 ). For training the cycleGAN, patches of size 32 × 32 mm centred on the 2D real lacune instances were extracted to create the training data. Given that the typical maximum diameter of lacune is 15 mm, the selected patch size ensured that the patch encompassed the lacune with a sufficient amount of background tissue. Extracting localised patches allowed for the inclusion of multiple slices from the same lacune instance, enabling the model to learn inter-slice variations more effectively. The real-world patches with an equal number of simulated lacune patches were used to train the cycleGAN. Once trained, cycleGAN was used to translate the simulated lesion patches, which were then blended back into the original images using Poisson blending within a circular binary mask with a radius of 8 mm (empirically determined using trial and error), as shown in Figure 3 . Download figure Open in new tab Figure 3: Lacune simulation pipeline using Synthetic Lesion Simulator (SLS). Top: Synthetic lacunes are generated using MedLesSynth-LD ( Narayanan and Sundaresan, 2024 ), where healthy tissue is perturbed using a Rician noise model, within synthesised gliosis and cavity shape masks and applied on images at varying contrasts. Bottom: The synthesised lacunes are translated using cycleGAN and blended using Poisson blending to emulate the real lacune characteristics specific to the dataset. 2.3 SAM based Detection As we aimed for high sensitivity in the CPG module, this typically resulted in false positives, mainly from parts of the sulcus and/or mimics such as EPVS, which were indistinguishable from the lacunes on the axial slices. Thus, the prompts generated from the CPG module were provided to the SAM module to reject false positives from slices at the volume level. We used the SAM model with the VIT-H encoder ( Kirillov et al., 2023 ) on the entire 3D volume guided by point prompts from the CPG. This step essentially replicated the clinician’s approach of examining all three axes to distinguish lacune-like false detections from true lacunes. Before applying SAM, we rescaled the intensities of the input volume using square-root transformation (for contrast enhancement) and performed min-max normalisation to facilitate better segmentation with SAM. The predicted 2D probability maps from the CPG module were then stacked together to obtain a 3D volume and thresholded at 0.5, to obtain 3D candidate instances. A threshold value of 0.5 was chosen experimentally based on the Free-Response Receiver Operating Characteristic (FROC) curve (shown in Figure 6 ). For each 3D candidate, its centroid was considered as the point prompt for SAM, and the axial, sagittal, and coronal slices (traversing through the centroid) were fed into SAM with the corresponding 2D coordinates as point prompts. Based on the segmentation output of the SAM, we detected true lacunes from the mimics, as explained below. Figure 4 shows a few examples of CPG-guided SAM-based detection of lacunes and the rejection of false positives. Download figure Open in new tab Figure 4: Lacune detection using SAM with point prompts from the Candidate Prompt Generator(CPG) module. Left to right: (a) candidates predicted by the CPG module (indicated by yellow boxes) shown on the axial slice, (also shown magnified at the top-right corner); the blue dotted line indicates the sagittal/coronal slice passing through the centroid, (b) the corresponding sagittal/coronal slice shown, with the magnified region of interest in the top-right corner, and (c) SAM’s predicted segmentation of the magnified region, with green and red boxes indicating the candidates predicted as lacunes and false-positives respectively. Removal of sulci: We removed the candidates that had SAM’s prediction probability ≥0.75 along any of the three axes, and intersected with the brain boundary, as sulci. Removal of EPVS and other elongated structures: EPVS might resemble lacunes in the axial plane but are more elongated in other planes. Among the three planes, if a lesion predicted by SAM had a major axis to minor axis ratio greater than 5 over any of the planes, then the instance was removed as a false positive. Despite the revised STRIVE criteria ( Duering et al., 2023 ) allowing lacunes smaller than 3 mm, we eliminated SAM predictions with a maximum axial diameter of less than 3 mm to avoid misclassification of EPVS as lacunes. This is because the EPVS diameter typically lies within 3 mm, whereas we observed very few lacunes smaller than 3 mm. Removal of false positives due to low tissue contrast: SAM predictions with the confidence score > 0.75 and predicted pixel area greater than 350 mm 2 along any of the three axes were treated as false positives (due to segmentation of background tissue regions with low contrast) and eliminated. We determined the above threshold values of the confidence scores used in SAM empirically based on the trial-and-error method. Furthermore, to account for the variation in slice thickness in the dataset, we adapted the following approach: for the slice thickness ≤ 4 mm, all three planes were inspected using SAM; for > 4 mm, only the axial plane was examined using SAM, as a higher slice thickness led to less reliable structural integrity and continuity across slices. Note that this SAM-based methodology replicates clinical decision-making in distinguishing lacunes from mimics, leveraging both the 2D deep learning model’s initial prompts and SAM’s detailed segmentations in multiple planes to improve the overall lacune detection accuracy. 2.4 Adaptive region-aware thresholding Lacunes have been shown to occur predominantly in specific regions of the brain, particularly in the white matter and subcortical structures ( Duering et al., 2013 ; Benjamin et al., 2014 ). Hence, as the final step of our method, we utilised this location-based prior and used adaptive region-aware thresholding (ART) to further effectively reduce false positives. In this step, instead of applying a global threshold on candidates retained by SAM, we applied a region-wise threshold determined based on the prevalence of lacunes in different regions of the brain. Candidates were classified as false positives if the prediction softmax probabilities at the centroid of the candidates were below the ART thresholds for that region (shown in Figure 5 ). This adaptive threshold provided a more robust segmentation compared to applying a global threshold by providing a better trade-off in various regions. Additionally, it helped remove false positives that could not be filtered based on their attributes, as described in Section 2.3 . Download figure Open in new tab Figure 5: Parcellation of regions based on MARS scale for adaptive region-based thresholding. Top to bottom: Parcellation of regions according to the MARS atlas shown on the left with the corresponding threshold maps on the right for three different slices of the brain. The table shown below stratifies the brain regions based on the prevalence of lacunes for ART. Download figure Open in new tab Figure 6: Ablation study results with different loss function components on the ISLES dataset. FROC curves illustrating CPG module performance with different components of loss functions, L foc , L foc + L tver and L foc + L tver + L sup , shown in blue, red and green curves respectively for the ISLES Dataset (the operating points that provide the best performance are indicated by dotted lines). To analyse the region-wise distribution of lacunes in the dataset, we obtained segmentation of anatomical structures in the brain based on the microbleed anatomical rating scale (MARS) map ( Gregoire et al., 2009 ). We chose the MARS map because it provided good granularity of the structural parcellation required for lacunes. The generation of MARS maps from various structural atlases in the MNI space was performed as specified by Sundaresan et al . ( Sundaresan et al., 2025 ). Figure 5 shows the MARS atlas for three axial slices across the brain for a sample subject in MNI space. We registered the MARS atlas from the MNI space to the target subject space using the FSL FLIRT ( Jenkinson et al., 2012 ). Once the anatomical regions were obtained in the subject space, we estimated the region-wise prevalence of lacunes in the training data by determining the lacune count in different regions. Finally, region-wise thresholds were assigned in alignment with the region-wise prevalence of lacunes (stratified as high/medium/low prevalence, as shown in Figure 5 ). The threshold values were 0.5, 0.55 and 0.65 for high, medium, and low values, respectively (note that these threshold values provided the best performance in the regions). The regions with a high prevalence of lacunes (specified ‘high’ in Figure 5 ) had lower threshold values compared to the regions with fewer lacunes (indicated as ‘low’ in Figure 5 ). Specifically, in the basal ganglia region where EPVS are usually more common ( Wardlaw et al., 2013 ), a higher threshold (0.55) facilitated the removal of EPVS from predicted lacunes. Given that EPVS could closely mimic the appearance of lacunes, setting a higher threshold helped us retain more confident lacune predictions, while reducing low-confidence false positives representing EPVS. 2.5 Implementation Details We implemented the proposed method using Python 3.11.7 and PyTorch 2.2.1. We trained the CPG module on a Linux workstation with an i9-10980XE CPU, 128 GB RAM, and an NVIDIA RTX A6000 GPU card with 48 GB memory. We used data augmentation techniques, including random rotation ( θ ∈ [−10, 10] degrees) and horizontal and vertical flips. The training dataset for the CPG module contained 2,728 slices, including all positive slices and a subset of sampled negative slices from the ISLES dataset, along with 12,000 synthetic lacune slices generated using the SLS module ( Section 2.2.1 ). The CPG module was trained using 14,728 2D slices with a 90%/10% training/validation split, requiring ≈6 min per epoch. We used the Adam optimiser with a learning rate of 1 × 10 −4 and batch size of 8 for training. Regarding the loss functions in the CPG module, for L foc , we chose α = 0.25 and γ = 2 (as reported in ( Ross and Dollár, 2017 )). For L tver , we chose β = 0.97 and α = 0.03 to enhance the sensitivity of the model to the true lacune features. In our pixel-wise contrastive learning approach, for the initial N = 50 epochs, we sampled negative pixels from the background, whereas after 50 epochs, we sampled negative pixels from the previous epoch’s false positives. In the SLS module, we adopted the recommended loss functions and parameters for cycleGAN as mentioned in ( Zhu et al., 2017 ). Unless specified, the above values were determined empirically using the trial-and-error method. 2.6 Dataset details We used the following datasets for our experiments. As FLAIR is the only sequence common to both datasets, it was used exclusively in this study. Ischemic Stroke Lesion Segmentation (ISLES) 2022 challenge training dataset ( Hernandez Petzsche et al., 2022 ) The primary dataset used in our study was the ISLES dataset, comprising of 250 MRI volumes, including FLAIR, DWI sequences, and ADC maps, collected from individuals aged 18 and older with diagnosed or suspected stroke. Data were collected from two different centres using 3T Philips, 3T Siemens, and 1.5T Siemens MAGNETOM MRI scanners. The slice thickness varied between 0.68 mm and 9.60 mm, as the dataset was originally curated to detect larger lesions such as strokes. However, for lacune detection, we excluded volumes with slice thicknesses greater than 6 mm and those with heavy artefacts, as these are not suitable for detecting smaller lesions such as lacunes. Lacune annotations were performed with the assistance of an expert radiologist using the ITK snap ( Yushkevich et al., 2006 ) (a free, open-source software application developed at the University of North Carolina). This resulted in a final set of 221 volumes consisting of 1,021 lacunes, of which 181 volumes were used for training, validation and 40 volumes for testing. VAscular Lesions Detection and segmentatiOn challenge 2021 (VALDO) dataset (Task-3) This dataset, available as VALDO task-3 training data, comprised MRI data from 40 patients from two different cohorts: 6 from the Southall and Brent Revisited (SABRE) ( Tillin et al., 2012 ; Jones et al., 2020 ) and 34 from the Rotterdam Scan Study (RSS) ( Ikram et al., 2015 ). The RSS cohort included participants aged ≥ 45 years who underwent follow-up every 3-4 years to investigate chronic illness. In SABRE, data were collected from individuals aged 36–92 years (mean age: 72 years) to monitor metabolic and cardiovascular diseases. The imaging protocol included T1-weighted, T2-weighted, and FLAIR sequences acquired using either a 3T Philips (SABRE) or 1.5T GE (RSS) scanner. Thus, the image resolutions varied between cohorts: SABRE had a resolution of 1.09 × 1.09 × 1.09, while RSS had 0.49 × 0.49 × 0.8 mm for all sequences. Manual annotations of lacunes by two independent raters were available for each volume of this dataset. The dataset consisted of 83 lacunes. We used 20 volumes for training and validation and 20 volumes for testing. 3 Experiments 3.1 Evaluation of various model architectures for candidate detection In the CPG module, for detecting lacune candidates to generate prompts for SAM, we evaluated different model architectures, including U 2 Net ( Qin et al., 2020 ), UNet++ ( Zhou et al., 2018 ), Re-sUNet++ ( Jha et al., 2019 ), Attention UNet ( Oktay, 2018 ), and Swin UNETR ( Hatamizadeh et al., 2021 ). These architectures were trained using the methodology outlined in Section 2.2 with the parameters specified in Section 2.5 on the ISLES data, and evaluated using the metrics specified in Section 3.7 . 3.2 Ablation Study I: Effect of components of the loss function on the CPG performance We performed an ablation study to investigate the effect of adding different loss components ( Eqn. 4 ) on the candidate detection performance of the CPG module. For this purpose, we compared the performance of the CPG module by incrementally adding the components of the loss function as follows: (1) L foc , (2) L foc + L tver , and (3) L foc + L tver + L sup . We evaluated performance on the ISLES dataset using the metrics described in Section 3.7 . 3.3 Ablation study II: Effect of different modules on the proposed lacune detection method We also conducted an ablation study to examine the impact of various modules in the lacune detection workflow on the ISLES dataset. For this, we incrementally integrated the modules as follows: (1) candidate detection using CPG, (2) detection of lacune candidates by SAM using prompts generated by CPG (CPG+SAM) by applying a global threshold of 0.5, and (3) applying the adaptive thresholds using ART on SAM output (CPG+SAM+ART). We evaluated the performance enhancement with successive integration of modules using the metrics specified in Section 3.7 . 3.4 Effect of using simulated lesions from SLS on the CPG performance The ISLES dataset was multi-centric data (with two different centres) with different slice thicknesses and lacunes with varying appearances and features. Hence, to address the challenge posed by the limited training data in learning the diverse characteristics of lacunes, we used simulated lesions generated by the SLS module (described in Section 2.2.1 ) to expand the training set. We evaluated the effect of augmenting the training data with simulated lesions on the performance of the CPG module for the ISLES dataset using the metrics specified in Section 3.7 . Additionally, we plotted t-distributed stochastic neighbour embedding (t-SNE) plots and determined the Frechet inception distance (FID) scores ( Heusel et al., 2017 ) to demonstrate the similarity between the simulated and real lacunes. Note that the lower the FIR scores between the simulated and real lacunes, the better is their similarity. 3.5 Self-Distillation for robust lacune candidate detection in a low-data regime The second dataset in this study, the VALDO dataset, contained only a few training samples and exhibited a domain shift, as the data were obtained from two different cohorts. To achieve good performance in this low-data case for the CPG module, it was crucial for the model to retain the knowledge about lacune characteristics learned from a larger dataset, such as ISLES, while adapting to the lesion characteristics within the VALDO dataset. Hence, we implemented self-distillation as a strategy to adapt our method for generalisation across datasets. Self-distillation has been proven to be effective in prior studies ( Paluru et al., 2023 ; Kim et al., 2020 ; Kuang et al., 2024 ), where the model uses its own predictions from a previous epoch as additional training input for subsequent epochs. In this approach, we pretrained the model on the ISLES dataset for the initial 100 epochs. Then, each subsequent epoch was trained as follows: In the first step, the model was trained on the ISLES dataset, with its current state acting as a teacher for the next step within that epoch. In the next step, the same model was trained on the smaller VALDO dataset using the lacune ground truth as hard labels and the teacher’s predictions as soft labels, with a distillation loss described in Eqn. 5 with α = 0.65. We experimented with various values of α and observed that α = 0.65 was optimal. Furthermore, because the predictions for VALDO were made using the self-distilled model, which produces more confident predictions, the optimal ART thresholds for the VALDO dataset were incremented by a factor of 0.1. where ℒ hard represents the Focal loss (ℒ foc , described in eqn. 2 ), and ℒ soft represents the KL divergence between the student and teacher logits. We evaluated the performance of the CPG module on the VALDO dataset using the metrics specified in Section 3.7 with different training strategies, including combinations of both datasets and self-distillation. 3.6 Comparison with existing methods Finally, we compared our performance with that of existing state-of-the-art methods for lacune detection. We included deep learning-based semi-automated and fully automated methods for lacune detection proposed since 2017 in our comparison. 3.7 Performance evaluation metrics and statistical evaluation We used the following evaluation metrics consistent with existing methods ( Ghafoorian et al., 2017 ; Al-Masni et al., 2021 ; Sudre et al., 2024 ): (1) cluster-wise sensitivity , which is the ratio of the number of true positive lacune lesions detected by the model to the total number of true lacune lesions across the entire test set, (2) cluster-wise F1-measure , which is the harmonic mean of cluster-wise precision and cluster-wise sensitivity, and (3) Absolute Element Difference (AED) , the absolute difference between the number of true lacune lesions and the number of predicted lacune lesions. Because the VALDO dataset includes annotations from two raters, we determined the F1-score weighted by inter-rater agreement and average AED, adhering to the metrics used in the VALDO 2021 challenge ( Sudre et al., 2024 ). For statistical evaluations, we used a Wilcoxon signed rank test to assess the statistical significance of performance differences (p < 0.05 for significance; p < 0.001 for stronger significance) in the ablation studies. 4 Results 4.1 Evaluation of different model architectures for Lacune Detection The results of the comparison of the various model architectures on the ISLES dataset are presented in Table 1 . Among the architectures evaluated, Attention UNet achieved the best F1-score and AED. However, we selected U 2 Net for the CPG module because the primary focus of the module was to maximise the sensitivity for the detection of true lacunes. At a threshold of 0.5, U 2 Net achieved the highest sensitivity of 85.19%, thus making it the optimal choice. View this table: View inline View popup Download powerpoint Table 1: Comparison of performance of different deep learning models for CPG module for the ISLES Dataset, with number of parameters and FLOPS (in Giga(G) FLOPS). (↑)/(↓) indicates that higher/lower values are better. The best sensitivity value is reported in bold. The median values (with the interquartile range in brackets) are reported for F1 value and AED. 4.2 Ablation Study I: Effect of components of the loss function on the CPG performance Figure 6 shows the FROC curves indicating the effect of the addition of different loss components on the CPG module for the ISLES dataset. Although focal loss aids in learning more difficult examples, the maximum sensitivity achieved was 84%. With the addition of the Tversky loss with a higher weight of 0.97 for false negatives, the model captures more true lacunes, providing a sensitivity of around 90%, despite greater heterogeneity in the appearance of the lesion. However, the average number of FPs was 32/volume, which would incur higher computational costs in the subsequent stages. With the inclusion of the contrastive learning component in the loss function, the model learned tissue characteristics more effectively, providing far fewer FPs of 15/volume and 6.9/volume for sensitivities of 91% and 85.19%, respectively (as highlighted in Figure 6 ). For subsequent analysis, we selected a high-precision operating point with an 85.19% sensitivity. 4.3 Ablation study II: Effect of different modules on the proposed lacune detection method The ablation study results are presented in Table 2 and the visual results are shown in Figure 7 . As shown in Table 2 , the integration of each module led to an improvement in the F1-scores for both the ISLES and VALDO datasets. The improvements were statistically significant in almost all cases (except for the addition of ART to the VALDO dataset). While the CPG module demonstrated strong performance in capturing true lacunes, the SAM module proved to be very effective in reducing false positives originating from structures such as the sulci, cerebral ventricles, EPVS, and other regions, by analysing candidates along the three axes. In this process, the SAM module retained all the true lacunes and markedly improved the metrics across both datasets. Although the SAM module offered substantial improvements in metrics across both datasets, its ability was constrained by the heterogeneity in the appearance of lacunes. Integration of the ART module helped overcome this constraint by using adaptive thresholds based on knowledge of the region-wise distribution of lacunes. This further improved detection accuracy by eliminating false positives that closely resembled lacunes on all axes, as shown in Figure 7 . Consequently, the proposed method achieved an overall sensitivity of 84.26% for the ISLES dataset and 92.31% for the VALDO dataset. View this table: View inline View popup Download powerpoint Table 2: Ablation Study: Performance metric with the addition of different modules. CPG, SAM, ART represents Candidate prompt Generator, SAM based lacune detection and Adaptive Region-aware thresholding respectively. (↑)/(↓) indicates that higher/lower values are better. The median values (with the interquartile range in brackets) are reported for F1 value and AED. */** indicates p < 0.05/p < 0.001 showing significant difference between successive rows for F1 value and AED. Download figure Open in new tab Figure 7: Sample results of the proposed method from the ISLES and VALDO datasets. Top to bottom: a) axial slice with ground truth (shown in yellow boxes), b) prompts generated by the CPG module, c) predictions from SAM module to reduce false positives and d) detected final lacunes from Adaptive Region-aware Thresholding (ART). In (b)-(d), the yellow and red bounding boxes indicate the true lacunes and false positives respectively. 4.4 Effect of using simulated lesions from SLS on the CPG performance The t-SNE plot in Figure 8 (top panel) illustrates the similarity between the real and simulated lacunes by showing good overlap between them. Hence, the lacunes generated by our SLS module closely resembled the characteristics of real lacunes while effectively capturing the heterogeneity observed in the actual dataset. Notably, despite the small size of the lacunes and wide variability in their appearance, the lacunes simulated using MedLesSynth and those further refined through cycleGAN achieved promising FID scores of 68.36 and 33.56, respectively, with respect to real lacunes. Furthermore, the impact of incorporating simulated lesions during training is evident from the FROC curve shown in Figure 8 (bottom panel). When the CPG module was trained without simulated lesions, using only 2,724 slices from the ISLES dataset (as indicated in Section 2.5 ), it achieved a sensitivity of 79%, despite allowing an average of 21 FPs/subject. In contrast, the inclusion of simulated lesions expanded the training set to 14,724 slices, enabling the CPG module to achieve a higher sensitivity of 91% while also reducing the average FPs to 15/subject, highlighting the effectiveness of the simulated lesion in enhancing the performance. Download figure Open in new tab Figure 8: Effect of simulations from SLS module on CPG performance. Top: T-SNE plot showing good oevrlap between real-world lacunes and synthetic lacunes simulated using SLS. Bottom: FROC curves showing the comparison of the performance of the CPG module trained with and without inclusion of simulated data (green and blue curves respectively) for the ISLES Dataset (the operating points that provide the best performance are indicated by dotted lines). 4.5 Self-Distillation for robust lacune candidate detection in a low-data regime Table 3 reports the results of the comparison of CPG detection performance for self-distillation and with training on a combined dataset (VALDO + ISLES) on the VALDO dataset. The self-distillation approach significantly improved the lacune detection performance of the CPG module, achieving a sensitivity of 92.1% for lacune candidates annotated by both raters. The ISLES dataset was acquired from individuals with suspected or diagnosed stroke, whereas the VALDO dataset was collected from an asymptomatic population. This resulted in significant variations in the appearance of lacunes, which were influenced by differences in lesion location and age. Owing to these disparities in lacune characteristics, the model trained on the combined dataset could not adapt exclusively to the VALDO dataset, and hence showed reduced sensitivity. This was further exacerbated by a significant sample size imbalance between the VALDO and ISLES datasets. However, self-distillation effectively captured true lacunes in the VALDO dataset, despite a slight increase in AED, which was addressed in subsequent modules to improve the performance. View this table: View inline View popup Download powerpoint Table 3: Comparison of the CPG module’s performance on the VALDO dataset using a combination of both datasets and self-distillation as training strategies, with the best sensitivity value reported in bold. (↑)/(↓) indicates that higher/lower values are better. The median values (with the interquartile range in brackets) are reported for F1 value and AED. 4.6 Comparison with existing methods The proposed lacune detection method demonstrated superior performance compared with existing approaches across multiple metrics, as shown in Table 4 . It consistently achieved high accuracy across varying image resolutions, with significantly lower false positive rates of 0.05 and 0.06 per slice for both datasets which is less than half the rate reported by Ghafoorian et al. ( Ghafoorian et al., 2017 ). This significant reduction in false positives can be attributed to our novel modular strategy of examining candidates across all three axes using SAM and integrating knowledge of the regional distribution of lacunes. View this table: View inline View popup Download powerpoint Table 4: Comparison of the performance of proposed method for detection of lacunes with the existing semi-automated and automated methods. (↑)/(↓) indicates that higher/lower values are better. The median values are reported for F1 value and AED. Although Ghafoorian et al.’s approach achieved a sensitivity of 97.4% for lacunes agreed upon by three out of four raters, with 0.13 false positives per slice, their false positive rate was significantly higher than our reported rate of 0.05 per slice, corresponding to a sensitivity of 84.26% on lacunes agreed upon by any two of the four raters involved in their study. In addition, while their model was evaluated on uniform resolution volumes from a single scanner model, our approach demonstrated greater versatility, maintaining strong performance across multi-resolution data from four different imaging centres. In particular, our method demonstrated improved performance compared to the top entries in the VALDO challenge, achieving a sensitivity of 92.31% on lacune candidates agreed upon by both raters in VALDO and 84.26% in ISLES, supported by higher F1 scores computed for comparable numbers of lacunes across both datasets. The method proposed by Duan et al . ( Duan et al., 2020 ) achieved a region-wise F1 score of 68.3, while our method achieved an on-par F1-score on a volume-wise basis, despite the fact that the region-wise F1 scores typically surpass volume-wise scores. Furthermore, unlike existing methods that depend on multiple imaging sequences for decision making (summarised in Table 4 ), our approach maintains optimal performance while relying solely on FLAIR sequences. 5 Discussion In this study, we proposed a modular framework for lacune detection that integrates lacune candidate prompt generation, SAM-based morphological examination, and adaptive thresholding for false positive reduction. Given the wide range of appearance-based heterogeneity, inter-slice variations, and multi-centre datasets with limited training data from specific target datasets, the proposed method augmented the training data using simulated lesions and used contrastive learning and knowledge distillation approaches to ensure the accurate detection of lacunes. Using only FLAIR sequences, our method achieved sensitivities of 84.26% and 92.31% on the ISLES and VALDO datasets, respectively, with corresponding F1 scores of 67.38% and 69.92%, respectively, compared favourably with existing state-of-the-art approaches. In general, the detection of lacunes is challenging owing to their small size and heterogeneous appearance, and often leads to diagnostic disagreement, even among experienced clinicians, as evidenced in previous studies ( Ghafoorian et al., 2017 ; Sudre et al., 2024 ; Duan et al., 2020 ). These challenges resulted in existing approaches reporting a higher number of false positives, as shown in Table 4 . The existing methods also exhibit limitations when processing datasets with varying resolutions and cannot efficiently handle volumes of higher slice thicknesses. This is particularly common in stroke imaging (given that lacunes are crucial biomarkers for stroke diagnosis), which typically involves larger slice thicknesses for quicker acquisition. Hence, an automated lacune detection method should be capable of working reliably across a range of image resolutions, irrespective of its small size. Our methodology successfully addressed these limitations by implementing specialised modules, each targeting distinct aspects of lacune detection. The initial CPG module identified potential lacune candidates with high sensitivity, although it allowed for some false positives. The CPG module used the U 2 Net model, which incorporated multiple Residual U-blocks (RSUs) that effectively processed features across various receptive fields while preserving fine details. This is a crucial requirement for detecting small lesions, such as lacunes, thus providing sufficiently high sensitivities of 85.19% and 92.31% for the ISLES and VALDO datasets, respectively, as indicated in Table 2 . Furthermore, our data augmentation strategy implemented a lesion simulation process that generated realistic lacune lesions using shape- and noise-based texture priors, followed by translation using a cycle-GAN to match the dataset-specific lacune characteristics. This two-phase approach proved essential for lacune simulation, as in general, GANs struggle with the generation of small lesions from scratch, while simple contrast blending of shape and texture priors failed to accurately replicate actual lacune characteristics because of their small size and unique appearance (hypointense centre with a hyperintense rim). However, the inclusion of simulated lesions for training addressed the challenge of limited data, generating synthetic lesions with typical lacune characteristics with sufficient diversity. This enabled the model to learn the complex characteristics of lacunes better, leading to an improvement in the sensitivity of the CPG module from 75% to 91%, while significantly reducing false positives (as shown in Figure 8 (bottom panel)). Finally, the training process of the CPG module utilized 2D axial slices and employed a combination of focal, Tversky, and contrastive loss functions, enhancing the module’s capability to learn subtle inter-slice variations and challenging lacune examples while differentiating tissue characteristics (as shown in Figure 6 ). In the proposed method, the SAM module played a major role in the reduction of false positives and effectively mimicked the clinical expert’s decision making for distinguishing true lacunes from the mimics. In the SAM-based selection module, we examined potential lacunes from all three anatomical axes to distinguish true lacunes from false positives, such as sulci, EPVS, and low-contrast regions. SAM proved particularly well suited for this task because of its zero-shot segmentation capabilities ( Kirillov et al., 2023 ), offering precise segmentation of lacunes when provided with representative point prompts from candidates, regardless of domain shifts. We strategically extracted point prompts (rather than bounding boxes) to enable unrestricted segmentation along elongated structures such as sulci or ventricles, provided the prompt was positioned well within the structure. Additionally, the ART module helped eliminating challenging mimics that closely resembled lacunes (when viewed from all axes, thus being overlooked by SAM) by employing adaptive thresholds. For this, we utilised the MARS map which was originally designed as a standard region-based atlas for rating another CSVD sign: cerebral microbleeds. In addition to the common risk factors associated with both signs, the MARS map also provided detailed parcellation of the brain that was sufficient to analyse the spatial distribution of lacunes. To the best of our knowledge, this is the first approach to use population-level insights and lacune incidence to define region-specific adaptive thresholds, filter false positives, and improve the precision of lacune detection. The datasets used in our evaluation were distinct with notably different characteristics. The ISLES dataset comprised patients with diagnosed or suspected stroke (from two different centres), whereas the VALDO dataset was collected from individuals without dementia who were being monitored for chronic illnesses, metabolic conditions, and cardiovascular diseases (from 2 different cohorts), as detailed in Section 2.6 . These distinct patient populations exhibit markedly different lacune characteristics. For instance, lacunes in the ISLES dataset were predominantly extensively cavitated, with highly irregular, thin, or completely absent hyperintense rims. In contrast, the lacunes in the VALDO dataset featured prominent hyperintense rims and small cavitated areas, consistent with the asymptomatic population. For the VALDO dataset, despite the significant domain shift from the ISLES dataset, varying appearance characteristics, and limited size of the VALDO training set, our method achieved its highest performance owing to our self-distillation strategy for initial prompt generation, as indicated in Table 3 . This approach focused on minimising distillation loss and aligning the student model’s outputs with the teacher’s softened predictions, which allowed the model to learn high-level abstractions that best discriminated lacunes from the mimics, which were invariant across datasets. Our method compared favourably with the existing method and achieved high detection sensitivity with minimal false positives at rates of 0.05 and 0.06 per slice for the ISLES and VALDO datasets, respectively. However, there is still scope for improvement in the generalisability and computational complexity of the proposed method. For instance, the limitations include the additional computation required to train the cycleGAN model for synthetic lacune simulations on individual datasets to match its specific characteristics. In addition, the adaptive threshold values relied on the lacune features learned by the model on the individual datasets, hence segmenting lacunes with higher/lower softmax scores. Note that despite the minor increment in the threshold values, the overall trend of the threshold across different regions remained consistent (high > medium > low), thus illustrating the importance of adaptive thresholds. 6 Conclusions The proposed method achieved sensitivity values of 84.26% and 92.31%, with average FP of 0.05 and 0.06 per slice, and median F1-scores of 67.38 and 69.92 on the ISLES and VALDO datasets, respectively, outperforming the existing state-of-the-art methods. The proposed method could enable the determination of lacune counts in various brain regions, which is crucial for analysing the spatial distribution of lacunes and their joint effect with other comorbidities related to neurodegeneration. Future research directions include studying the population-level correlation between lacune characteristics and several clinical/demographic factors, with a focus on risk prediction and prognosis for various neurological and neurodegenerative diseases. The code files have been made available at https://github.com/PonDeepika/Lacune_Detection Data Availability All data produced are available online at 1) https://zenodo.org/records/7153326 2) https://zenodo.org/records/4520773 https://zenodo.org/records/7153326 https://zenodo.org/records/4520773 CRediT authorship contribution statement Pon Deepika: Conceptualization, Methodology, Software, Validation, Investigation, Formal analysis, Writing - original draft, Visualization. Gouri Shanker: Writing - review & editing, Validation, Investigation. Ramanujam Narayanan: Writing - review & editing, Validation, Investigation. Vaanathi Sundaresan: Conceptualization, Writing – review & editing, Supervision, Resources, Project administration, Funding acquisition, Data curation. Declaration of Competing Interest The authors declare that they have no known competing financial interests or personal relationships that could have appeared to influence the work reported in this paper. Ethics Statement For the VALDO dataset, all cohorts were retrospective studies for which local ethical approval had already been obtained from the National Research Ethics Service Committee, London-Fulham (14/LO/0108) for SABRE and the Population Research Act from the Ministry of Health for RSS. For all datasets, acquisition of the data was performed by a trained radiographer according to a predefined research protocol. For the ISLES dataset, the retrospective evaluation of imaging data was approved by the local ethics boards of all participating centers. Requirement of written informed consent was waived by all ethics boards due to the retrospective nature of the study and the rigorous patient de-identification of the data. Funding This work was supported by DBT/Wellcome Trust India Alliance Fellowship [IA/E/22/1/506763]. This work was also supported in part by a grant from the Council of Scientific & Industrial Research (CSIR) under its ASPIRE (Women Scientist Scheme) program [25WS(013)/2023-24/EMR-II/ASPIRE], in part by Start-up Research Grant [SRG/2023/001406] from the Science and Engineering Research Board, India and in part by Siemens Healthineers-CDS Collaborative Laboratory of Artificial Intelligence in Precision Medicine, India. VS is also supported by Pratiksha Trust, Bangalore, India [FG/PTCH-23-1004] and the Seed Research Grant [IE/RERE-22-0583] from the Indian Institute of Science, India. Data availability The ISLES dataset is publicly available at https://zenodo.org/records/7153326 Acknowledgements The VALDO Dataset study was funded by Wellcome Trust (082464/Z/07/Z), British Heart Foundation (SP/07/001/ 23603, PG/08/103, PG/12/29/29497 and CS/13/1/30327), Erasmus MC University Medical Center, the Erasmus University Rotterdam, the Netherlands Organization for Scientific Research (NWO) Grant 918-46-615, the Netherlands Organization for Health Research and Development (ZonMW), the Research Institute for Disease in the Elderly (RIDE), and the European Union Seventh Framework Programme (FP7/2007–2013) under grant agreement No. 601055, VPHDARE@IT, the Dutch Technology Foundation STW. References ↵ Al-Masni , M.A. , Kim , W.R. , Kim , E.Y. , Noh , Y. , et al. , 2021 . 3d multi-scale residual network toward lacunar infarcts identification from mr images with minimal user intervention . IEEE Access 9 , 11787 – 11797 . OpenUrl ↵ Benjamin , P. , Lawrence , A.J. , Lambert , C. , Patel , B. , et al. , 2014 . Strategic lacunes and their relationship to cognitive impairment in cerebral small vessel disease . NeuroImage: Clinical 4 , 828 – 837 . OpenUrl PubMed ↵ Chen , H. , Zhang , M. , Liu , G. , Wang , X. , et al. , 2020 . Effect of small vessel disease burden and lacunes on gait/posture impairment in parkinson’s disease . Neurological Sciences 41 , 3617 – 3624 . OpenUrl PubMed ↵ Choi , Y. , Al-Masni , M.A. , Jung , K.J. , Yoo , R.E. , et al. , 2023 . A single stage knowledge distillation network for brain tumor segmentation on limited mr image modalities . Computer Methods and Programs in Biomedicine 240 , 107644 . OpenUrl PubMed ↵ Duan , Y. , Shan , W. , Liu , L. , Wang , Q. , et al. , 2020 . Primary categorizing and masking cerebral small vessel disease based on “deep learning system” . Frontiers in Neuroinformatics 14 , 17 . OpenUrl PubMed ↵ Duering , M. , Biessels , G.J. , Brodtmann , A. , Chen , C. , et al. , 2023 . Neuroimaging standards for research into small vessel disease—advances since 2013 . The Lancet Neurology 22 , 602 – 618 . OpenUrl PubMed ↵ Duering , M. , Csanadi , E. , Gesierich , B. , Jouvent , E. , et al. , 2013 . Incident lacunes preferentially localize to the edge of white matter hyperintensities: insights into the pathophysiology of cerebral small vessel disease . Brain 136 , 2717 – 2726 . OpenUrl CrossRef PubMed Web of Science ↵ Ghafoorian , M. , Karssemeijer , N. , Heskes , T. , Bergkamp , M. , et al. , 2017 . Deep multi-scale location-aware 3d convolutional neural networks for automated detection of lacunes of presumed vascular origin . NeuroImage: Clinical 14 , 391 – 399 . OpenUrl PubMed ↵ Gregoire , S. , Chaudhary , U. , Brown , M. , Yousry , T. , et al. , 2009 . The microbleed anatomical rating scale (mars) reliability of a tool to map brain microbleeds . Neurology 73 , 1759 – 1766 . OpenUrl CrossRef PubMed ↵ Hatamizadeh , A. , Nath , V. , Tang , Y. , Yang , D. , et al. , 2021 . Swin unetr: Swin transformers for semantic segmentation of brain tumors in mri images , in: International MICCAI brainlesion workshop , Springer . pp. 272 – 284 . ↵ Hernandez Petzsche , M.R. , de la Rosa , E. , Hanning , U. , Wiest , R. , et al. , 2022 . Isles 2022: A multi-center magnetic resonance imaging stroke lesion segmentation dataset . Scientific data 9 , 762 . OpenUrl PubMed ↵ Heusel , M. , Ramsauer , H. , Unterthiner , T. , Nessler , B. , et al. , 2017 . Gans trained by a two timescale update rule converge to a local nash equilibrium . Advances in neural information processing systems 30 . ↵ Ikram , M.A. , van der Lugt , A. , Niessen , W.J. , Koudstaal , P.J. , et al. , 2015 . The rotterdam scan study: design update 2016 and main findings . European journal of epidemiology 30 , 1299 – 1315 . OpenUrl CrossRef PubMed ↵ Jenkinson , M. , Beckmann , C.F. , Behrens , T.E. , Woolrich , M.W. , et al. , 2012 . Fsl . Neuroimage 62 , 782 – 790 . OpenUrl CrossRef PubMed Web of Science ↵ Jha , D. , Smedsrud , P.H. , Riegler , M.A. , Johansen , D. , et al. , 2019 . Resunet++: An advanced architecture for medical image segmentation , in: 2019 IEEE international symposium on multimedia (ISM) , IEEE . pp. 225 – 2255 . ↵ Jokinen , H. , Gouw , A. , Madureira , S. , Ylikoski , R. , et al. , 2011 . Incident lacunes influence cognitive decline: the ladis study . Neurology 76 , 1872 – 1878 . OpenUrl CrossRef PubMed ↵ Jones , S. , Tillin , T. , Park , C. , Williams , S. , et al. , 2020 . Cohort profile update: Southall and brent revisited (sabre) study: a uk population-based comparison of cardiovascular disease and diabetes in people of european, south asian and african caribbean heritage . International journal of epidemiology 49 , 1441 – 1442e . OpenUrl CrossRef PubMed ↵ Khosla , P. , Teterwak , P. , Wang , C. , Sarna , A. , et al. , 2020 . Supervised contrastive learning . Advances in neural information processing systems 33 , 18661 – 18673 . OpenUrl ↵ Kim , K. , Ji , B. , Yoon , D. , Hwang , S. , 2020 . Self-knowledge distillation: A simple way for better generalization . arXiv preprint arxiv: 2006.12000 3. ↵ Kim , S. , Park , H. , Kang , M. , Jin , K.H. , et al. , 2024 . Federated learning with knowledge distillation for multi-organ segmentation with partially labeled datasets . Medical Image Analysis 95 , 103156 . OpenUrl PubMed ↵ Kirillov , A. , Mintun , E. , Ravi , N. , Mao , H. , Rolland , C. , et al. , 2023 . Segment anything , in: Proceedings of the IEEE/CVF International Conference on Computer Vision , pp. 4015 – 4026 . ↵ Kuang , Z. , Wang , J. , Sun , D. , Zhao , J. , et al. , 2024 . Incremental attribute learning by knowledge distillation method . Journal of Computational Design and Engineering 11 , 259 – 283 . OpenUrl ↵ Mazurowski , M.A. , Dong , H. , Gu , H. , Yang , J. , et al. , 2023 . Segment anything model for medical image analysis: an experimental study . Medical Image Analysis 89 , 102918 . OpenUrl CrossRef PubMed ↵ Narayanan , R. , Sundaresan , V. , 2024 . Medlessynth-ld: Lesion synthesis using physics-based noise models for robust lesion segmentation in low-data medical imaging regimes . Pattern Recognition Letters . ↵ Oktay , O. , 2018 . Attention u-net: Learning where to look for the pancreas . arXiv preprint arxiv: 1804.03999 . ↵ Orbes-Arteainst , M. , Cardoso , J. , Sørensen , L. , Igel , C. , et al. , 2019 . Knowledge distillation for semi-supervised domain adaptation , in: OR 2.0 Context-Aware Operating Theaters and Machine Learning in Clinical Neuroimaging: Second International Workshop, OR 2.0 2019, and Second International Workshop, MLCN 2019, Held in Conjunction with MICCAI 2019, Shenzhen, China , Springer . pp. 68 – 76 . ↵ Paluru , N. , Ravishankar , H. , Hegde , S. , Yalavarthy , P.K. , 2023 . Self distillation for improving the generalizability of retinal disease diagnosis using optical coherence tomography images . IEEE Journal of Selected Topics in Quantum Electronics 29 , 1 – 12 . OpenUrl ↵ Qin , X. , Zhang , Z. , Huang , C. , Dehghan , M. , et al. , 2020 . U2-net: Going deeper with nested ustructure for salient object detection . Pattern recognition 106 , 107404 . OpenUrl CrossRef ↵ Ross , T.Y. , Dollár , G. , 2017 . Focal loss for dense object detection , in: proceedings of the IEEE conference on computer vision and pattern recognition , pp. 2980 – 2988 . ↵ Salehi , S.S.M. , Erdogmus , D. , Gholipour , A. , 2017 . Tversky loss function for image segmentation using 3d fully convolutional deep networks , in: International workshop on machine learning in medical imaging , Springer . pp. 379 – 387 . ↵ Serrador , L. , Villani , F.P. , Moccia , S. , Santos , C.P. , 2024 . Knowledge distillation on individual vertebrae segmentation exploiting 3d u-net . Computerized Medical Imaging and Graphics 113 , 102350 . OpenUrl PubMed ↵ Singhal , P. , Walambe , R. , Ramanna , S. , Kotecha , K. , 2023 . Domain adaptation: challenges, methods, datasets, and applications . IEEE access 11 , 6973 – 7020 . OpenUrl ↵ Smith , S.M. , 2002 . Fast robust automated brain extraction . Human brain mapping 17 , 143 – 155 . OpenUrl CrossRef PubMed Web of Science ↵ Sudre , C.H. , Anson , B.G. , Ingala , S. , Lane , C.D. , et al. , 2019 . 3d multirater rcnn for multimodal multiclass detection and characterisation of extremely small objects , in: International Conference on Medical Imaging with Deep Learning , PMLR . pp. 447 – 456 . ↵ Sudre , C.H. , Van Wijnen , K. , Dubost , F. , Adams , H. , et al. , 2024 . Where is valdo? vascular lesions detection and segmentation challenge at miccai 2021 . Medical Image Analysis 91 , 103029 . OpenUrl PubMed ↵ Sundaresan , V. , Arthofer , C. , Zamboni , G. , Murchison , A.G. , Dineen , R.A. , et al. , 2023 . Automated detection of cerebral microbleeds on mr images using knowledge distillation framework . Frontiers in Neuroinformatics 17 , 1204186 . OpenUrl PubMed ↵ Sundaresan , V. , Zamboni , G. , Dineen , R.A. , Auer , D.P. , Sotiropoulos , S.N. , Sprigg , N. , Jenkinson , M. , Griffanti , L. , 2025 . Automated characterisation of cerebral microbleeds using their size and spatial distribution on brain mri . European Radiology Experimental 9 , 5 . OpenUrl PubMed ↵ Tillin , T. , Forouhi , N.G. , McKeigue , P.M. , Chaturvedi , N. , 2012 . Southall and brent revisited: Cohort profile of sabre, a uk population-based comparison of cardiovascular disease and diabetes in people of european, indian asian and african caribbean origins . International journal of epidemiology 41 , 33 – 42 . OpenUrl CrossRef PubMed Web of Science ↵ Uchiyama , Y. , Abe , A. , Muramatsu , C. , Hara , T. , et al. , 2015 . Eigenspace template matching for detection of lacunar infarcts on mr images . Journal of digital imaging 28 , 116 – 122 . OpenUrl PubMed ↵ Uchiyama , Y. , Asano , T. , Kato , H. , Hara , T. , et al. , 2012 . Computer-aided diagnosis for detection of lacunar infarcts on mr images: Roc analysis of radiologists’ performance . Journal of digital imaging 25 , 497 – 503 . OpenUrl CrossRef PubMed ↵ Uchiyama , Y. , Kunieda , T. , Asano , T. , Kato , H. , et al. , 2008 . Computer-aided diagnosis scheme for classification of lacunar infarcts and enlarged virchow-robin spaces in brain mr images , in: 2008 30th Annual International Conference of the IEEE Engineering in Medicine and Biology Society , IEEE . pp. 3908 – 3911 . ↵ Uchiyama , Y. , Yokoyama , R. , Ando , H. , Asano , T. , et al. , 2007a . Computer-aided diagnosis scheme for detection of lacunar infarcts on mr images . Academic radiology 14 , 1554 – 1561 . OpenUrl PubMed ↵ Uchiyama , Y. , Yokoyama , R. , Ando , H. , Asano , T. , et al. , 2007b . Improvement of automated detection method of lacunar infarcts in brain mr images , in: 2007 29th Annual International Conference of the IEEE Engineering in Medicine and Biology Society , IEEE . pp. 1599 – 1602 . ↵ Vermeer , S.E. , Hollander , M. , van Dijk , E.J. , Hofman , A. , et al. , 2003 . Silent brain infarcts and white matter lesions increase stroke risk in the general population: the rotterdam scan study . Stroke 34 , 1126 – 1129 . OpenUrl Abstract / FREE Full Text ↵ Wang , Y. , Catindig , J.A. , Hilal , S. , Soon , H.W. , et al. , 2012 . Multi-stage segmentation of white matter hyperintensity, cortical and lacunar infarcts . Neuroimage 60 , 2379 – 2388 . OpenUrl CrossRef PubMed ↵ Wardlaw , J.M. , 2008 . What is a lacune? ↵ Wardlaw , J.M. , Smith , E.E. , Biessels , G.J. , Cordonnier , C. , et al. , 2013 . Neuroimaging standards for research into small vessel disease and its contribution to ageing and neurodegeneration . The Lancet Neurology 12 , 822 – 838 . OpenUrl PubMed ↵ Yokoyama , R. , Zhang , X. , Uchiyama , Y. , Fujita , H. , et al. , 2007 . Development of an automated method for the detection of chronic lacunar infarct regions in brain mr images . IEICE transactions on information and systems 90 , 943 – 954 . OpenUrl ↵ Yushkevich , P.A. , Piven , J. , Hazlett , H.C. , Smith , R.G. , et al. , 2006 . User-guided 3d active contour segmentation of anatomical structures: significantly improved efficiency and reliability . Neuroimage 31 , 1116 – 1128 . OpenUrl CrossRef PubMed Web of Science ↵ Zhang , Y. , Brady , M. , Smith , S. , 2001 . Segmentation of brain mr images through a hidden markov random field model and the expectation-maximization algorithm . IEEE transactions on medical imaging 20 , 45 – 57 . OpenUrl CrossRef PubMed Web of Science ↵ Zhou , Z. , Rahman Siddiquee , M.M., Tajbakhsh , N. , Liang , J. , 2018 . Unet++: A nested u-net architecture for medical image segmentation , in: Deep Learning in Medical Image Analysis and Multimodal Learning for Clinical Decision Support: 4th International Workshop, DLMIA 2018, and 8th International Workshop, ML-CDS 2018, Held in Conjunction with MICCAI 2018 , Granada, Spain , Springer . pp. 3 – 11 . ↵ Zhu , J.Y. , Park , T. , Isola , P. , Efros , A.A. , 2017 . Unpaired image-to-image translation using cycleconsistent adversarial networks , in: Proceedings of the IEEE international conference on computer vision , pp. 2223 – 2232 . View the discussion thread. Back to top Previous Next Posted July 10, 2025. Download PDF Data/Code Email Thank you for your interest in spreading the word about medRxiv. NOTE: Your email address is requested solely to identify you as the sender of this article. Your Email * Your Name * Send To * Enter multiple addresses on separate lines or separate them with commas. You are going to email the following Automated Detection of Lacunes in Brain MR Images Using SAM with Robust Prompts via Self-Distillation and Anatomy-Informed Priors Message Subject (Your Name) has forwarded a page to you from medRxiv Message Body (Your Name) thought you would like to see this page from the medRxiv website. Your Personal Message CAPTCHA This question is for testing whether or not you are a human visitor and to prevent automated spam submissions. Share Automated Detection of Lacunes in Brain MR Images Using SAM with Robust Prompts via Self-Distillation and Anatomy-Informed Priors Pon Deepika , Gouri Shanker , Ramanujam Narayanan , Vaanathi Sundaresan medRxiv 2025.07.09.25331177; doi: https://doi.org/10.1101/2025.07.09.25331177 Share This Article: Copy Citation Tools Automated Detection of Lacunes in Brain MR Images Using SAM with Robust Prompts via Self-Distillation and Anatomy-Informed Priors Pon Deepika , Gouri Shanker , Ramanujam Narayanan , Vaanathi Sundaresan medRxiv 2025.07.09.25331177; doi: https://doi.org/10.1101/2025.07.09.25331177 Citation Manager Formats BibTeX Bookends EasyBib EndNote (tagged) EndNote 8 (xml) Medlars Mendeley Papers RefWorks Tagged Ref Manager RIS Zotero Tweet Widget Facebook Like Google Plus One Subject Area Radiology and Imaging Subject Areas All Articles Addiction Medicine (568) Allergy and Immunology (863) Anesthesia (297) Cardiovascular Medicine (4421) Dentistry and Oral Medicine (443) Dermatology (382) Emergency Medicine (606) Endocrinology (including Diabetes Mellitus and Metabolic Disease) (1507) Epidemiology (15212) Forensic Medicine (30) Gastroenterology (1121) Genetic and Genomic Medicine (6581) Geriatric Medicine (667) Health Economics (996) Health Informatics (4520) Health Policy (1366) Health Systems and Quality Improvement (1611) Hematology (539) HIV/AIDS (1264) Infectious Diseases (except HIV/AIDS) (15906) Intensive Care and Critical Care Medicine (1103) Medical Education (620) Medical Ethics (144) Nephrology (667) Neurology (6580) Nursing (345) Nutrition (998) Obstetrics and Gynecology (1141) Occupational and Environmental Health (956) Oncology (3324) Ophthalmology (970) Orthopedics (369) Otolaryngology (420) Pain Medicine (435) Palliative Medicine (129) Pathology (663) Pediatrics (1689) Pharmacology and Therapeutics (691) Primary Care Research (710) Psychiatry and Clinical Psychology (5432) Public and Global Health (9212) Radiology and Imaging (2193) Rehabilitation Medicine and Physical Therapy (1368) Respiratory Medicine (1194) Rheumatology (593) Sexual and Reproductive Health (709) Sports Medicine (529) Surgery (709) Toxicology (99) Transplantation (288) Urology (265) (function(){function c(){var b=a.contentDocument||a.contentWindow.document;if(b){var d=b.createElement('script');d.innerHTML="window.__CF$cv$params={r:'9ff4a87b7fc14193',t:'MTc3OTM3NzgwMQ=='};var a=document.createElement('script');a.src='/cdn-cgi/challenge-platform/scripts/jsd/main.js';document.getElementsByTagName('head')[0].appendChild(a);";b.getElementsByTagName('head')[0].appendChild(d)}}if(document.body){var a=document.createElement('iframe');a.height=1;a.width=1;a.style.position='absolute';a.style.top=0;a.style.left=0;a.style.border='none';a.style.visibility='hidden';document.body.appendChild(a);if('loading'!==document.readyState)c();else if(window.addEventListener)document.addEventListener('DOMContentLoaded',c);else{var e=document.onreadystatechange||function(){};document.onreadystatechange=function(b){e(b);'loading'!==document.readyState&&(document.onreadystatechange=e,c())}}}})();

Text is read by the "Ask this paper" AI Q&A widget below. Extraction quality varies by source — PMC NXML preserves structure cleanly, OA-HTML may include some navigation residue, and OA-PDF can have broken hyphenation. The publisher copy (via DOI) is the canonical version.

My notes (saved in your browser only)

Ask this paper AI returns verbatim quotes from the full text · source: preprint-html

Answers must be backed by verbatim quotes from this paper's full text. Hallucinated quotes are dropped automatically; if no verbatim passage answers the question, we say so. How this works

Citation neighborhood (no data yet)

We don't have any in-corpus citations linked to this paper yet. This is a recent paper (2025) — citers typically take a year or two to land, and the OpenAlex reference graph may still be filling in.

Source provenance

europepmc
last seen: 2026-05-20T01:45:00.602351+00:00
unpaywall
last seen: 2026-05-21T05:10:58.409756+00:00
License: CC-BY-NC-ND-4.0