Breast Cancer Detection with Topological Deep Learning

preprint OA: closed
📄 Open PDF Full text JSON View at publisher
Full text 84,346 characters · extracted from preprint-html · click to expand
Breast Cancer Detection with Topological Deep Learning | medRxiv /* */ /* */ <!-- <!-- /*! * yepnope1.5.4 * (c) WTFPL, GPLv2 */ (function(a,b,c){function d(a){return"[object Function]"==o.call(a)}function e(a){return"string"==typeof a}function f(){}function g(a){return!a||"loaded"==a||"complete"==a||"uninitialized"==a}function h(){var a=p.shift();q=1,a?a.t?m(function(){("c"==a.t?B.injectCss:B.injectJs)(a.s,0,a.a,a.x,a.e,1)},0):(a(),h()):q=0}function i(a,c,d,e,f,i,j){function k(b){if(!o&&g(l.readyState)&&(u.r=o=1,!q&&h(),l.onload=l.onreadystatechange=null,b)){"img"!=a&&m(function(){t.removeChild(l)},50);for(var d in y[c])y[c].hasOwnProperty(d)&&y[c][d].onload()}}var j=j||B.errorTimeout,l=b.createElement(a),o=0,r=0,u={t:d,s:c,e:f,a:i,x:j};1===y[c]&&(r=1,y[c]=[]),"object"==a?l.data=c:(l.src=c,l.type=a),l.width=l.height="0",l.onerror=l.onload=l.onreadystatechange=function(){k.call(this,r)},p.splice(e,0,u),"img"!=a&&(r||2===y[c]?(t.insertBefore(l,s?null:n),m(k,j)):y[c].push(l))}function j(a,b,c,d,f){return q=0,b=b||"j",e(a)?i("c"==b?v:u,a,b,this.i++,c,d,f):(p.splice(this.i++,0,a),1==p.length&&h()),this}function k(){var a=B;return a.loader={load:j,i:0},a}var l=b.documentElement,m=a.setTimeout,n=b.getElementsByTagName("script")[0],o={}.toString,p=[],q=0,r="MozAppearance"in l.style,s=r&&!!b.createRange().compareNode,t=s?l:n.parentNode,l=a.opera&&"[object Opera]"==o.call(a.opera),l=!!b.attachEvent&&!l,u=r?"object":l?"script":"img",v=l?"script":u,w=Array.isArray||function(a){return"[object Array]"==o.call(a)},x=[],y={},z={timeout:function(a,b){return b.length&&(a.timeout=b[0]),a}},A,B;B=function(a){function b(a){var a=a.split("!"),b=x.length,c=a.pop(),d=a.length,c={url:c,origUrl:c,prefixes:a},e,f,g;for(f=0;f<d;f++)g=a[f].split("="),(e=z[g.shift()])&&(c=e(c,g));for(f=0;f<b;f++)c=x[f](c);return c}function g(a,e,f,g,h){var i=b(a),j=i.autoCallback;i.url.split(".").pop().split("?").shift(),i.bypass||(e&&(e=d(e)?e:e[a]||e[g]||e[a.split("/").pop().split("?")[0]]),i.instead?i.instead(a,e,f,g,h):(y[i.url]?i.noexec=!0:y[i.url]=1,f.load(i.url,i.forceCSS||!i.forceJS&&"css"==i.url.split(".").pop().split("?").shift()?"c":c,i.noexec,i.attrs,i.timeout),(d(e)||d(j))&&f.load(function(){k(),e&&e(i.origUrl,h,g),j&&j(i.origUrl,h,g),y[i.url]=2})))}function h(a,b){function c(a,c){if(a){if(e(a))c||(j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}),g(a,j,b,0,h);else if(Object(a)===a)for(n in m=function(){var b=0,c;for(c in a)a.hasOwnProperty(c)&&b++;return b}(),a)a.hasOwnProperty(n)&&(!c&&!--m&&(d(j)?j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}:j[n]=function(a){return function(){var b=[].slice.call(arguments);a&&a.apply(this,b),l()}}(k[n])),g(a[n],j,b,n,h))}else!c&&l()}var h=!!a.test,i=a.load||a.both,j=a.callback||f,k=j,l=a.complete||f,m,n;c(h?a.yep:a.nope,!!i),i&&c(i)}var i,j,l=this.yepnope.loader;if(e(a))g(a,0,l,0);else if(w(a))for(i=0;i (function(w,d,s,l,i){w[l]=w[l]||[];w[l].push({'gtm.start':new Date().getTime(),event:'gtm.js'});var f=d.getElementsByTagName(s)[0];var j=d.createElement(s);var dl=l!='dataLayer'?'&l='+l:'';j.src='//www.googletagmanager.com/gtm.js?id='+i+dl;j.type='text/javascript';j.async=true;f.parentNode.insertBefore(j,f);})(window,document,'script','dataLayer','GTM-P4HH5NV'); Skip to main content Home About Submit ALERTS / RSS Search for this keyword Advanced Search Breast Cancer Detection with Topological Deep Learning View ORCID Profile Brighton Nuwagira , Adrian Rodriguez , View ORCID Profile Qiwei Li , View ORCID Profile Baris Coskunuzer doi: https://doi.org/10.1101/2025.10.15.25338098 Brighton Nuwagira 1 Dept. of Math. Sciences, UT Dallas Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Brighton Nuwagira Adrian Rodriguez 2 Dept. of Computer Science, UT Dallas Find this author on Google Scholar Find this author on PubMed Search for this author on this site Qiwei Li 1 Dept. of Math. Sciences, UT Dallas Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Qiwei Li Baris Coskunuzer 1 Dept. of Math. Sciences, UT Dallas Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Baris Coskunuzer For correspondence: coskunuz{at}utdallas.edu Abstract Full Text Info/History Metrics Data/Code Preview PDF Abstract In this paper, we investigate the integration of topological data analysis (TDA) techniques with deep learning (DL) models to improve breast cancer diagnosis from ultrasound images. By leveraging persistent homology, a TDA method that captures global structural patterns, we enrich the local spatial features typically learned by DL models. We in-corporate topological features into various pre-trained architectures, including CNNs and vision transformers (VTs), aiming to enhance screening accuracy for breast cancer, which remains the most common cancer among women. Experiments on publicly available ultrasound datasets demonstrate that combining CNNs and VTs with topological features consistently yields statistically significant performance improvements. Notably, this approach also helps to address challenges faced by DL models, such as interpretability and reliance on large labeled datasets. Further-more, we generalize the Alexander duality theorem to cubical persistence, showing that persistent homology remains invariant under sublevel and superlevel filtrations for image data. This advancement reduces computational costs, making TDA methods more practical for image analysis. 1. Introduction Medical image analysis plays a pivotal role in modern healthcare, revolutionizing diagnostics, treatment planning, and patient care. The application of deep learning (DL) models in medical image analysis has drastically transformed diagnostic procedures, significantly improving disease detection and categorization [ 44 , 60 ]. DL models excel in extracting intricate patterns from complex medical images like Magnetic resonance imaging (MRI) scans, computed tomography (CT) scans, and X-rays, empowering healthcare professionals with enhanced capabilities. They have demonstrated exceptional performance in tasks such as tumor detection, organ segmentation, and anomaly identification, reducing human error and expediting analyses [ 79 ]. However, challenges such as data scarcity, interpretability, and clinical validation remain areas of active research and development [ 6 , 64 ]. On the other hand, topological machine learning (ML) presents promising solutions to address the limitations of DL models. Its primary strength lies in its ability to systematically analyze complex spatial relationships within images, surpassing traditional pixel-based analysis [ 65 , 66 ]. Topological methods delve into the inherent structure of data, providing deeper insights into intricate anatomical features and their connections. Unlike DL models, which rely on predefined architectures, topological ML adapts more flexibly to diverse data complexities and irregularities [ 35 ]. Moreover, these techniques offer robustness against noise and yield more interpretable outcomes, crucial in medical contexts where transparency and reliability are critical. Furthermore, DL models are adept at capturing intricate local spatial relationships within images, whereas topological data analysis (TDA) methods offer a holistic viewpoint by globally analyzing data, thus providing complementary in-sights to DL features. By integrating topological insights with DL models, medical image analysis stands to gain improved accuracy, sensitivity to subtle changes, and a comprehensive understanding of biological structures, thus advancing precise diagnostics and treatments. In this paper, we aim to demonstrate the effectiveness of topological methods in medical image analysis and high-light their synergistic potential with DL models by demonstrating their practical applications. While the incorporation of topological features with graph neural networks (GNNs) has been a very active area of research in graph representation learning [ 39 , 77 ], the potential synergy of combining these features with DL models in computer vision and medical image analysis remains largely unexplored. With the adaptation of topological features, we aim to enhance the capabilities of DL models for computer-aided diagnosis. We study the performance of integration of topological features to pre-trained DL models in breast cancer screening, which is the most prevalent cancer in women [ 70 ]. Our experiments showed that topological features consistently give a significant boost to the performance of various convolutional neural networks (CNN) and vision transformer (VT) models. Furthermore, the choice of filtration type is the key question in persistent homology (PH) to produce effective topological features. We establish that for image data, an elegant duality pattern emerges, indicating that sub-level and superlevel filtrations produce virtually identical output for cubical persistence. Our contributions can be summarized as follows: ⋄ We investigate the effectiveness of incorporating topological features to enhance DL models for computer-aided diagnosis, showing that this integration results in statistically significant improvements in performance across ultrasound and other medical imaging tasks. ⋄ We further demonstrate the value of topological features in addressing critical challenges in breast cancer diagnostics, such as limited data and interpretability . ⋄ We prove the Alexander duality theorem for cubical persistence, showing that sublevel or superlevel filtrations yield virtually identical output for image data. This result significantly enhances the applicability of TDA in image analysis by effectively halving the computation time. 2. Related Work 2.1. Deep Learning in Breast Cancer Diagnosis Breast cancer stands as a formidable challenge for women, lacking a definitive cure to date. However, the emergence of DL techniques has introduced promising avenues in breast cancer screening, diagnosis, and prognosis. These methods have demonstrated remarkable efficacy in identifying breast cancer early on, thereby enhancing the prospects of patient survival [ 57 ]. Notably, DL surpasses traditional ML approaches by demanding minimal human intervention while achieving comparable levels of feature extraction [ 61 ]. Over the years, the main methods to detect breast cancer have been through various methods like mammography [ 3 ], histopathology [ 59 ], positron emission tomography (PET) [ 16 ], digital breast tomosynthesis (DBT) [ 8 ], ultrasound [ 52 ], CT [ 43 ], and MRI [ 48 ]. For a thorough review of these approaches, see excellent surveys [ 1 , 32 , 36 ]. Among these approaches, breast ultrasound stands out as a low-cost, user-friendly, radiation-free, portable technique, particularly adept at differentiating between cystic and solid breast masses. Recent advancements in DL methods for breast cancer diagnosis through ultrasound screening have shown considerable promise for clinical implementation, as evidenced by several studies in recent years [ 20 , 25 ]. In the past couple of years, the latest DL models in image analysis, namely vision transformers (VTs), have demonstrated remarkable success in the field [ 7 , 26 , 53 ]. Furthermore, several recent reports have indicated that DL-based evaluation of breast ultrasound is comparable to that of a human radiologist [ 23 , 62 ]. In this paper, we aim to demonstrate the efficacy of topological features in enhancing the performance of DL methods in medical imaging, specifically in breast cancer screening using ultrasound images. 2.2. TDA in Medical Image Analysis PH has been quite effective for pattern recognition in image and shape analysis in the past two decades. In medical image analysis, PH produced power results in cell development [ 47 ], tumor detection [ 19 ], histopathology [ 51 , 76 ], neuronal morphology [ 41 ], brain functionality analysis [ 12 ], functional MRI (fMRI) data [ 55 ], and genomic data [ 54 ]. For a thorough review of TDA methods in biomedicine and medical imaging, see the excellent surveys [ 65 , 67 ]. For a collection of TDA applications in several domains, see TDA Applications Library [ 28 , 29 ]. Recently, there has been a surge of interest in topological deep learning within the ML community, showing great potential to augment existing DL methodologies [ 49 , 80 ]. The effective utilization of topological features has notably enhanced CNN models, particularly in tasks such as image segmentation [ 17 , 58 , 69 , 75 ]. More-over, there is growing recognition of the pivotal role of topological features in diagnostic tasks across various medical domains [ 31 , 40 , 42 , 68 ]. In the case of breast cancer detection, recent works have effectively utilized TDA methods for mammogram and MRI screening [ 50 , 74 ]. While they incorporate TDA output into DL models to regularize the loss function, our approach is more direct. In our study, we directly integrate topological features into DL architectures to improve the latent embeddings to demonstrate their effectiveness, particularly in breast cancer diagnosis. 3. Methodology In this section, we first present the methodology for extracting topological features from an image using cubical persistence. Next, we elaborate on our ML models, wherein we incorporate these features into DL models. Then, we prove Alexander duality result between sublevel-superlevel filtrations for cubical persistence. 3.1. Cubical Persistence PH in TDA reveals patterns in complex datasets by analyzing shapes at multiple resolutions [ 18 ]. While effective for various data formats, we focus on its application in image analysis through cubical persistence . PH involves three steps: (1) generating nested topological spaces ( Filtration ), (2) capturing topological changes ( Persistence Diagrams ), and (3) transforming these diagrams into ML-ready vectors ( Vectorization ) [ 24 ]. Step 1 - Constructing Filtrations Since PH essentially functions as a mechanism for monitoring the progression of topological characteristics within a sequence of simplicial complexes, constructing this sequence stands out as a crucial step. In image analysis, the common approach involves generating a nested sequence of binary images, also known as cubical complexes . To achieve this from a given grayscale image χ (with dimensions r ×s ), grayscale values γ ij of individual pixels Δ ij ⊂ χ are utilized. Specifically, for a sequence of grayscale values (0 = t 1 < t 2 < · · · < t N = 255), a nested succession of binary images χ 1 ⊂ χ 2 ⊂ · · · χ N is obtained, where χ n ={Δ ij ⊂ χ| γ ij ≤ t n } (See Figures 1 and 2 ). In essence, this involves starting with a blank r × s image and progressively activating (coloring black) pixels as their color values reach the specified threshold t n . This process, known as sublevel filtration , is conducted on χ relative to a designated function (in this instance, grayscale). Alternatively, one can activate pixels in a descending order, referred to as superlevel filtration . In other words, let 𝒴 n = {Δ ij ⊂ χ | γ ij ≥ s n } for (255 = s 1 > s 2 > · · · > s M = 0), and 𝒴 1 ⊂ 𝒴 2 ⊂ · · · ⊂ 𝒴 M is called superlevel filtration. Download figure Open in new tab Figure 1. For the 5 × 5 image χ , the sublevel filtration is the sequence of binary images χ 1 ⊂ χ 2 ⊂ χ 3 ⊂ χ 4 ⊂ χ 5 . Download figure Open in new tab Figure 2. On the left, we have a sample ultrasound image χ from BUS-BRA dataset. Next three images χ 60 , χ 90 , and χ 120 are binary images in the filtration where in χ k , pixels with grayscale values ≤ k are activated (marked black), while all other pixels remain white. Step 2 - Persistence Diagrams PH tracks the evolution of topological features within the filtration sequence {χ n } and represents it as a persistence diagram (PD). Specifically, if a topological feature σ emerges in χ m and vanishes in χ n with 1 ≤ m < n ≤ N , the thresholds t m and t n are termed the birth time b σ and death time d σ of σ , respectively ( b σ = t m and d σ = t n ). Hence, PD comprises all such 2-tuples PD k (χ) = {( b σ , d σ )} where k denotes the dimension of the topological features. The duration d σ ™ b σ is referred to as the lifespan of σ . Formally, the k th persistence diagram can be defined as PD k ( χ) = {( b σ , d σ )| σ ∈ H k (χ n )for b σ ≤ t n < d σ }, where H k ( χ n ) represents the k th homology group of the cubical complex χ n . Thus, PD k (χ) comprises 2-tuples indicating the birth and death times of k -dimensional voids { σ } (such as connected components, holes, and cavities) in the filtration sequence {χ n }. For example, for χ in Figure 1 , PD 0 (χ) = (1, ∞ ), (1, 2), (1, 2), (1, 3) } denotes the connected components, while PD 1 (χ) = {(2, 4), (3, 5), (4, 5)} represents the holes in the corresponding binary images in Figure 1 . Step 3 – Vectorizations Persistence Diagrams (PDs), consisting of collections of 2-tuples, are not inherently practical for utilization with ML tools. Instead, a common strategy is to transform PD information into a vector or function, a process referred to as vectorization [ 5 ]. A commonly employed function for this purpose is the Betti function , which monitors the quantity of alive topological features at each threshold. In particular, the Betti function is a step function where β 0 ( t n ) denotes the count of connected components in the binary image χ n , and β 1 ( t n ) indicates the number of holes (loops) in χ n . In ML contexts, Betti functions are typically represented as vectors of size N with entries β k ( t n ) for 1 ≤ n ≤ N , defined as . For instance, in Figure 1 , we observe , which denotes the count of connected components in the binary images {χ i }, while , represents the counts of holes in i , i.e., β 0 (1) = 4 signifies the count of components in χ 1 , and β 1 (3) = 2 denotes the count of holes (loops) in χ 3 . There are several approaches for converting PDs into vector representations, such as Persistence Images [ 2 ], Persistence Landscapes [ 11 ], Silhouettes [ 14 ], and kernel-based methods [ 5 ]. Here, we use Betti functions due to their computational efficiency and interpretability. Furthermore, Betti functions serve not only as vector representations but also as sequences summarizing the number of topological features in the filtration sequence, making them well-suited for use with transformers to enhance information extraction. We also employ Persistence Images (Appendix A.5) to study the impact of vectorization on model performance. 3.2 ML Models In this section, we outline our ML models, focusing on approaches that leverage topological features. To evaluate the impact of these features on model performance, we first introduce a baseline model, Topo-ML. This model avoids deep learning, using a traditional ML classifier applied solely to the topological features. Topo-ML is computationally efficient, interpretable, and ideal for scenarios with limited data, thanks to its reliance on direct embeddings. We then present two distinct architectures that integrate these topological features into pre-trained CNN and VT models, enabling deeper exploration of their contributions in more complex frameworks. Topo-ML model In our basic Topo-ML model, we assessed the standalone performance of topological features using Betti vectors as input. For classification, we employed two standard ML models: eXtreme Gradient Boosting (XG-Boost) [ 15 ], Multilayer Perceptron (MLP) [ 22 ] and Transformer Encoder [ 73 ]. These models are well-suited for handling high-dimensional data, with MLP often excelling in scenarios with large or imbalanced datasets, while XGBoost is known for its robust performance across diverse conditions. A summary of our model structure is shown in Figure 9 , and detailed descriptions of our ML procedures, including hyperparameter tuning, are provided in Section 4 . Topo-CNN model In our second model, Topo-CNN ( Figure 3 ), we evaluated the impact of incorporating topological features with pre-trained CNN models. The rationale is that topological features capture the image’s global patterns, while convolutional features focus on localized details. By combining these, we aim to achieve synergistic effects that enhance performance. Specifically, we employed two distinct vectorization methods for topological features to test their effectiveness in deep learning: Betti functions and Persistence Images (PIs). This led to two model variants: Betti-CNN (B-CNN), which uses Betti vectors, and PI-CNN, which incorporates persistence images (Appendix A.5). Download figure Open in new tab Figure 3. Topo-CNN framework merges the topological features of images with convolutional vectors derived from a pre-trained CNN model, followed by further processing via a fully connected layer. In our PI-CNN model , persistence images are used as topological features and processed through a 2D MLP. In our Betti-CNN model, persistence images are replaced with Betti vectors, which are processed through a 1D MLP. The Topo-CNN model framework involves selecting a CNN backbone from a collection of state-of-the-art architectures ( Section 4.2 ). To analyze the contribution of topological vectors within the DL framework, we employed a simple architecture: convolutional vectors are concatenated with topological vectors after passing through an MLP layer. A flowchart of this model is shown in Figure 3 , with hyperparameters and further details provided in Section 4.2 . Topo-VT model In our third model, Topo-VT ( Figure 4 ), we integrate topological features with a vision transformer architecture. This approach leverages the strengths of both global representations, enabling them to complement each other and enhance performance. By facilitating communication between the feature representations of the transformer stages and a transformer-encoded version of topological features, we aim to improve model efficacy. Download figure Open in new tab Figure 4. Topo-VT framework fuses topological features with ViT, applying Betti vector encodings after each stage via cross-attention to incorporate topological insights. The Topo-VT architecture uses the SwinV2 back-bone [ 45 , 46 ] and introduces Betti vector encodings after each stage to complement the model’s global properties through cross-attention. Each Betti vector for connected components and for loops—has its own transformer encoding. We first apply to the feature map after each stage, followed by using cross-attention. Given that Betti vectors are sequential data derived from cubical filtration ( Section 3.1 ), transformer encoders are well-suited for integrating topological and transformer-based representations. A flowchart of the model is shown in Figure 4 . 3.3. Alexander Duality for Cubical Persistence When employing PH in practical applications, how the filtration is constructed stands out as the most crucial aspect of the process ( Section 3.1 ). For computational efficiency, the sublevel/superlevel filtration method is most preferable, utilizing a suitable filtering function on the data. Particularly in a graph setting, sublevel and superlevel filtrations can yield vastly different outputs depending on the filtering function utilized, and the model’s performance can hinge on the chosen filtration [ 13 ]. Hence, users typically need to examine both filtrations in most TDA applications . In the following, we demonstrate that the sublevel and superlevel filtrations produce virtually identical outputs in complementary dimensions for PH with cubical complexes . As a result, unlike in the graph setting, the choice between sublevel and superlevel filtration for image analysis has no importance, as long as all relevant dimensions’ outputs are used. We establish this result by adapting Alexander Duality to this context. In particular, we prove the following: Theorem 1 Let χ be a cubical complex of dimension d, and f be the filtering function on χ. Let be its extended image with Then, the persistence diagrams for the sub-level and superlevel filtration of with respect to in complementary dimensions are equivalent . The proof of the theorem and the further details are given in Appendix B. Here, the extended image condition is to make sure that the pixels (or voxels) at the boundary of the image have dark or light color. In particular, if the image has already a dark or light background, this condition is automatically satisfied. To illustrate this duality, we present the Betti curves for an ultrasound image using both sublevel and superlevel filtrations ( Figure 5 ). Download figure Open in new tab Figure 5. Betti-0 and Betti-1 curves using sublevel and superlevel filtrations for an ultrasound image from the BUS-BRA dataset. As Theorem 1 indicates, sublevel Betti-0 (a) and superlevel Betti-1 (b) curves show mirrored patterns, as do sublevel Betti-1 (c) and superlevel Betti-0 (d) curves. One way to interpret our result is that if one uses the sublevel filtration for PH with cubical complexes and uses all the relevant dimensions, then there is no need to check superlevel filtration in the same setting . In practice, this cuts the computation time by half, and boosts the applicability of TDA methods in image analysis. 4. Experiments 4.1. Datasets In our research, we utilized three publicly accessible breast ultrasound datasets (see Table 1 ). The first dataset, known as BUSI [ 4 ], comprises 780 breast ultrasound images collected from 600 women aged 25 to 75 years old. The second ultrasound dataset, BUS-BRA [ 30 ], comprises 1875 anonymized images from 1064 female patients. The third ultrasound dataset, MENDELEY [ 56 ] consists of 250 breast cancer images, including 100 benign and 150 malignant cases. In addition to these, to show the applicability of our Topo-DL models in different image formats, we employed three other datasets from the MedMNIST collection [ 78 ], namely RETINAMNIST (Fundus images), PneuMNIST (Chest X-ray) and BloodMNIST (Blood Cell) (see Table 8 ). View this table: View inline View popup Download powerpoint Table 1. Characteristics of breast cancer ultrasound datasets. 4.2. Experimental Setup We provide details of our datasets in Table 1 . It is important to note that the majority of datasets do not come with a predefined train-test split. Hence, many models utilized their own train-test splits. In this study, we employed 5-fold CV in all datasets except BUSI (3 class) which has a pre-defined split - 10-fold CV. Furthermore, each experiment was run 20 times with different seeds, and the average results were reported in Table 2 , and Table 9 . View this table: View inline View popup Download powerpoint Table 2. Topo-CNN results. Performance comparison between vanilla-CNN and Topo-CNN models (Betti-CNN and PI-CNN) for breast ultrasound datasets. For each dataset, the best two accuracy and AUC improvements are marked blue . In each block, the best performance is underlined . The statistical significance of each improvement is given in Tables 13 and 14 in the appendix. We did not use any data augmentation method in this study as the topological features extracted are invariant under rotations or flips and demonstrate robust performance on small and unbalanced datasets. As a result, our TDA models do not require any form of data augmentation or preprocessing. This aspect contributes to the computational efficiency of our models while maintaining a high level of robustness against minor image alterations. Our implementation is available at the following link: https://github.com/BrightonNuwagira/topo_vt Topological Features We first resized each ultrasound image χ to 224 × 224, then generated topological feature vectors using a sublevel filtration, χ 1 ⊂ χ N , based on grayscale pixel values (see Section 3.1 ). With N = 100 thresholds evenly dividing the color interval [0, 255], we produced 200-dimensional feature vectors by combining Betti vectors and , each with 100 dimensions. We also used Persistence Images as vectorization, where the details are given in Appendix A.5. Topo-ML Hyperparameters In our basic model Topo-ML ( Figure 9 ), we simply use XGBoost, MLP, and Transformer classifiers with the induced Betti vectors across all datasets. In the case of XGBoost, we adopted parametric tuning strategies. This approach involved configuring the learning rate to 0.1 and limiting the maximum depth to 5. As for the MLP architecture, it comprised a single input layer followed by two hidden layers, each containing 256, and 128 neurons respectively, all utilizing the RELU activation function. We also included an output layer in the architecture. The training of MLP models encompassed 100 epochs, employing a batch size of 64 for all datasets. We used Adam optimizer and retained the default settings for the remaining parameters. For Transformers, we used the same hyperparameter setting with the transformer encoder in Topo-VT model. CNN Backbones In our study, we investigated the alignment between topological features and current DL models using the architectures outlined in Section 3.2 . Our rationale stems from the notion that while topological features capture global patterns within images, convolutional vectors focus more on local patterns. For the evaluation of our Topo-CNN models, we selected well-known CNN backbones, ResNet50, ResNet101 [ 34 ], Efficient-NetB0 [ 72 ], InceptionV3 [ 71 ], InceptionResNetv2 [ 71 ], MobileNetV2 [ 37 ], DenseNet121 [ 38 ], or VGG16 [ 63 ]. For Topo-VT model, we used SwinV2 [ 46 ]. Topo-CNN Hyperparameters Our Topo-CNN model ( Figure 3 ) integrates a pre-trained CNN with additional frozen layers, enhanced by a 1D Multi-Layer Perceptron (MLP). The augmented CNN includes a convolutional layer with 64 filters of size (3, 3) and ReLU activation, followed by a max-pooling layer with a pool size of (2, 2), a flattening layer, and a dense layer with 64 neurons. Simultaneously, the 1D MLP contributes with three dense layers having 800, 256, and 128 neurons respectively, all utilizing the ReLU activation function. The concatenated outputs from both models are further processed by fully connected layers, including 256, 128, and 128 neurons each with ReLU activation, culminating in the model’s final output. To investigate the utility of different vectorizations for topological features, we also employed Persistence Images (PI), and replaced Betti vectors with PI vectors. We give the details of this model (PI-CNN) in Appendix A.5. Topo-VT Hyperparameters Our transformer architecture ( Figure 4 ) uses the pre-trained SwinV2 model [ 46 ] with all layers unfrozen for end-to-end learning. We extract feature maps from each Swin stage, compute Betti vector encodings and , project them onto stage features, and apply cross-attention. The enriched features are then fed into the Swin head for baseline comparison. The model was trained for 100 epochs and using the AdamW optimizer with learning rate 1e-4, weight decay of 0.9, and dropout rate of 0.1. As previously stated, both Topo-Swin and the Betti encoders were trained together. In the Betti Transformer Encoder, each Betti vector has its own trainable encoder. Although Betti vectors are sequential data, they cannot be encoded to be at a specific patch of the image, so we let the model learn what the best positional encodings are. We utilize a Transformer Encoder which projects the Betti vectors to dimension 512. The encoders were trained with 4 heads, 4 layers, with a feed-forward dimension of 256, a dropout rate of 0.1, and ReLU activation. The encoders are trained end-to-end along with the Topo-Swin. Runtimes The time taken to generate topological features for the BUS-BRA dataset (consisting of 1875 images sized 275×375) on a personal laptop was 15 minutes for Betti vectors and 2.5 hours for persistence images. These computations were conducted on a personal laptop equipped with a 12th Gen Intel(R) Core(TM) i7 12650H processor clocked at 2.30 GHz, and supported by 64.0 GB of RAM. After the extraction of topological features, the overall average runtime for the Topo-CNN models was less than 3 hours on the same laptop. Performance Metrics We primarily used accuracy and ROC-AUC to evaluate model performance, but also report additional metrics, including F1 score, precision, and recall, in Appendix A.3. 4.3. Results In this part, we discuss the results of our models utilizing topological features in different ways. Topo-ML Model As previously mentioned, the Topo-ML model ( Figure 9 ) shows the standalone performance of topological vectors. Its primary advantages lie in its interpretability and computational efficiency. While its performance may not excel across all datasets, this straight-forward model offers a viable solution, particularly when data scarcity hampers the training of more complex CNN models. We present our Topo-ML results with different classifiers in Table 9 . The performance of Topo-ML often aligns with several vanilla-CNN models in terms of accuracy. However, in terms of AUC, the Topo-ML model generally lags behind CNN models. Topo-DL Models In these models, our primary aim is to assess how topological features impact the enhancement of pretrained CNN and VT model performance. Our hypothesis posits that while DL models excel at capturing local image features, TDA grasps global features, offering complementary insights to DL models. Our findings, as depicted in Tables 2 and 3 , clearly support this hypothesis. View this table: View inline View popup Download powerpoint Table 3. DL vs. Topo-DL. Performance comparison of vanilla DL models vs. Topo-DL models for breast ultrasound datasets. The last two columns show average improvements in accuracy and AUC. For each dataset, highest performances are given in bold . Table 2 presents the results of our Topo-CNN model, showing that topological features consistently improve CNN performance across all datasets and backbone architectures. Incorporating topological features yields consistent accuracy and AUC gains of up to 6% for several back-bones. Additionally, F1-scores for these models are reported in Table 11 . Table 3 summarizes the performance across all models, with the rightmost columns highlighting the average improvements contributed by topological features to pretrained deep learning models. We observe up to 5% and 3% average gains in accuracy and AUC, respectively. Given that these models are already pre-trained, these results indicate that topological features provide additional, valuable information that enhances the performance of these highly optimized models. Notably, the state-of-the-art VT model outperforms all CNN models in this setting, yet topological features still significantly boost the performance of these advanced architectures. Furthermore, our Topo-VT model outperforms recent Topo-DL approaches (Appendix A.2). These results underscore the considerable potential for performance enhancement through the fusion of topological and DL features, even with a basic approach to inject topological features in CNN models. With tailored modifications based on specific domains, these findings suggest significant avenues for further performance gains leveraging the synergy between topological and DL features. Limited Data Setting We evaluated the effectiveness of topological features in limited data settings by randomly splitting the datasets into an 80:20 train-test ratio. With the test set held constant, we reduced the training set to 10, 20, and 50 images per class to evaluate performance with varying levels of limited data. Our results in Table 4 show that topological features significantly enhance DL model performance, especially when training data is limited. These findings demonstrate the model’s robustness in low-data settings. Unlike traditional DL approaches, which often rely heavily on large datasets, topological features embed images directly into a latent space, reducing dependence on training set size. View this table: View inline View popup Download powerpoint Table 4. Performance with Limited Data: AUC scores for three models—TOPO (Betti vectors only), CNN (ResNet50), and TOPO-CNN (combined approach)—evaluated on the same test set with training data limited to 10, 20, or 50 samples per class. In few-shot learning or data-scarce conditions, our results indicate that topological features can improve model accuracy by providing reliable representations and stable anchors for each class, emphasizing their practical value in medical imaging, where labeled data is often scarce. Topo-CNN in other medical domains While we mainly focus on the breast ultrasound setting to maintain a clear scope, we also demonstrate the versatility and adaptability of our topological vectors and Topo-CNN model by showcasing their performance across various medical image formats. Utilizing the MedMNIST dataset [ 78 ], we employed three benchmark datasets RetinaMNIST (Fundus images), PneuMNIST (Chest X-ray) and BloodMNIST (Blood Cell) (see Table 8 ), applying our Betti-CNN model to 128 × 128 images with predefined splits. Notably, we observe up to 15% accuracy and 23% AUC improvements on CNN models by integrating topological features ( Table 5 ). View this table: View inline View popup Download powerpoint Table 5. Topo-CNN on additional datasets. Performance comparison between vanilla-CNN and Topo-CNN models on MedMNIST datasets. For each dataset, the best two accuracy improvements are underlined , and the best two AUC improvements are marked blue . Complementary Nature of Topo & CNN models Our results confirm that topological vectors improve DL performance. To validate their complementarity, we ran an 80:20 XGBoost experiment using 200-dim topological and 128-dim ResNet50 vectors (after 100 epochs). AUC and accuracy in Table 6 show the hybrid model outperforms both. The last two columns show the number of selected features in the hybrid model, with a balanced split further supporting complementarity. View this table: View inline View popup Download powerpoint Table 6. Complementarity of Topo and CNN Features. XGBoost performance on topological and CNN vectors, showing the hybrid model outperforms each alone. The balanced feature selection in the last two columns supports their complementarity. View this table: View inline View popup Download powerpoint Table 7. Performances of Topo-ML model with sublevel and superlevel filtrations are virtually same. View this table: View inline View popup Download powerpoint Table 8. MedMNIST Dataset Details. * means varying image sizes. View this table: View inline View popup Download powerpoint Table 9. ML Classifiers. Performance of our basic Topo-ML model with XGBoost, MLP and Transformer classifiers on breast ultrasound datasets. Alexander Duality To empirically verify our Alexander duality result, we give performances of our Topo-ML model with topological vectors obtained via sublevel and superlevel filtrations. As claimed, sublevel and superlevel vectors are virtually mirror images of each other in complementary dimensions ( Figure 5 ), and using one of these settings do not have any significant effect on the performance. Statistical Analysis To ensure a robust evaluation of model performance, we utilized 5 or 10-fold cross-validation, which inherently introduces variability in the performance metrics (e.g., accuracy, AUC, and F1-score). To further investigate the hypothesis that TDA can provide insights that complement CNN models, we further implemented a rigorous statistical analysis. This involved repeating the cross-validation process 20 times for each dataset across each model architecture, including B-CNN and PI-CNN. We then conducted a one-tailed paired t-test to statistically test whether the performance improvements observed with B-CNN or PI-CNN were significant over the baseline CNN model or if they could be attributed to random variation. Predicated on the premise that B-CNN generally outperforms P-CNN, we subjected this hypothesis to the same statistical test. To mitigate potential bias in our hypothesis testing, we complemented the t-test with the non-parametric Wilcoxon signed-rank test, a more robust test that does not assume a specific data distribution. The resulting p -values, which signify statistical significance, are reported in Table 13 . Further details can be found in Appendix A.4, which provides statistical evidence that Topo-CNN models outperforms the baseline CNN models. 4.4. Interpretability of Topological Features In this section, we explore the interpretability of topological features, focusing on Betti vectors as a straightforward yet effective method for vectorizing persistence diagrams, known for their high interpretability. In Figure 7 , we present the Betti curves for the MENDELEY dataset, incorporating nonparametric confidence bands [ 27 ]. The figure reveals a distinct difference between the benign and malignant classes, particularly around β 0 (40) and β 1 (50). To interpret these features: β 0 (40) refers to the number of components in the binary image χ 100 , where 100 represents the grayscale value corresponding to the 40 th thresh-old of the 100 thresholds within the [0, 255] grayscale range. Likewise, β 1 (50) denotes the count of white spots (holes) in χ 128 , with 128 corresponding to the grayscale value at the 50 th threshold. In Fig. 6 , we show boxplots and violin plots for these values, { β 0 (40)} and { β 1 (50)}, highlighting the clear distinction between the malignant and benign classes. Also, in Fig. 8 , we display sample binary images χ 128 with the 128 grayscale threshold for both classes, where the difference in the count of white spots (i.e., β 1 (50)) is clearly visible. Download figure Open in new tab Figure 6. Boxplots with violin plots comparing the distributions of β 0 (40) and β 1 (50) coefficients of benign and malignant classes in MENDELEY dataset. Download figure Open in new tab Figure 7. 40% confidence bands for Betti-0 and Betti-1 curves for Benign and Malignant classes in the MENDELEY dataset. Bold curves represent the median for each class. Download figure Open in new tab Figure 8. Sample binary images extracted from ultrasound images in the MENDELEY dataset. These binary images {χ 128 } are generated by marking all pixels with grayscale value ≤ 128 (threshold 50/100) black ( Section 3.1 ). As suggested by Figures 6 and 7 , the malignant images exhibit a significantly higher number of white spots (holes) compared to the benign images. Download figure Open in new tab Figure 9. Topo-ML model. In our basic model, we first generate persistence diagrams for any input image. Next, we derive our topological feature vectors, which are then inputted into an ML classifier to produce classification results. 5. Conclusion We investigated the effectiveness of topological features in enhancing DL models for breast cancer screening. Notably, we found that TDA offers a distinct approach to image analysis, diverging from conventional DL models and addressing key limitations. Our findings yield two main results. First, when combined with simple ML methods, topological features offer a viable alternative to DL models due to their efficiency, interpretability, and solid performance on limited data. Second, when integrated with DL models, they significantly improve accuracy and robustness. Moving forward, we aim to leverage this potential to develop specialized tools for medical image analysis by merging TDA outputs with DL models to create advanced, reliable decision support systems for breast cancer screening and beyond. Data Availability All datasets are publicly available and links are provided in the paper. https://www.kaggle.com/datasets/subhajournal/busi-breast-ultrasound-images-dataset Acknowledgements This work was partially supported by National Science Foundation under grants DMS-2113674, DMS-2210912, DMS-2220613, and DMS-2229417. The authors acknowledge the Texas Advanced Computing Center (TACC) at UT Austin for providing computational resources that have contributed to the research results reported within this paper. http://www.tacc.utexas.edu . Appendix A. More on Experimental Results In this part, we give additional results and details of our models. A.1. MedMNIST datasets While the main part of our paper focuses on the Breast Ultrasound setting to maintain a clear scope, we also demonstrate the versatility and adaptability of our topological vectors and their significant contributions to existing deep learning models by showcasing their performance across various medical image formats. Utilizing the MedMNIST dataset [ 78 ], we employed three benchmark datasets, RETINAMNIST, PneuMNIST and BloodMNIST(see Table 8 ), applying our Betti-CNN model to 128 × 128 images with predefined splits. Note that the BreastMNIST dataset corresponds to the BUSI dataset used in this paper. The performance of our model for BUSI is detailed in the main text (see Table 2 ). A.2. Comparison with Other Topo-DL Models We conducted experiments using PHG-Net [ 50 ], and the performance comparison in terms of AUC and Accuracy is presented in Table 10 . View this table: View inline View popup Download powerpoint Table 10. Comparison of Topo-DL Models. AUC and Accuracy comparisons for PHG-Net and Topo-Swin. View this table: View inline View popup Download powerpoint Table 11. Comparison of F1-scores between CNN and Topo-CNN models. View this table: View inline View popup Download powerpoint Table 12. Performance metrics for SwinV2 and Topo-VT models. A.3. Additional Performance Metrics In medical image analysis, F1-scores is a very common metric incorporating both precision and recall. Precision (also called positive predictive value) measures the accuracy of positive predictions, while recall (also called sensitivity or true positive rate) measures the proportion of actual positives that were correctly identified by the model. The F1-score is the harmonic mean of precision and recall and is calculated as . In Table 11 , we present the F1-scores of our models. It’s worth noting that although the improvements may appear marginal, our findings in Table 13 demonstrate that most of these enhancements are statistically highly significant. A.4. Significance Test In Table 2 and Table 11 , we outlined the three performance metrics for vanilla-CNN and our Topo-CNN models, highlighting the integration of topological features into conventional CNN architectures has potential to enhance the breast cancer screening. To evaluate the statistical significance of these enhancements, we utilized two distinct methods: the t-test and the Wilcoxon signed-rank test. The results, including all p -values, are documented in Table 13 and Table 14 . A significant majority of these p -values fell below the 0.05 threshold, indicating statistical significance, and are accordingly highlighted in blue for easy identification. View this table: View inline View popup Download powerpoint Table 13. Summary of p -values derived from t-tests indicating the performance disparity between vanilla-CNN and Topo-CNN models (Betti-CNN and Persistence Image-CNN) through t-test for BUSI, BUS-BRA, and MENDELEY datasets. To condense, we denote e n as 10 n . Outcomes with p < 0.05 are statistically significant and are highlighted in blue. View this table: View inline View popup Download powerpoint Table 14. Summary of p -values derived from Wilcoxon signed-rank test indicating the performance disparity between vanilla-CNN and Topo-CNN models (Betti-CNN and Persistence Image-CNN) through t-test for BUSI, BUS-BRA, and MENDELEY datasets. To condense, we denote e n as 10 n . Outcomes with p < 0.05 are statistically significant and are highlighted in blue. Our analysis showed that the B-CNN model outperformed the standard CNN model with a notable margin, as evidenced by the prevalence of blue in its respective subsection. Similarly, the P-CNN model demonstrated a significant improvement over the conventional CNN, with more than half of the comparative tests yielding significant results, also marked in blue. When comparing P-CNN against B-CNN, our findings suggest a superior performance by B-CNN, particularly on the BUSI and BUS-BRA datasets. To conclude, the statistical evidence supports that both Topo-CNN models, namely P-CNN and B-CNN, significantly surpass the baseline CNN model in terms of performance by leveraging topological features. Despite this, the performance gap between P-CNN and B-CNN, while present, often does not reach statistical significance, suggesting a nuanced comparison that varies by dataset and context. A.5. Persistence Images and PI-CNN model To explore the effect of vectorization on our models, we also employed a different vectorization to replace Betti vectors in our models. Persistence Images Persistence Images is one of the most common vectorization methods in TDA, introduced by Adams et al. [ 2 ]. Unlike most vectorizations, Persistence Images, as the name suggests, produce 2 D -arrays (tensors). The idea is to capture the location of the points in the PDs with a multivariable function by using the 2 D Gaussian functions centered at these points. For PD ( G ) = {( b i , d i )}, let ϕ i represent a 2 D -Gaussian centered at the point ( b i , d i ) ∈ ℝ 2 . Then, one defines a multivariable function, Persistence Surface , where w i is the weight, mostly a function of the life span d i − b i . To represent this multivariable function as a 2 D -vector, one defines a k × l grid (resolution size) on the domain of , i.e., threshold domain of PD ( G ). Then, one obtains the Persistence Image , a 2 D -vector (matrix) of size k × l such that where Δ rs = pixel with index rs in the k × l grid. Note that the resolution size k × l is independent of the number of thresholds used in the filtering; the choice of k and l is completely up to the user. There are two other important tuning parameters for persistence images, namely the weight w i and the variance σ (the width of the Gaussian functions). Like Silhouettes, one can choose w i = ( d i ™ b i ) p to emphasize large or small features in the PD. Similarly, the width parameter σ determines the sharpness of Gaussian, where smaller σ would make the Gaussian functions more like Dirac δ-function, and larger σ would make the Gaussians flat. Depending on the context, σ can be chosen a constant (e.g. σ = 0.1) or depending on the point ( b i , d i ), e.g., σ i = k ( d i − b i ) for some constant k > 0. Hyperparameters for PI-CNN model For each image χ, we first generated two 50 by 50 persistence images 𝒫ℐ 0 (χ) and 𝒫ℐ 1 (χ) corresponding to homology groups 0 and 1 respectively. These two persistence images were concatenated to obtain 50 by 100 matrix, which serves as a topological representation for each 2D image. Our PI-CNN model (Figure Figure 3 ) integrates a pretrained CNN with inputs of size 224 × 224 with additional frozen layers, enhanced by a 2D Multi-Layer Perceptron (2D MLP). The augmented CNN includes a convolutional layer with 64 filters of size (3, 3) and ReLU activation, followed by a max-pooling layer with a pool size of (2, 2), a flatten layer, and a dense layer with 64 neurons. Simultaneously, the 2D MLP consists of a convolutional layer with 32 filters of size (3, 3), a max pooling layer of size (2, 2), a flatten layer, and a dense layer with 128 neurons using ReLU activation. The concatenated outputs from both models are further processed by fully connected layers, including 256, 128, and 128 neurons each with ReLU activation, culminating in the model’s final output. B. Alexander Duality for Cubical Persistence In this section, we show the duality between sublevel filtration and superlevel filtration for cubical persistence. We note that in [ 9 ], the authors prove a duality result for cubical complexes, however their duality results are completely unrelated to ours. In their work, the authors study pixel connectivity in cubical complexes and construct dual graph filtrations for given cubical complex filtration. In our case, we relate one cubical complex filtration to another one (sublevel-superlevel) and show their duality in complementary dimensions. First, we recall some earlier results from algebraic topology, which is essential for the proof. Next, we give the setup and introduce the notation which we use in upcoming sections. B.1. Preliminaries In this part, we recall some of the well-known results which we use in the proof of the duality theorem [ 33 ]. Lemma 2 (Alexander Duality) Let χ be a compact, locally contractible subspace of d-sphere S d . Then , where represents reduced (co)homology . Since we only use field coefficients F in persistence modules, the Universal Coefficients Theorem [ 33 ] comes in a very simple form as follows. Lemma 3 (Universal Coefficients Theorem) Let F be a field. Then, for any k , Next, we will need the following duality result between persistent homology and persistent cohomology [ 21 ]. Lemma 4 (Persistent Cohomology) For a given filtration {χ n }, persistent homology (H k ( χ i ) → H k ( χ j ) ) and persistent cohomology (H k ( χ i ) ← H k ( χ j ) ) have identical barcodes: Finally, we quote the celebrated result on the uniqueness of the barcode decomposition in persistence module [ 10 ]. Lemma 5 (Krull-Schmidt Theorem) Any finite-dimensional persistence module has a unique (up to isomorphism) decomposition into indecomposable modules . In other words, the dimension of the homology groups { H k (χ i )}, and ranks of the homomorphisms φ ij : { H k (χ i ) → H k (χ j )}, uniquely determines the persistence barcode. Here, each bar in the persistence barcode corresponds to an indecomposable module in the theorem. B.2. Notation and Setup In the following, we will work with 3 different cubical complexes (CC): The original CC χ, the extended CC , and the extended sphere . The image χ : Let χ be a d -dimensional cubical complex of resolution Let η = ( η 1 , η 2 , …, η N ) represent the index of the voxels in the cubical complex χ, i.e., 1 ≤ η j ≤ r j . By abusing the notation, we will call the collection of voxels in χ as ℛ = {Δ η }. Let f : ℛ → ℝ be the filtering function assigning each voxel Δ η with corresponding (color) value f ( η ). Let m = min f and M = max f . Notice that the only interesting persistence diagrams for d -dimensional cubical complex are k = 0, 1, 2, …, d ™ 1 as for k ≥ d , PD k (χ) is trivial. The extended (padded) image : First, we induce a slightly larger complex of resolution with indices η = ( η 1 , η 2 , …, η N ) again where 0 ≤ η j ≤ r j + 1. In other words, we attach a padding of thickness-1 along the boundary of our original cubical complex χ. Then, we extend f to such that for any η ∈ ℛ , and for any , e.g., the value of for any voxel in the boundary shell . The extended sphere : Our second extension is to double topologically and obtain a d -sphere . In particular, glueing two d -balls along their boundaries with an identity map gives a d -sphere [ 33 ]. Here, we do the same by taking an exact copy of and glue it to the original one along the boundary. Hence, we double the number of voxels in , and we have a new index set . Again, we extend f to as before. i.e., for any η ∈ R , and for any . In other words, in the and d -sphere is defined as M for any voxel in . In the following, we will represent k th persistence diagram for sublevel filtration as and k th persistence diagram for superlevel filtration as . Proof of the Theorem Now, we are ready to prove our main duality result. In the following theorem, we prove the equivalence of persistence diagrams of sublevel and superlevel filtrations in complementary dimensions. In Remark 7, we give the explicit description of the correspondence between the bars in these persistence barcodes. Theorem 6 Let χ be a cubical complex of dimension d, and f be the filtering function on χ. Let be its extended image with . Then, the persistence diagrams for the sub-level and superlevel filtration of with respect to in complementary dimensions are equivalent . Proof: We prove the theorem in 2 steps. In the first step, we prove the duality in the sphere setting . In this version, we prove the equivalence between the reduced persistence diagrams which means that for dimension k = 0, the main barcode corresponding to the connected component with infinite lifespan is removed. Then, in the second step, we adapt this result to extended images setting and finish the proof. Step 1: Let be the extended sphere of, and f be the corresponding extension of . Then, the following reduced persistence diagrams are equivalent: Proof of Step 1: Let t 0 < t 1 = min f < t 2 < · · · < t N −1 < t N = max f be the threshold set for f . Let . As before, define the sublevel filtration for such that . Similarly, let . Now, the superlevel filtration can be defined as , ie., . Note that to avoid crowding the notation, we slightly modify superlevel filtration with strict inequality . This only shifts the indexes by one from the original superlevel filtration ( Section 3.1 ). By definition, we have . Recall that is a d -sphere. Hence, by Alexander duality (Lemma 2), for any 0 ≤ k ≤ d − 1, we have Notice that the Alexander duality uses reduced homology, hence infinite barcode for k = 0 is removed in this correspondence. Now, consider the persistent cohomology induced by the filtration , where as for i < j . Notice that by the naturality of H k ( χ; F ) = Hom( H k ( χ; F ), F ) (Lemma 3), we have the following commutative diagram: Now, we claim that k th persistent homology module for is equivalent to ( d − k − 1) th persistent cohomology module of . By Equation 1 , we have the dimensions of the corresponding homologies are same . By Equation 2 , we have ranks of the maps and are the same. Since the persistence barcode is uniquely determined by these dimensions and the ranks (Lemma 5), we have that the corresponding persistence diagrams are equivalent . i.e., Now, to finish the proof of Step 1, we need to show equivalence of the persistent cohomology with the persistent homology for superlevel filtration . This step directly follows from the duality of persistent homology and cohomology (Lemma 4) as follows: For superlevel filtration, we use the . Similarly, for persistent cohomology, we use the same filtration in reverse order . Then, by Lemma 4, their barcodes are identical: Note that to avoid crowded notation, we defined n with f ( η ) > t n condition, while the original superlevel filtration has 𝒳 n with f ( η ) ≥ t n . Hence, in our setup f ( η ) > t n is equivalent condition to f ( η ) ≥ t n +1 . Therefore, for any with our convention shifts each barcode by one ([ b, d ) → ([ b +1, d +1)) from the original superlevel . Hence, we have the equivalence: The proof of Step 1 follows from Equations 3 , 4 , 5 . □ Step 2: Proof of Step 2: After Step 1, all we need to do is to relate the homology groups in the persistence modules induced by the extended spheres and the extended images . Recall that is obtained by doubling . Hence, is an open ball, say U . By applying Mayer-Vietoris sequence to , we see that for any 0 ≤ k d ™ 2 as which is a ( d ™ 1)- sphere, and is contractible. For n < N , as removed ball U only effects the homology class corresponding to which is nontrivial in for n < N , while it is trivial in for any n . In Alexander duality, this homology class corresponds to the complement of the main connected component, but it is trivial in extended sphere setting. Hence, in the extended image setting, we recover this dual class in as a nontrivial homology class corresponding to the infinite bar removed sphere setting. in reduced persistence diagram in Step 1. In other words, corresponds to the bar which does not exist in extended Since other dimensions are not affected, and the correspondence in k = 0 is recovered as explained in the previous paragraph, the correspondence between the (unreduced) persistence diagrams in the extended image setting follows. □ With Step 1 and Step 2, the proof of the theorem follows. □ Remark 7 (Explicit Barcode Correspondence) In the theorem above, the explicit barcode correspondence is as follows: Let the sublevel filtration is defined as with consists of voxels Δ η with f ( η ) ≤ t n . Let the superlevel filtration for the same threshold set is defined as with consists of voxels Δ η with f ( η ) t n . Then, if σ represents a k-dimensional topological feature in the sublevel filtration { χ n } with barcode [ b σ , d σ ), then the last time appears in the sequence at . The complement of is (f ( η ) > d σ ). Hence, the corresponding (dual) ( d – k ™ 1) -dimensional topological feature σ ∗ first time appears in in the sequence , i . e ., b σ ∗ = d σ . Similarly, one can show d σ ∗ = b σ . Therefore, the isomorphism can be defined as where φ([ b σ , d σ )) = [ d σ , b σ ) = [ b σ ∗ , d σ ∗ ) Notice that in superlevel filtration since the nested sequence comes with decreasing thresholds, with our convention, the birth time (b σ ∗ = t i ) is larger than the death time (d σ ∗ = t j ) in superlevel filtration. Recall that for k = 0, the infinite barcode corresponds to as explained in Step 2 above . Remark 8 (Alternative extension for ) When defining for the extended image , one can use choose the value of on all boundary voxels in as min f instead of max f. The whole proof would go through by swapping sublevel and superlevel filtrations with the function ™ f instead of f. Note that the original extended image condition on is automatically satisfied by light background images while alternative extended image condition on is automatically satisfied by dark background images. This observation is important in applications of our result . Footnotes Brighton.Nuwagira{at}utdallas.edu , Adrian.Rodriguez{at}utdallas.edu , Qiwei.Li{at}utdallas.edu References [1]. ↵ Barsha Abhisheka , Saroj Kumar Biswas , and Biswajit Purkayastha . A comprehensive review on breast cancer detection, classification and segmentation using deep learning . Archives of Computational Methods in Engineering , 30 ( 8 ): 5023 – 5052 , 2023 . 2 OpenUrl [2]. ↵ Henry Adams , Tegan Emerson , Michael Kirby , Rachel Neville , Chris Peterson , Patrick Shipman , Sofya Chepushtanova , Eric Hanson , Francis Motta , and Lori Ziegelmeier . Persistence images: A stable vector representation of persistent homology . Journal of Machine Learning Research , 18 ( 1 ): 218 – 252 , 2017 . 3, 13 OpenUrl [3]. ↵ Mugahed A Al-Antari , Mohammed A Al-Masni , Mun-Taek Choi , Seung-Moo Han , and Tae-Seong Kim . A fully integrated computer-aided diagnosis system for digital x-ray mammograms via deep learning detection, segmentation, and classification . International journal of medical informatics , 117 : 44 – 54 , 2018 . 2 OpenUrl CrossRef PubMed [4]. ↵ Walid Al-Dhabyani , Mohammed Gomaa , Hussien Khaled , and Aly Fahmy . Dataset of breast ultrasound images . Data in brief , 28 : 104863 , 2020 . 5 OpenUrl PubMed [5]. ↵ Dashti Ali , Aras Asaad , Maria-Jose Jimenez , Vidit Nanda , Eduardo Paluzo-Hidalgo , and Manuel Soriano-Trigueros . A survey of vectorization methods in topological data analysis . IEEE Transactions on Pattern Analysis and Machine Intelligence , 2023 . 3 [6]. ↵ Fouzia Altaf , Syed MS Islam , Naveed Akhtar , and Naeem Khalid Janjua . Going deep in medical image analysis: concepts, methods, challenges, and future directions . IEEE Access , 7 : 99540 – 99572 , 2019 . 1 OpenUrl [7]. ↵ Gelan Ayana and Se-Woon Choe . BUVITNET: Breast ultrasound detection via vision transformers . Diagnostics , 12 ( 11 ): 2654 , 2022 . 2 OpenUrl PubMed [8]. ↵ Jun Bai , Russell Posner , Tianyu Wang , Clifford Yang , and Sheida Nabavi . Applying deep learning in digital breast to-mosynthesis for automatic breast cancer detection: A review . Medical image analysis , 71 : 102049 , 2021 . 2 OpenUrl CrossRef PubMed [9]. ↵ Bea Bleile , Adélie Garin , Teresa Heiss , Kelly Maggs , and Vanessa Robins . The persistent homology of dual digital image constructions . In Research in Computational Topology 2 , pages 1 – 26 . Springer , 2022 . 14 OpenUrl [10]. ↵ Magnus Botnan and Michael Lesnick . An introduction to multiparameter persistence . In Representations of Algebras and Related Structures , pages 77 – 150 . 2023 . 14 [11]. ↵ Peter Bubenik and Paweł Dłotko . A persistence landscapes toolbox for topological statistics . Journal of Symbolic Computation , 78 : 91 – 114 , 2017 . 3 OpenUrl CrossRef [12]. ↵ Luigi Caputi , Anna Pidnebesna , and Jaroslav Hlinka . Promises and pitfalls of topological data analysis for brain connectivity analysis . NeuroImage , 238 : 118245 , 2021 . 2 OpenUrl CrossRef PubMed [13]. ↵ Mathieu Carrière , Frédéric Chazal , Yuichi Ike , Théo Lacombe , Martin Royer , and Yuhei Umeda . Perslay: A neural network layer for persistence diagrams and new graph topological signatures . In International Conference on Artificial Intelligence and Statistics , pages 2786 – 2796 , 2020 . 4 [14]. ↵ Frédéric Chazal , Brittany Terese Fasy , Fabrizio Lecci , Alessandro Rinaldo , and Larry Wasserman . Stochastic convergence of persistence landscapes and silhouettes . In Proceedings of the thirtieth annual symposium on Computational geometry , pages 474 – 483 , 2014 . 3 [15]. ↵ Tianqi Chen and Carlos Guestrin . Xgboost: A scalable tree boosting system . In Proceedings of the 22nd acm sigkdd international conference on knowledge discovery and data mining , pages 785 – 794 , 2016 . 4 [16]. ↵ Joon Ho Choi , Hyun-Ah Kim , Wook Kim , Ilhan Lim , Inki Lee , Byung Hyun Byun , Woo Chul Noh , Min-Ki Seong , Seung-Sook Lee , Byung Il Kim , et al. Early prediction of neoadjuvant chemotherapy response for advanced breast cancer using pet/mri image deep learning . Scientific reports , 10 ( 1 ): 21149 , 2020 . 2 OpenUrl PubMed [17]. ↵ James R Clough , Nicholas Byrne , Ilkay Oksuz , Veronika A Zimmer , Julia A Schnabel , and Andrew P King . A topological loss function for deep-learning based image segmentation using persistent homology . IEEE transactions on pattern analysis and machine intelligence , 44 ( 12 ): 8766 – 8778 , 2020 . 2 OpenUrl [18]. ↵ Baris Coskunuzer and Cüneyt Gürcan Akçora . Topological methods in machine learning: A tutorial for practitioners . arXiv preprint arxiv: 2409.02901 , 2024 . 2 [19]. ↵ Lorin Crawford , Anthea Monod , Andrew X Chen , Sayan Mukherjee , and Raúl Rabadán . Predicting clinical outcomes in glioblastoma: an application of topological and functional data analysis . Journal of the American Statistical Association , 115 ( 531 ): 1139 – 1150 , 2020 . 2 OpenUrl CrossRef [20]. ↵ Qing Dan , Ziting Xu , Hannah Burrows , Jennifer Bissram , Jeffrey SA Stringer , and Yingjia Li . Diagnostic performance of deep learning in ultrasound diagnosis of breast cancer: a systematic review . NPJ Precision Oncology , 8 ( 1 ): 21 , 2024 . 2 OpenUrl PubMed [21]. ↵ Vin De Silva , Dmitriy Morozov , and Mikael Vejdemo-Johansson . Dualities in persistent (co) homology . Inverse Problems , 27 ( 12 ): 124003 , 2011 . 14 OpenUrl CrossRef [22]. ↵ Walter H Delashmit , Michael T Manry , et al. Recent developments in multilayer perceptron neural networks . In Proceedings of the seventh annual memphis area engineering and science conference, MAESC , page 33 , 2005 . 4 [23]. ↵ Karin Dembrower , Erik Wåhlin , Yue Liu , Mattie Salim , Kevin Smith , Peter Lindholm , Martin Eklund , and Fredrik Strand . Effect of artificial intelligence-based triaging of breast cancer screening mammograms on cancer detection and radiologist workload: a retrospective simulation study . The Lancet Digital Health , 2 ( 9 ): e468 – e474 , 2020 . 2 OpenUrl [24]. ↵ Tamal Krishna Dey and Yusu Wang . Computational topology for data analysis . Cambridge University Press , 2022 . 2 [25]. ↵ Tomoyuki Fujioka , Mio Mori , Kazunori Kubota , Jun Oyama , Emi Yamaga , Yuka Yashima , Leona Katsuta , Kyoko Nomura , Miyako Nara , Goshi Oda , et al. The utility of deep learning in breast ultrasonic imaging: a review . Diagnostics , 10 ( 12 ): 1055 , 2020 . 2 OpenUrl PubMed [26]. ↵ Behnaz Gheflati and Hassan Rivaz . Vision transformers for classification of breast ultrasound images . In IEEE EMBC , pages 480 – 483 . IEEE , 2022 . 2 [27]. ↵ Jean Dickinson Gibbons and Subhabrata Chakraborti . Nonparametric statistical inference . CRC press , 2014 . 8 [28]. ↵ Barbara Giunti . TDA applications library , 2022 . https://www.zotero.org/groups/2425412/tda-applications/library . 2 [29]. ↵ Barbara Giunti , Janis Lazovskis , and Bastian Rieck . DONUT: Database of Original & Non-Theoretical Uses of Topology , 2022 . https://donut.topology.rocks . 2 [30]. ↵ Wilfrido Gómez-Flores , Maria Julia Gregorio-Calas , and Wagner Coelho de Albuquerque Pereira . Bus-bra: A breast ultrasound dataset for assessing computer-aided diagnosis systems . Medical Physics , 2023 . 5 [31]. ↵ Mustafa Hajij , Ghada Zamzmi , and Fawwaz Batayneh . Tdanet: fusion of persistent homology and deep learning features for covid-19 detection from chest x-ray images . In 2021 43rd Annual International Conference of the IEEE Engineering in Medicine & Biology Society (EMBC) , pages 4115 – 4119 . IEEE , 2021 . 2 [32]. ↵ Ghada Hamed , Mohammed Abd El-Rahman Marey , Safaa El-Sayed Amin , and Mohamed Fahmy Tolba . Deep learning in breast cancer detection and classification . In Proceedings of the International Conference on Artificial Intelligence and Computer Vision (AICV2020) , pages 322 – 333 . Springer , 2020 . 2 [33]. ↵ Allen Hatcher . Algebraic Topology . Cambridge University Press , 2002 . 14, 15 [34]. ↵ Kaiming He et al. Deep residual learning for image recognition . In CVPR , pages 770 – 778 , 2016 . 5 [35]. ↵ Felix Hensel , Michael Moor , and Bastian Rieck . A survey of topological machine learning methods . Frontiers in Artificial Intelligence , 4 : 52 , 2021 . 1 OpenUrl [36]. ↵ Essam H Houssein , Marwa M Emam , Abdelmgeid A Ali , and Ponnuthurai Nagaratnam Suganthan . Deep and machine learning techniques for medical imaging-based breast cancer: A comprehensive review . Expert Systems with Applications , 167 : 114161 , 2021 . 2 OpenUrl [37]. ↵ Andrew G Howard , Menglong Zhu , Bo Chen , Dmitry Kalenichenko , Weijun Wang , Tobias Weyand , Marco Andreetto , and Hartwig Adam . Mobilenets: Efficient convolutional neural networks for mobile vision applications . arXiv preprint arxiv: 1704.04861 , 2017 . 5 [38]. ↵ Gao Huang , Zhuang Liu , Laurens Van Der Maaten , and Kilian Q Weinberger . Densely connected convolutional networks . In CVPR , pages 4700 – 4708 , 2017 . 5 [39]. ↵ Johanna Immonen , Amauri Souza , and Vikas Garg . Going beyond persistent homology using persistent homology . Advances in Neural Information Processing Systems , 36 , 2024 . 1 [40]. ↵ Sohail Iqbal , H Fareed Ahmed , Talha Qaiser , Muhammad Imran Qureshi , and Nasir Rajpoot . Classification of covid-19 via homology of ct-scan . arXiv preprint arxiv: 2102.10593 , 2021 . 2 [41]. ↵ Lida Kanari , Paweł Dłotko , Martina Scolamiero , Ran Levi , Julian Shillcock , Kathryn Hess , and Henry Markram . A topological representation of branching neuronal morphologies . Neuroinformatics , 16 ( 1 ): 3 – 13 , 2018 . 2 OpenUrl CrossRef PubMed [42]. ↵ Ekaterina Khramtsova , Guido Zuccon , Xi Wang , and Mahsa Baktashmotlagh . Rethinking persistent homology for visual recognition . In Topological, Algebraic and Geometric Learning Workshops 2022, pages 206 – 215 . PMLR , 2022 . 2 [43]. ↵ Jieun Koh , Youngno Yoon , Sungwon Kim , Kyunghwa Han , and Eun-Kyung Kim . Deep learning for the detection of breast cancers on chest computed tomography . Clinical breast cancer , 22 ( 1 ): 26 – 31 , 2022 . 2 OpenUrl PubMed [44]. ↵ Geert Litjens , Thijs Kooi , Babak Ehteshami Bejnordi , Arnaud Arindra Adiyoso Setio , Francesco Ciompi , Mohsen Ghafoorian , Jeroen Awm Van Der Laak , Bram Van Ginneken , and Clara I Sánchez . A survey on deep learning in medical image analysis . Medical Image Analysis , 42 : 60 – 88 , 2017 . 1 OpenUrl CrossRef PubMed [45]. ↵ Ze Liu , Yutong Lin , Yue Cao , Han Hu , Yixuan Wei , Zheng Zhang , Stephen Lin , and Baining Guo . Swin transformer: Hierarchical vision transformer using shifted windows . In Proceedings of the IEEE/CVF international conference on computer vision , pages 10012 – 10022 , 2021 . 4 [46]. ↵ Ze Liu , Han Hu , Yutong Lin , Zhuliang Yao , Zhenda Xie , Yixuan Wei , Jia Ning , Yue Cao , Zheng Zhang , Li Dong , et al. Swin transformer v2: Scaling up capacity and resolution . In Proceedings of the IEEE/CVF conference on computer vision and pattern recognition , pages 12009 – 12019 , 2022 . 4, 5, 6 [47]. ↵ Melissa R McGuirl , Alexandria Volkening , and Björn Sandstede . Topological data analysis of zebrafish patterns . Proceedings of the National Academy of Sciences , 117 ( 10 ): 5113 – 5124 , 2020 . 2 OpenUrl Abstract / FREE Full Text [48]. ↵ Maged Nasser and Umi Kalsom Yusof . Deep learning based methods for breast cancer diagnosis: A systematic review and future direction . Diagnostics , 13 ( 1 ): 161 , 2023 . 2 OpenUrl PubMed [49]. ↵ Theodore Papamarkou , Tolga Birdal , Michael Bronstein , Gunnar Carlsson , Justin Curry , Yue Gao , Mustafa Hajij , Roland Kwitt , Pietro Liò , Paolo Di Lorenzo , et al. Position paper: Challenges and opportunities in topological deep learning . arXiv preprint arxiv: 2402.08871 , 2024 . 2 [50]. ↵ Yaopeng Peng , Hongxiao Wang , Milan Sonka , and Danny Z Chen . Phg-net: Persistent homology guided medical image classification . In Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision , pages 7583 – 7592 , 2024 . 2, 12 [51]. ↵ Talha Qaiser , Yee-Wah Tsang , Daiki Taniyama , Naoya Sakamoto , Kazuaki Nakane , David Epstein , and Nasir Rajpoot . Fast and accurate tumor segmentation of histology images using persistent homology and deep convolutional features . Medical image analysis , 55 : 1 – 14 , 2019 . 2 OpenUrl CrossRef PubMed [52]. ↵ Xuejun Qian , Jing Pei , Hui Zheng , Xinxin Xie , Lin Yan , Hao Zhang , Chunguang Han , Xiang Gao , Hanqi Zhang , Weiwei Zheng , et al. Prospective assessment of breast cancer risk from multimodal multiview ultrasound images via clinically applicable deep learning . Nature biomedical engineering , 5 ( 6 ): 522 – 532 , 2021 . 2 OpenUrl PubMed [53]. ↵ Xiaolei Qu , Hongyan Lu , Wenzhong Tang , Shuai Wang , Dezhi Zheng , Yaxin Hou , and Jue Jiang . A vgg attention vision transformer network for benign and malignant classification of breast ultrasound images . Medical Physics , 49 ( 9 ): 5787 – 5798 , 2022 . 2 OpenUrl PubMed [54]. ↵ Raúl Rabadán and Andrew J Blumberg . Topological data analysis for genomics and evolution: topology in biology . Cambridge University Press , 2019 . 2 [55]. ↵ Bastian Rieck , Tristan Yates , Christian Bock , Karsten Borgwardt , Guy Wolf , Nicholas Turk-Browne , and Smita Krishnaswamy . Uncovering the topology of time-varying fMRI data using cubical persistence . NeurIPS , 33 : 6900 – 6912 , 2020 . 2 OpenUrl [56]. ↵ Paulo Sergio Rodrigues . Breast ultrasound image . Mendeley Data , 1 ( 10.17632 ), 2017 . 5 [57]. ↵ Roslidar Roslidar , Aulia Rahman , Rusdha Muharar , Muhammad Rizky Syahputra , Fitri Arnia , Maimun Syukri , Biswajeet Pradhan , and Khairul Munadi . A review on recent progress in thermal imaging and deep learning approaches for breast cancer detection . IEEE Access , 8 : 116176 – 116194 , 2020 . 2 OpenUrl [58]. ↵ Ainkaran Santhirasekaram , Mathias Winkler , Andrea Rockall , and Ben Glocker . Topology preserving compositionality for robust medical image segmentation . In CVPR , pages 543 – 552 , 2023 . 2 [59]. ↵ Shallu Sharma and Rajesh Mehra . Conventional machine learning and deep learning approach for multi-classification of breast cancer histopathology images—a comparative insight . Journal of digital imaging , 33 : 632 – 654 , 2020 . 2 OpenUrl CrossRef PubMed [60]. ↵ Dinggang Shen , Guorong Wu , and Heung-Il Suk . Deep learning in medical image analysis . Annual review of biomedical engineering , 19 : 221 – 248 , 2017 . 1 OpenUrl CrossRef PubMed [61]. ↵ Li Shen , Laurie R Margolies , Joseph H Rothstein , Eugene Fluder , Russell McBride , and Weiva Sieh . Deep learning to improve breast cancer detection on screening mammography . Scientific reports , 9 ( 1 ): 12495 , 2019 . 2 OpenUrl PubMed [62]. ↵ Yiqiu Shen , Farah E Shamout , Jamie R Oliver , Jan Witowski , Kawshik Kannan , Jungkyu Park , Nan Wu , Connor Huddleston , Stacey Wolfson , Alexandra Millet , et al. Artificial intelligence system reduces false-positive findings in the interpretation of breast ultrasound exams . Nature communications , 12 ( 1 ): 5645 , 2021 . 2 OpenUrl PubMed [63]. ↵ K Simonyan and A Zisserman . Very deep convolutional networks for large-scale image recognition . In ICLR , 2015 . 5 [64]. ↵ Amitojdeep Singh , Sourya Sengupta , and Vasudevan Lakshminarayanan . Explainable deep learning models in medical image analysis . Journal of imaging , 6 ( 6 ): 52 , 2020 . 1 OpenUrl PubMed [65]. ↵ Yashbir Singh et al. TDA in Medical Imaging: Current state of the art . Insights into Imaging , 14 ( 1 ): 1 – 10 , 2023 . 1, 2 OpenUrl PubMed [66]. ↵ Ann E Sizemore , Jennifer E Phillips-Cremins , Robert Ghrist , and Danielle S Bassett . The importance of the whole: topological data analysis for the network neuroscientist . Network Neuroscience , 3 ( 3 ): 656 – 673 , 2019 . 1 OpenUrl PubMed [67]. ↵ Yara Skaf and Reinhard Laubenbacher . Topological data analysis in biomedicine: A review . Journal of Biomedical Informatics, page 104082 , 2022 . 2 [68]. ↵ Eashwar Somasundaram , Adam Litzler , Raoul Wadhwa , Steph Owen , and Jacob Scott . Persistent homology of tumor ct scans is associated with survival in lung cancer . Medical physics , 48 ( 11 ): 7043 – 7051 , 2021 . 2 OpenUrl PubMed [69]. ↵ N. Stucki et al. Topologically faithful image segmentation via induced matching of persistence barcodes . In ICML , 2023 . 2 [70]. ↵ Hyuna Sung , Jacques Ferlay , Rebecca L Siegel , Mathieu Laversanne , Isabelle Soerjomataram , Ahmedin Jemal , and Freddie Bray . Global cancer statistics 2020: Globocan estimates of incidence and mortality worldwide for 36 cancers in 185 countries . CA: a cancer journal for clinicians , 71 ( 3 ): 209 – 249 , 2021 . 1 OpenUrl CrossRef PubMed [71]. ↵ Christian Szegedy , Sergey Ioffe , Vincent Vanhoucke , and Alexander Alemi . Inception-v4, inception-resnet and the impact of residual connections on learning . In Proceedings of the AAAI conference on artificial intelligence , 2017 . 5 [72]. ↵ Mingxing Tan and Quoc Le . Efficientnet: Rethinking model scaling for convolutional neural networks . In ICML , pages 6105 – 6114 . PMLR , 2019 . 5 [73]. ↵ A Vaswani et al. Attention is all you need . Advances in Neural Information Processing Systems , 2017 . 4 [74]. ↵ Fan Wang , Saarthak Kapse , Steven Liu , Prateek Prasanna , and Chao Chen . Topotxr: a topological biomarker for predicting treatment response in breast cancer . In International Conference on Information Processing in Medical Imaging , pages 386 – 397 . Springer , 2021 . 2 [75]. ↵ Chi-Chong Wong and Chi-Man Vong . Persistent homology based graph convolution network for fine-grained 3D shape segmentation . In ICCV , pages 7098 – 7107 , 2021 . 2 [76]. ↵ Ankur Yadav , Faisal Ahmed , Ovidiu Daescu , Reyhan Gedik , and Baris Coskunuzer . Histopathological cancer detection with topological signatures . In 2023 IEEE International Conference on Bioinformatics and Biomedicine (BIBM) , pages 1610 – 1619 . IEEE , 2023 . 2 [77]. ↵ Zuoyu Yan and Tengfei Ma . Neural approximation of extended persistent homology on graphs . In Advances in Neural Information Processing Systems , 2022 . 1 [78]. ↵ Jiancheng Yang , Rui Shi , Donglai Wei , Zequan Liu , Lin Zhao , Bilian Ke , Hanspeter Pfister , and Bingbing Ni . Medmnist v2-a large-scale lightweight benchmark for 2D and 3D biomedical image classification . Scientific Data , 10 ( 1 ): 41 , 2023 . https://medmnist.com . 5, 7, 12 OpenUrl PubMed [79]. ↵ Xujing Yao , Xinyue Wang , Shui-Hua Wang , and Yu-Dong Zhang . A comprehensive survey on convolutional neural network in medical image analysis . Multimedia Tools and Applications , 81 ( 29 ): 41361 – 41405 , 2022 . 1 OpenUrl [80]. ↵ Ali Zia , Abdelwahed Khamis , James Nichols , Zeeshan Hayder , Vivien Rolland , and Lars Petersson . Topological deep learning: A review of an emerging paradigm . arXiv preprint arxiv: 2302.03836 , 2023 . 2 View the discussion thread. Back to top Previous Next Posted October 17, 2025. Download PDF Data/Code Email Thank you for your interest in spreading the word about medRxiv. NOTE: Your email address is requested solely to identify you as the sender of this article. Your Email * Your Name * Send To * Enter multiple addresses on separate lines or separate them with commas. You are going to email the following Breast Cancer Detection with Topological Deep Learning Message Subject (Your Name) has forwarded a page to you from medRxiv Message Body (Your Name) thought you would like to see this page from the medRxiv website. Your Personal Message CAPTCHA This question is for testing whether or not you are a human visitor and to prevent automated spam submissions. Share Breast Cancer Detection with Topological Deep Learning Brighton Nuwagira , Adrian Rodriguez , Qiwei Li , Baris Coskunuzer medRxiv 2025.10.15.25338098; doi: https://doi.org/10.1101/2025.10.15.25338098 Share This Article: Copy Citation Tools Breast Cancer Detection with Topological Deep Learning Brighton Nuwagira , Adrian Rodriguez , Qiwei Li , Baris Coskunuzer medRxiv 2025.10.15.25338098; doi: https://doi.org/10.1101/2025.10.15.25338098 Citation Manager Formats BibTeX Bookends EasyBib EndNote (tagged) EndNote 8 (xml) Medlars Mendeley Papers RefWorks Tagged Ref Manager RIS Zotero Tweet Widget Facebook Like Google Plus One Subject Area Radiology and Imaging Subject Areas All Articles Addiction Medicine (568) Allergy and Immunology (863) Anesthesia (297) Cardiovascular Medicine (4421) Dentistry and Oral Medicine (443) Dermatology (381) Emergency Medicine (606) Endocrinology (including Diabetes Mellitus and Metabolic Disease) (1507) Epidemiology (15212) Forensic Medicine (30) Gastroenterology (1121) Genetic and Genomic Medicine (6581) Geriatric Medicine (667) Health Economics (996) Health Informatics (4520) Health Policy (1366) Health Systems and Quality Improvement (1611) Hematology (539) HIV/AIDS (1264) Infectious Diseases (except HIV/AIDS) (15906) Intensive Care and Critical Care Medicine (1103) Medical Education (620) Medical Ethics (144) Nephrology (667) Neurology (6580) Nursing (345) Nutrition (998) Obstetrics and Gynecology (1141) Occupational and Environmental Health (956) Oncology (3324) Ophthalmology (970) Orthopedics (369) Otolaryngology (420) Pain Medicine (435) Palliative Medicine (129) Pathology (663) Pediatrics (1689) Pharmacology and Therapeutics (691) Primary Care Research (710) Psychiatry and Clinical Psychology (5431) Public and Global Health (9212) Radiology and Imaging (2193) Rehabilitation Medicine and Physical Therapy (1368) Respiratory Medicine (1194) Rheumatology (593) Sexual and Reproductive Health (709) Sports Medicine (529) Surgery (709) Toxicology (99) Transplantation (288) Urology (265) (function(){function c(){var b=a.contentDocument||a.contentWindow.document;if(b){var d=b.createElement('script');d.innerHTML="window.__CF$cv$params={r:'9ff18d08ac5141e2',t:'MTc3OTM0NTIxOQ=='};var a=document.createElement('script');a.src='/cdn-cgi/challenge-platform/scripts/jsd/main.js';document.getElementsByTagName('head')[0].appendChild(a);";b.getElementsByTagName('head')[0].appendChild(d)}}if(document.body){var a=document.createElement('iframe');a.height=1;a.width=1;a.style.position='absolute';a.style.top=0;a.style.left=0;a.style.border='none';a.style.visibility='hidden';document.body.appendChild(a);if('loading'!==document.readyState)c();else if(window.addEventListener)document.addEventListener('DOMContentLoaded',c);else{var e=document.onreadystatechange||function(){};document.onreadystatechange=function(b){e(b);'loading'!==document.readyState&&(document.onreadystatechange=e,c())}}}})();

Text is read by the "Ask this paper" AI Q&A widget below. Extraction quality varies by source — PMC NXML preserves structure cleanly, OA-HTML may include some navigation residue, and OA-PDF can have broken hyphenation. The publisher copy (via DOI) is the canonical version.

My notes (saved in your browser only)

Ask this paper AI returns verbatim quotes from the full text · source: preprint-html

Answers must be backed by verbatim quotes from this paper's full text. Hallucinated quotes are dropped automatically; if no verbatim passage answers the question, we say so. How this works

Citation neighborhood (no data yet)

We don't have any in-corpus citations linked to this paper yet. This is a recent paper (2025) — citers typically take a year or two to land, and the OpenAlex reference graph may still be filling in.

Source provenance

europepmc
last seen: 2026-05-20T01:45:00.602351+00:00