Full text
36,478 characters
· extracted from
preprint-html
· click to expand
Estimating drivers of breast tissue transitions from normal to tumor state | bioRxiv /* */ /* */ <!-- <!-- /*! * yepnope1.5.4 * (c) WTFPL, GPLv2 */ (function(a,b,c){function d(a){return"[object Function]"==o.call(a)}function e(a){return"string"==typeof a}function f(){}function g(a){return!a||"loaded"==a||"complete"==a||"uninitialized"==a}function h(){var a=p.shift();q=1,a?a.t?m(function(){("c"==a.t?B.injectCss:B.injectJs)(a.s,0,a.a,a.x,a.e,1)},0):(a(),h()):q=0}function i(a,c,d,e,f,i,j){function k(b){if(!o&&g(l.readyState)&&(u.r=o=1,!q&&h(),l.onload=l.onreadystatechange=null,b)){"img"!=a&&m(function(){t.removeChild(l)},50);for(var d in y[c])y[c].hasOwnProperty(d)&&y[c][d].onload()}}var j=j||B.errorTimeout,l=b.createElement(a),o=0,r=0,u={t:d,s:c,e:f,a:i,x:j};1===y[c]&&(r=1,y[c]=[]),"object"==a?l.data=c:(l.src=c,l.type=a),l.width=l.height="0",l.onerror=l.onload=l.onreadystatechange=function(){k.call(this,r)},p.splice(e,0,u),"img"!=a&&(r||2===y[c]?(t.insertBefore(l,s?null:n),m(k,j)):y[c].push(l))}function j(a,b,c,d,f){return q=0,b=b||"j",e(a)?i("c"==b?v:u,a,b,this.i++,c,d,f):(p.splice(this.i++,0,a),1==p.length&&h()),this}function k(){var a=B;return a.loader={load:j,i:0},a}var l=b.documentElement,m=a.setTimeout,n=b.getElementsByTagName("script")[0],o={}.toString,p=[],q=0,r="MozAppearance"in l.style,s=r&&!!b.createRange().compareNode,t=s?l:n.parentNode,l=a.opera&&"[object Opera]"==o.call(a.opera),l=!!b.attachEvent&&!l,u=r?"object":l?"script":"img",v=l?"script":u,w=Array.isArray||function(a){return"[object Array]"==o.call(a)},x=[],y={},z={timeout:function(a,b){return b.length&&(a.timeout=b[0]),a}},A,B;B=function(a){function b(a){var a=a.split("!"),b=x.length,c=a.pop(),d=a.length,c={url:c,origUrl:c,prefixes:a},e,f,g;for(f=0;f<d;f++)g=a[f].split("="),(e=z[g.shift()])&&(c=e(c,g));for(f=0;f<b;f++)c=x[f](c);return c}function g(a,e,f,g,h){var i=b(a),j=i.autoCallback;i.url.split(".").pop().split("?").shift(),i.bypass||(e&&(e=d(e)?e:e[a]||e[g]||e[a.split("/").pop().split("?")[0]]),i.instead?i.instead(a,e,f,g,h):(y[i.url]?i.noexec=!0:y[i.url]=1,f.load(i.url,i.forceCSS||!i.forceJS&&"css"==i.url.split(".").pop().split("?").shift()?"c":c,i.noexec,i.attrs,i.timeout),(d(e)||d(j))&&f.load(function(){k(),e&&e(i.origUrl,h,g),j&&j(i.origUrl,h,g),y[i.url]=2})))}function h(a,b){function c(a,c){if(a){if(e(a))c||(j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}),g(a,j,b,0,h);else if(Object(a)===a)for(n in m=function(){var b=0,c;for(c in a)a.hasOwnProperty(c)&&b++;return b}(),a)a.hasOwnProperty(n)&&(!c&&!--m&&(d(j)?j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}:j[n]=function(a){return function(){var b=[].slice.call(arguments);a&&a.apply(this,b),l()}}(k[n])),g(a[n],j,b,n,h))}else!c&&l()}var h=!!a.test,i=a.load||a.both,j=a.callback||f,k=j,l=a.complete||f,m,n;c(h?a.yep:a.nope,!!i),i&&c(i)}var i,j,l=this.yepnope.loader;if(e(a))g(a,0,l,0);else if(w(a))for(i=0;i (function(w,d,s,l,i){w[l]=w[l]||[];w[l].push({'gtm.start':new Date().getTime(),event:'gtm.js'});var f=d.getElementsByTagName(s)[0];var j=d.createElement(s);var dl=l!='dataLayer'?'&l='+l:'';j.src='//www.googletagmanager.com/gtm.js?id='+i+dl;j.type='text/javascript';j.async=true;f.parentNode.insertBefore(j,f);})(window,document,'script','dataLayer','GTM-M677548'); Skip to main content Home About Submit ALERTS / RSS Search for this keyword Advanced Search New Results Estimating drivers of breast tissue transitions from normal to tumor state View ORCID Profile Swapnil Kumar , Vaibhav Vindal doi: https://doi.org/10.1101/2025.04.14.648655 Swapnil Kumar 1 Department of Biotechnology & Bioinformatics, School of Life Sciences, University of Hyderabad , Hyderabad, 500046, India Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Swapnil Kumar Vaibhav Vindal 1 Department of Biotechnology & Bioinformatics, School of Life Sciences, University of Hyderabad , Hyderabad, 500046, India Find this author on Google Scholar Find this author on PubMed Search for this author on this site For correspondence: vaibhav{at}uohyd.ac.in Abstract Full Text Info/History Metrics Supplementary material Preview PDF Abstract Tumor tissues are characterized by dysregulated gene expression patterns leading to altered cellular pathways and molecular functions as a result of their transition from normal to tumor state. Further, tumor-adjacent normal tissues (TANTs), utilized as a control in cancer research, are not molecularly normal and differ from healthy normal tissues. These TANTs represent a distinctive transitional state betwixt normal and tumor states. However, the mechanism underlying this state transition, expression dysregulation, and perturbed regulation remain largely unexplored and hence elusive. Herein, the transitions of breast tissues from normal and TANT to tumor states were modeled using gene expression and regulation data to estimate key drivers underlying these transitions. As a result, we identified 645 shared driver genes underlying the transitions of breast tissues from the healthy normal state to the adjacent normal and tumor states. Besides, we identified 635 shared driver genes underlying the transitions of TANTs to different subtypes. When we intersected both lists of shared driver genes, a total of 615 commonly shared driver genes across the state transitions were observed. Subsequently, functional annotations of these driver genes revealed their involvement in the growth and maintenance-related activity of cells. Additionally, key pathways associated with cancer pathogenesis, such as Wnt signaling, Notch signaling, NF-kappa B signaling, and PD-L1 expression and PD-1 checkpoint pathway in cancer, were found significantly enriched with these shared driver genes. Thus, the shared driver genes identified across tissue transitions provide ways forward to devise more efficient diagnostic and therapeutic strategies for early and effective disease management. Introduction Breast cancer is a major women’s health concern due to high morbidity and mortality across the globe (Bray et al., 2024). It arises from abnormal growth in breast tissues, mainly lobules and ducts. It is complex and heterogeneous in nature and has multiple subtypes. These molecular subtypes are classified by the presence and absence of hormone receptors, viz., “Estrogen receptor” (ER), “Progesterone receptor” (PR), and “Human epidermal growth factor receptor 2” (HER2). Further, these subtypes of breast cancer include “Basal-Like” (Basal) (ER-/PR- and HER2-), “Luminal A” (LumA) (ER+/PR+, HER2-, and Ki67 low), “Luminal B” (LumB) (ER+/PR+, HER2+ or HER2-, and Ki67 high), “HER2-enriched” (Her2) (ER+/PR+ and HER2+), and “Normal-Like” (NormL) (ER+/PR+, HER2-, and Ki67 low) (Dai et al., 2015). Each of these subtypes exhibits different gene expression profiles and, hence, distinct gene regulatory network (GRN) systems. Besides, the gene expression profiles and GRNs of these subtypes also differ from their adjacent normal and even completely normal healthy tissues ( Kumar & Vindal, 2023 ). Moreover, every cancer study employing patient samples include the tumor-adjacent normal tissue (TANT) samples as control for studying the tumor tissues. However, these morphologically and histologically looking normal TANTs are not completely normal and are different from healthy normal tissues (HNTs) derived from non-tumor-bearing healthy individuals. For example, the TANTs have various tumorigenic features, including altered pathways ( Aran et al., 2017 ) and gene expression profiles ( Kumar & Vindal, 2023 ). Despite this, there is a substantial lack of related knowledge as well as thorough experimental studies on the driver genes underlying the transitions of normal breast tissues into different subtypes of the same breast cancer. It is experimentally well-documented that alterations in gene expressions lead normal tissues to proceed toward diseased ones. When normal tissues transform into tumors, the exact attribute of the alteration of cellular pathways and loss of functions specifically depends on differentially expressed genes and pathways varying between different cell or tissue types. Therefore, specific states of any tissues, e.g., normal and tumor tissues, harbor distinct gene expression profiles. Further, these normal and tumor states might be representative of changes that occurred during the transition or transformation from one to another condition, e.g., healthy to tumor condition. Different tissue types can be classified by their gene expression profiles and, hence, GRNs; consequently, the transitions between different states can be modeled using any changes occurred in their underlying GRNs. In this study, we have applied modeling of network state transition using gene expression and regulation data, a regression-based method implemented in MONSTER ( Schlauch et al., 2017 ), for inferring transcription factors (TFs) as drivers of tissue state transformation at the GRN level. We analyzed TANTs along with all five subtypes of breast cancer to identify TFs that lead to the alteration of the network structure as the healthy tissues progress toward the diseased state. For this, first, TF-target gene regulations were predicted using gene expression profiles of TANTs and subtypes; then, driver genes and TFs present in TANTs and subtypes were identified using the corresponding expression profiles coupled with the predicted TF-target gene regulations. Thus, our results demonstrate the key candidate genes and TFs associated with TANTs and subtypes, offering a promising avenue toward designing and developing more efficient, early-stage-specific diagnostic and therapeutic interventions. Methods Acquisition of tumor and normal tissue data Gene expression datasets of tumor tissues and TANTs were retrieved using the recount2 project (Collado-Torres et al., 2017) from the portal of genomic data commons of “The Cancer Genome Atlas” (TCGA) ( Tomczak et al. 2015 ; Weinstein et al. 2013 ). However, the gene expression data of healthy normal tissues (HNTs) were retrieved using the recount2 project from “The Genotype-Tissue Expression” (GTEx) portal ( Lonsdale et al., 2013 ). These data were downloaded with the help of the “TCGAbiolinks” R package (Colaprico et al., 2016). Subsequently, all three types of gene expression data were pre-processed, filtered, and normalized using the “TCGAbiolinks” R package for further analysis. Motif mapping data for TF-target gene regulations Motif mapping data contain information on which genes have likely binding sites for a particular TF in their promoter and vicinity. This serves as the prior on TF-gene regulations and informs the network inferential method with a prior network of TFs targeting genes. Each row of this prior data defines one regulatory edge with TF, the corresponding targeted gene, and the edge’s strength. For the current study, we have considered networks as unweighted and, hence, have populated the entire data with one as the strength of the edges. The TF-gene motif mapping data were collected from the motif mappings provided in online documentation and resources of PANDA (Glass et al., 2013). Prediction of transitioning drivers Driver genes underlying the transition of breast tissues from the normal state to the tumor state were predicted using the MONSTER package ( Schlauch et al., 2017 ) as implemented in netZooR v1.4 ( Ben Guebila et al, 2023 ) and R v4.2. It first predicts the regulatory relations of TFs and their target genes using the PANDA implementation (Glass et al., 2013) by utilizing gene expression data of each tissue type along with prior information on the TF-gene motif mapping. Herein, the gene expression data of genes with counts per million (CPM) values of one or more across 50% or more samples were only considered in the case of each tissue type. However, the predicted gene regulations for initial and terminal conditions, i.e., normal and tumor tissues using the PANDA package, can also be used directly as input in the MONSTER algorithm for the transition driver predictions. Subsequently, this calculates a transition matrix by mapping the GRN of the initial state to the GRN of the final state and follows the identification of a set of significant and critical driver genes potentially responsible for the transition of normal tissues and TANTs to tumor tissues. To determine the statistical significance of the results produced by the MONSTER, the samples were permuted 100 times, and the analysis was re-run for each permutation. Further, the state transition matrices, along with the rewired regulations of differential TFs involved in the state transition process, were visualized. Functional and pathway annotation of key drivers Key driver genes for the modeled tissue transitions were checked for their involvement in molecular functions (MFs) and biological processes (BPs) utilizing the Gene Ontology (GO) and pathways by the KEGG pathway-based over-representation analysis method implemented in the clusterProfiler R package ( Xu et al., 2024 ). To identify significantly associated or enriched MF, BP, and pathway terms with key driver genes, the significance level was set to an adjusted P-value of 0.05. Herein, the P-value was adjusted by the method of “Benjamini-Hochberg” (BH) to control the false positive rate. Disease association of key drivers Driver genes underlying the transition of tissues from a normal to tumor state were subjected to Disease Ontology (DO)-based enrichment analysis using the DOSE R package ( Yu et al., 2015 ) with the “BH” method of P-value adjustment. All the enriched terms with adjusted P-values ≤ 0.05 were regarded as significant for the result inference purpose. Further, these driver genes were also searched for their previously known association with any diseases, including cancers, using disease-gene association information from the database of DisGeNET ( Piñero et al., 2020 ) and the catalog of known and candidate cancer genes from the database of Network of Cancer Genes (NCG) ( Repana et al., 2019 ). Results and discussion Expression data of tumor tissues, TANTs, and HNTs Gene expression profiles of all six tissue types were processed together for further analysis. Herein, only expressions of protein-coding genes were considered as per the list of genes and their details retrieved from the Human Gene Nomenclature Committee. The detailed distribution of samples and genes across all tissue data are provided in Table 1 . The LumA subtype had the highest number of samples (570), while the NormL subtype had the lowest (40). The gene expression data of only female samples, from both TCGA and GTEx, were used for the current study. View this table: View inline View popup Table 1. Samples and genes across all six tissue types Driver genes underlying transitions of tumors and TANTs from HNTs The modeling of state transition from normal state, i.e., HNTs, to tumor state, i.e., different subtypes and TANTs, resulted in the identification of differential TFs as potential drivers involved in the state transitions. Herein, we have considered the TANTs similar to tumors because it is well-proven that the TANTs are not entirely normal and have tumorigenic features at the molecular level. When state transitions were modeled for HNTs with tumor tissues and TANTs, a maximum of 830 driver genes were identified for Basal, Her2, and TANT, whereas a minimum of 812 for LumA. The detailed distributions of identified driver genes across all modeled transitions are available in Table 2 and Fig. 1 . There were a total of 645 commonly shared driver genes underlying the modeled transitions of tumor tissues and TANTs from the HNTs (Table S1). These shared common driver genes included some well-known cancer-associated genes such as ATM, BCL11A, BRCA2, E2F1, ESR1, FOXA1, JUN, MYC, RUNX1, TP53 , and TP63 . View this table: View inline View popup Table 2. Distribution of genes with a CPM value of more than one and number of drivers identified across all possible transitions Download figure Open in new tab Fig. 1. Distribution of driver genes underlying transitions of tumor tissues and TANTs from HNTs Driver genes underlying transitions of subtypes from TANTs We also modeled the state transitions of tumor tissues (five subtypes, viz., Basal, LumA, LumB, Her2, and NormL) from the TANTs, which resulted in the identification of differential TFs as potential drivers involved in the respective state transitions. Consequently, a maximum of 850 driver genes were identified for the Basal subtype, whereas a minimum of 808 for the NormL. The detailed distributions of identified driver genes across all modeled transitions are available in Table 2 and Fig. 2 . There were a total of 635 commonly shared driver genes across all the five modeled state transitions of tumor tissues (breast cancer subtypes) from the TANTs (Table S2). These shared common driver genes across transitions also included some well-known cancer-associated genes, such as ATM, BCL11A, BRCA2, E2F1, ESR1, FOXA1, JUN, MYC, RUNX1, TP53 , and TP63 , which were even present in the transitions of HNTs to tumor tissues. Download figure Open in new tab Fig. 2. Distribution of driver genes underlying transitions of tumor tissues from TANTs When we looked for the common driver genes in both transitions, i.e., from HNTs to TANTs and tumors and from TANTs to tumors, most of the driver genes from both transitions were common, and hence, there were 615 shared driver genes. These commonly shared driver genes across all the transitions can serve as key candidates for the design and development of potential diagnostics and therapeutics specifically for the effective management and treatment of the disease at an early-stage. It has been reported that the mutated ATM gene is associated with a higher breast cancer risk and contributes to its development (Dork et al., 2001; Soukupova et al., 2008 ; Bogdanova et al., 2009 ). Next, the gene BCL11A , a B-cell proto-oncogene, has previously been found to be associated with transcriptional regulation and as a mutated gene in breast cancer ( Sjoblom et al. 2006 ). Similarly, the DNA repair-associated gene BRCA2 has been identified as a mutated gene in the case of breast cancer ( Valarmathi et al., 2004 ; Hall et al., 2009 ; Vaidyanathan et al., 2009 ). Functions and processes of key drivers GO-based enrichment analysis revealed a total of 66 MF and 369 BP terms significantly enriched or over-represented with commonly shared driver genes. Among all enriched MF terms, terms related to transcription regulations, including “DNA-binding transcription activator and repressor activity,” “transcription coactivator and corepressor activity,” “histone deacetylase activity,” and “promoter-specific chromatin binding” were most significantly enriched with the maximum number of the shared driver genes ( Fig. 3 ). Moreover, among all enriched BP terms, terms related to developmental and transcriptional processes, such as “gland development,” “mononuclear cell differentiation,” “intracellular receptor signaling pathway,” “regulation of miRNA transcription,” “miRNA metabolic process,” etc., were the most enriched terms with the majority of the shared driver genes ( Fig. 4 ). These MF and BP terms associated with the shared driver genes indicate that these driver genes play vital roles in the growth and maintenance-related activity of cells and, hence, the constituting tissues. Download figure Open in new tab Fig. 3. Top MF terms significantly associated with shared driver genes Download figure Open in new tab Fig. 4. Top BP ontology terms significantly associated with shared driver genes Enriched pathways of key drivers When the commonly shared driver genes across all types of modeled transitions were subjected to pathway analysis, 83 pathways were identified as significantly associated with these driver genes. Among all these pathways, the pathway of “Transcriptional misregulation in cancer” (hsa05202) was found to be significantly enriched or over-represented with the maximum number of shared driver genes. Transcriptional misregulation is a hallmark of cancer that is driven by genetic alterations that disrupt the transcriptional control of genes. Further, genetic alterations can affect transcriptional controls at many levels, including Cis-elements and Trans-factors, which can lead to a variety of alterations in cellular properties that contribute to tumor development. These alterations in cellular properties can include dysregulated transcriptional programs ( Koschmieder et al., 2009 ) and fusion oncoproteins ( Prensner & Chinnaiyan, 2009 ). Other significantly enriched pathways included “Breast cancer pathway,” “TGF-beta signaling pathway,” “Notch signaling pathway,” “Wnt signaling pathway,” “Cell cycle,” “Estrogen signaling pathway,” “MAPK signaling pathway,” “NF-kappa B signaling pathway,” “Toll-like receptor signaling pathway,” and “PD-L1 expression and PD-1 checkpoint pathway in cancer” ( Fig. 5 ). It is interesting to note that these pathways are well-known for their involvement in the pathogenesis of various types of cancers, including breast cancer. For example, the altered form of the MAPK signaling pathway is known for its association with the development of various diseases, including cancers ( Qi & Elion, 2005 ; Kim & Choi, 2010 ). Thus, these significantly over-represented pathways with shared driver genes highlight their importance in the transitions of normal tissues to tumor tissues and, hence, the tumorigenesis of breast cancer. Download figure Open in new tab Fig. 5. Top KEGG pathway terms significantly associated with shared driver genes Enriched diseases of key drivers The DO and NCG-based enrichment analysis of the shared driver genes revealed their significant associations with various cancer types and other diseases. It was noticed that 135 DO terms and 37 NCG terms were significantly enriched with these common driver genes. Among DO terms, cancer-related terms such as “breast cancer,” “lung cancer,” “liver cancer,” and “prostate cancer” were enriched with a majority of the shared driver genes ( Fig. 6 ). Similarly, NCG terms, including “breast cancer,” “bladder cancer,” “liver cancer,” and “prostate cancer,” were found to be significantly enriched with the majority of the shared driver genes ( Fig. 7 ). These enriched terms show that all the shared driver genes identified herein have potential implications in the transitions of normal breast tissues to tumor forms. Download figure Open in new tab Fig. 6. Disease ontology terms significantly associated with shared driver genes Download figure Open in new tab Fig. 7. NCG terms significantly associated with shared driver genes Limitations of the current study It is the first study to date on modeling the transitions of breast tissues from normal to tumor state using gene expression and TF-gene regulatory data of tumor tissues, TANTs, and normal tissues to estimate the underlying driver genes. However, the present study has some limitations, too. First, we have considered the samples of TANTs as one group of tissues that represents the intermediate state between normal and tumor states, irrespective of which subtypes these TANTs belong to due to the low number of samples of TANTs to individual subtypes. Thus, with the future availability of more expression data on TANTs of different subtypes, transitions of each subtype can be modeled to estimate the underlying driver genes towards the inference of pathway mechanisms transforming breast tissues from normal to tumor forms more accurately and efficiently. Second, we computed only 10 null permutations to determine the statistical significance of our result for each modeled transition due to the requirement of a large amount of computational processing therein. However, computing high numbers of null permutations, such as 1000, would likely ensure more sufficient null observations for estimating null distributions and computing empirical P-values. In turn, it will produce comparatively more significant predictions of transitioning driver genes. Third, annotations retrieved from the databases of GO and pathways tend to be biased toward genes and pathways that are well-studied and properly characterized. Consequently, genes that lack functional and pathway-based annotations get ignored while performing GO and pathway-based annotation analyses; hence, those genes are required to be investigated separately. Conclusions The transitions between two states of phenotypes, viz., normal and tumor, can be modeled in terms of gene expression space, where a change in phenotype correlates with the transition between gene expression profiles of the two states. Here, we implemented the framework of network modeling for inferring state transitions between HNT/TANT and five subtypes (Basal, LumA, LumB, Her2, and NormL) using gene expression and regulatory data by assuming that gene expression patterns were driven by perturbations in gene regulation patterns and therefore, subsequent changes in the underlying GRN. It helped us to explore and decode how phenotypic alterations and the associated regulatory changes were driven by the “rewiring” of TF-target regulations and to identify all those TFs that were involved in the alteration of their targets. As a result, it revealed critical driver genes underlying the transitions of all five subtypes from the HNTs and TANTs and also the TANTs from the HNTs. These key drivers included genes such as ATM, BCL11A, BRCA2, E2F1, ESR1, FOXA1, JUN, MYC, RUNX1, TP53 , and TP63 . Thus, the current study paved the way to identify and explore the TFs that drive the transition occurring from normal healthy to tumor states, and it can be applied to a wide range of systems, such as Type 2 diabetes, Cardiovascular diseases, Neurodegenerative diseases, and other types of cancers. Funding This study was supported by the extramural research grant from the Indian Council of Medical Research (ICMR) New Delhi (ISRM/12(72)/2020, ID: 2020-2951). Contributions SK and VV conceived and designed the study. SK performed the experiments and analyzed the data. SK drafted, wrote, and edited the manuscript. VV reviewed and edited the manuscript. VV supervised the study. All authors read and approved the final manuscript. Declaration of Competing Interests The authors declare that they have no known competing financial interests or personal relationships that could have appeared to influence the work reported in this paper. Ethics Statement This manuscript does not involve human subjects, animals, or any form of experimentation requiring ethical approval or consent. Data availability statement The common driver genes for two transitions, viz., transition from HNTs to TANTs and tumor tissues and transition from TANTs to tumor tissues identified in the current study are available in the supplementary data files. Further, the gene expression datasets of tumors, TANTs, and HNTs used in this study are publicly available and can be downloaded from the portals of TCGA (tumors and TANTs) and GTEx (HNTs). Supplementary Tables Table S1. Driver genes underlying transition from HNTs to TANTs and tumor tissues Table S2. Driver genes underlying transition from TANTs to tumor tissues Acknowledgements The authors thank the Center for Modeling, Simulation & Design (CMSD), University of Hyderabad, for providing computational facilities. Further, VV would like to thank the Indian Council of Medical Research (ICMR), New Delhi (ISRM/12(72)/2020, ID: 2020-2951), Institution of Eminence – University of Hyderabad (No. UoH/IoE/RC3-21-052), and Department of Biotechnology (DBT), Government of India (No. BUILDER-DBT-BT/INF/22/SP41176/2020), for their financial support. SK also acknowledges the Institution of Eminence – UoH for the Performance-Based Publication Incentives, University of Hyderabad for the Non-NET Fellowship, and ICMR for the Senior Research Fellowship (Grant No.: 3/2/2/113/2019/NCD-III, ID: 2019-6723). Funding Indian Council of Medical Research, https://ror.org/0492wrx28 , ISRM/12(72)/2020, ID: 2020-2951 References 1. ↵ Aran D , Camarda R , Odegaard J et al. ( 2017 ) Comprehensive analysis of normal adjacent to tumor transcriptomes . Nat Commun , 8 : 1077 OpenUrl CrossRef PubMed 2. ↵ Ben Guebila M , Wang T , Lopes-Ramos CM , Fanfani V , Weighill D , Burkholz R , et al. ( 2023 ) The Network Zoo: a multilingual package for the inference and analysis of gene regulatory networks . Genome Biology , 24 ( 1 ): 45 . doi: 10.1186/s13059-023-02877-1 OpenUrl CrossRef PubMed 3. ↵ Bogdanova N , Cybulski C , Bermisheva M , Datsyuk I , Yamini P , Hillemanns P , et al. ( 2009 ) A nonsense mutation (E1978X) in the ATM gene is associated with breast cancer . Breast Cancer Res Treat , 118 ( 1 ): 207 – 11 . doi: 10.1007/s10549-008-0189-9 OpenUrl CrossRef PubMed 4. Bray F , Laversanne M , Sung H , Ferlay J , Siegel RL , Soerjomataram I , et al. ( 2024 ) Global cancer statistics 2022: GLOBOCAN estimates of incidence and mortality worldwide for 36 cancers in 185 countries . CA Cancer J Clin , 74 ( 3 ): 229 – 263 . OpenUrl CrossRef PubMed 5. Colaprico A , Silva TC , Olsen C , Garofano L , Cava C , Garolini D , et al. ( 2016 ) TCGAbiolinks: an R/Bioconductor package for integrative analysis of TCGA data . Nucleic acids research , 44 ( 8 ): e71. . OpenUrl CrossRef PubMed 6. Collado-Torres L , Nellore A , Kammers K , Ellis SE , Taub MA , Hansen KD , et al. ( 2017 ) Reproducible RNA-seq analysis using recount2 . Nature biotechnology , 35 ( 4 ): 319 – 21 . OpenUrl CrossRef PubMed 7. Dai X , Li T , Bai Z , Yang Y , Liu X , Zhan J , et al. ( 2015 ) Breast cancer intrinsic subtype classification, clinical use and future trends . Am J Cancer Res 5 ( 10 ): 2929 – 2943 OpenUrl CrossRef PubMed 8. Dörk T , Bendix R , Bremer M , Rades D , Klöpper K , Nicke M , et al. ( 2001 ) Spectrum of ATM gene mutations in a hospital-based series of unselected breast cancer patients . Cancer Res , 61 ( 20 ): 7608 – 15 . OpenUrl Abstract / FREE Full Text 9. Glass K , Huttenhower C , Quackenbush J , Yuan GC . ( 2013 ) Passing messages between biological networks to refine predicted interactions . PloS ONE , 8 ( 5 ): 64832 . OpenUrl CrossRef 10. ↵ Hall MJ , Reid JE , Burbidge LA , Pruss D , Deffenbaugh AM , Frye C , et al. ( 2009 ) BRCA1 and BRCA2 mutations in women of different ethnicities undergoing testing for hereditary breast-ovarian cancer . Cancer , 115 ( 10 ): 2222 – 33 . doi: 10.1002/cncr.24200 . Erratum in: Cancer, 115(12):2804 OpenUrl CrossRef PubMed Web of Science 11. ↵ Kim EK , Choi EJ . ( 2010 ) Pathological roles of MAPK signaling pathways in human diseases . Biochim. Biophys. Acta (BBA) - Mol. Basis Dis ., 1802 ( 4 ), 396 – 405 OpenUrl CrossRef 12. ↵ Koschmieder S , Halmos B , Levantini E , Tenen DG . ( 2009 ) Dysregulation of the C/EBPalpha differentiation pathway in human cancer . J Clin Oncol , 27 : 619 – 628 . DOI: 10.1200/JCO.2008.17.9812 OpenUrl CrossRef PubMed 13. ↵ Kumar S , Vindal V. ( 2023 ) Architecture and topologies of gene regulatory networks associated with breast cancer, adjacent normal, and normal tissues . Funct Integr Genomics 23 , 324 . doi: 10.1007/s10142-023-01251-5 OpenUrl CrossRef PubMed 14. ↵ Lonsdale J , Thomas J , Salvatore M , Phillips R , Lo E , Shad S , et al. ( 2013 ) The genotype-tissue expression (GTEx) project . Nature genetics , 45 ( 6 ): 580 – 5 . OpenUrl CrossRef PubMed 15. ↵ Piñero J , Ramírez-Anguita JM , Saüch-Pitarch J , Ronzano F , Centeno E , Sanz F , et al. ( 2020 ) The DisGeNET knowledge platform for disease genomics: 2019 update . Nucleic acids research , 48 ( D1 ): D845 – 55 . OpenUrl CrossRef PubMed 16. ↵ Prensner JR , Chinnaiyan AM . ( 2009 ) Oncogenic gene fusions in epithelial carcinomas . Curr Opin Genet Dev 19 : 82 – 91 . DOI: 10.1016/j.gde.2008.11.008 OpenUrl CrossRef PubMed Web of Science 17. ↵ Qi M , Elion EA . ( 2005 ) MAP kinase pathways . J Cell Sci , 118 , 3569 – 3572 . OpenUrl FREE Full Text 18. ↵ Repana D , Nulsen J , Dressler L , Bortolomeazzi M , Venkata SK , Tourna A , et al. ( 2019 ) The Network of Cancer Genes (NCG): a comprehensive catalogue of known and candidate cancer genes from cancer sequencing screens . Genome biology . 20 : 1 – 2 . OpenUrl CrossRef PubMed 19. ↵ Schlauch D , Glass K , Hersh C , et al. ( 2017 ) Estimating drivers of cell state transitions using gene regulatory network models . BMC Syst Biol , 11 , 139 . doi: 10.1186/s12918-017-0517-y OpenUrl CrossRef PubMed 20. ↵ Sjoblom T , Jones S , Wood LD , et al. ( 2006 ) The consensus coding sequences of human breast and colorectal cancers . Science , 314 268 – 274 OpenUrl Abstract / FREE Full Text 21. ↵ Soukupova J , Dundr P , Kleibl Z , Pohlreich P. ( 2008 ) Contribution of mutations in ATM to breast cancer development in the Czech population . Oncol Rep , 19 ( 6 ): 1505 – 10 . OpenUrl PubMed 22. ↵ Tomczak K , Czerwińska P , Wiznerowicz M ( 2015 ) The Cancer Genome Atlas (TCGA): an immeasurable source of knowledge . Contemp Oncol (Pozn) 19 ( 1A ): A68 – A77 OpenUrl 23. ↵ Vaidyanathan K , Lakhotia S , Ravishankar HM , Tabassum U , Mukherjee G , Somasundaram K. ( 2009 ) BRCA1 and BRCA2 germline mutation analysis among Indian women from south India: identification of four novel mutations and high-frequency occurrence of 185delAG mutation . J Biosci , 34 ( 3 ): 415 – 22 . doi: 10.1007/s12038-009-0048-9 OpenUrl CrossRef PubMed 24. ↵ Valarmathi MT , Sawhney M , Deo SSV , Shukla NK , Das SN . ( 2004 ) Novel germline mutations in the BRCA1 and BRCA2 genes in Indian breast and breast-ovarian cancer families . Hum Mutat , 23 ( 2 ): 205 . doi: 10.1002/humu.9213 OpenUrl CrossRef PubMed 25. ↵ Weinstein JN , Collisson EA , Mills GB , Shaw KR , Ozenberger BA , Ellrott K , et al. ( 2013 ) The Cancer Genome Atlas pan-cancer analysis project . Nat Genet 45 : 1113 – 1120 OpenUrl CrossRef PubMed 26. ↵ Xu S , Hu E , Cai Y , Xie Z , Luo X , Zhan L , et al. ( 2024 ) Using clusterProfiler to characterize multiomics data . Nature Protocols. 2024 , doi: 10.1038/s41596-024-01020-z OpenUrl CrossRef PubMed 27. ↵ Yu G , Wang LG , Yan GR , He QY . ( 2015 ) DOSE: an R/Bioconductor package for Disease Ontology Semantic and Enrichment analysis . Bioinformatics , 31 ( 4 ): 608 – 609 OpenUrl CrossRef PubMed Web of Science View the discussion thread. Back to top Previous Next Posted April 19, 2025. Download PDF Supplementary Material Email Thank you for your interest in spreading the word about bioRxiv. NOTE: Your email address is requested solely to identify you as the sender of this article. Your Email * Your Name * Send To * Enter multiple addresses on separate lines or separate them with commas. You are going to email the following Estimating drivers of breast tissue transitions from normal to tumor state Message Subject (Your Name) has forwarded a page to you from bioRxiv Message Body (Your Name) thought you would like to see this page from the bioRxiv website. Your Personal Message CAPTCHA This question is for testing whether or not you are a human visitor and to prevent automated spam submissions. Share Estimating drivers of breast tissue transitions from normal to tumor state Swapnil Kumar , Vaibhav Vindal bioRxiv 2025.04.14.648655; doi: https://doi.org/10.1101/2025.04.14.648655 Share This Article: Copy Citation Tools Estimating drivers of breast tissue transitions from normal to tumor state Swapnil Kumar , Vaibhav Vindal bioRxiv 2025.04.14.648655; doi: https://doi.org/10.1101/2025.04.14.648655 Citation Manager Formats BibTeX Bookends EasyBib EndNote (tagged) EndNote 8 (xml) Medlars Mendeley Papers RefWorks Tagged Ref Manager RIS Zotero Tweet Widget Facebook Like Google Plus One Subject Area Bioinformatics Subject Areas All Articles Animal Behavior and Cognition (7636) Biochemistry (17704) Bioengineering (13898) Bioinformatics (41967) Biophysics (21460) Cancer Biology (18599) Cell Biology (25525) Clinical Trials (138) Developmental Biology (13384) Ecology (19909) Epidemiology (2067) Evolutionary Biology (24326) Genetics (15613) Genomics (22512) Immunology (17740) Microbiology (40423) Molecular Biology (17191) Neuroscience (88645) Paleontology (667) Pathology (2835) Pharmacology and Toxicology (4825) Physiology (7646) Plant Biology (15158) Scientific Communication and Education (2046) Synthetic Biology (4302) Systems Biology (9825) Zoology (2271)
Text is read by the "Ask this paper" AI Q&A widget below.
Extraction quality varies by source — PMC NXML preserves structure
cleanly, OA-HTML may include some navigation residue, and OA-PDF can
have broken hyphenation. The publisher copy
(via DOI)
is the canonical version.