BLOBFISH: Bipartite Limited Subnetworks from Multiple Observations using Breadth-First Search with Constrained Hops

preprint OA: closed CC-BY-NC-ND-4.0
📄 Open PDF Full text JSON View at publisher
Full text 29,280 characters · extracted from preprint-html · click to expand
BLOBFISH: Bipartite Limited Subnetworks from Multiple Observations using Breadth-First Search with Constrained Hops | bioRxiv /* */ /* */ <!-- <!-- /*! * yepnope1.5.4 * (c) WTFPL, GPLv2 */ (function(a,b,c){function d(a){return"[object Function]"==o.call(a)}function e(a){return"string"==typeof a}function f(){}function g(a){return!a||"loaded"==a||"complete"==a||"uninitialized"==a}function h(){var a=p.shift();q=1,a?a.t?m(function(){("c"==a.t?B.injectCss:B.injectJs)(a.s,0,a.a,a.x,a.e,1)},0):(a(),h()):q=0}function i(a,c,d,e,f,i,j){function k(b){if(!o&&g(l.readyState)&&(u.r=o=1,!q&&h(),l.onload=l.onreadystatechange=null,b)){"img"!=a&&m(function(){t.removeChild(l)},50);for(var d in y[c])y[c].hasOwnProperty(d)&&y[c][d].onload()}}var j=j||B.errorTimeout,l=b.createElement(a),o=0,r=0,u={t:d,s:c,e:f,a:i,x:j};1===y[c]&&(r=1,y[c]=[]),"object"==a?l.data=c:(l.src=c,l.type=a),l.width=l.height="0",l.onerror=l.onload=l.onreadystatechange=function(){k.call(this,r)},p.splice(e,0,u),"img"!=a&&(r||2===y[c]?(t.insertBefore(l,s?null:n),m(k,j)):y[c].push(l))}function j(a,b,c,d,f){return q=0,b=b||"j",e(a)?i("c"==b?v:u,a,b,this.i++,c,d,f):(p.splice(this.i++,0,a),1==p.length&&h()),this}function k(){var a=B;return a.loader={load:j,i:0},a}var l=b.documentElement,m=a.setTimeout,n=b.getElementsByTagName("script")[0],o={}.toString,p=[],q=0,r="MozAppearance"in l.style,s=r&&!!b.createRange().compareNode,t=s?l:n.parentNode,l=a.opera&&"[object Opera]"==o.call(a.opera),l=!!b.attachEvent&&!l,u=r?"object":l?"script":"img",v=l?"script":u,w=Array.isArray||function(a){return"[object Array]"==o.call(a)},x=[],y={},z={timeout:function(a,b){return b.length&&(a.timeout=b[0]),a}},A,B;B=function(a){function b(a){var a=a.split("!"),b=x.length,c=a.pop(),d=a.length,c={url:c,origUrl:c,prefixes:a},e,f,g;for(f=0;f<d;f++)g=a[f].split("="),(e=z[g.shift()])&&(c=e(c,g));for(f=0;f<b;f++)c=x[f](c);return c}function g(a,e,f,g,h){var i=b(a),j=i.autoCallback;i.url.split(".").pop().split("?").shift(),i.bypass||(e&&(e=d(e)?e:e[a]||e[g]||e[a.split("/").pop().split("?")[0]]),i.instead?i.instead(a,e,f,g,h):(y[i.url]?i.noexec=!0:y[i.url]=1,f.load(i.url,i.forceCSS||!i.forceJS&&"css"==i.url.split(".").pop().split("?").shift()?"c":c,i.noexec,i.attrs,i.timeout),(d(e)||d(j))&&f.load(function(){k(),e&&e(i.origUrl,h,g),j&&j(i.origUrl,h,g),y[i.url]=2})))}function h(a,b){function c(a,c){if(a){if(e(a))c||(j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}),g(a,j,b,0,h);else if(Object(a)===a)for(n in m=function(){var b=0,c;for(c in a)a.hasOwnProperty(c)&&b++;return b}(),a)a.hasOwnProperty(n)&&(!c&&!--m&&(d(j)?j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}:j[n]=function(a){return function(){var b=[].slice.call(arguments);a&&a.apply(this,b),l()}}(k[n])),g(a[n],j,b,n,h))}else!c&&l()}var h=!!a.test,i=a.load||a.both,j=a.callback||f,k=j,l=a.complete||f,m,n;c(h?a.yep:a.nope,!!i),i&&c(i)}var i,j,l=this.yepnope.loader;if(e(a))g(a,0,l,0);else if(w(a))for(i=0;i (function(w,d,s,l,i){w[l]=w[l]||[];w[l].push({'gtm.start':new Date().getTime(),event:'gtm.js'});var f=d.getElementsByTagName(s)[0];var j=d.createElement(s);var dl=l!='dataLayer'?'&l='+l:'';j.src='//www.googletagmanager.com/gtm.js?id='+i+dl;j.type='text/javascript';j.async=true;f.parentNode.insertBefore(j,f);})(window,document,'script','dataLayer','GTM-M677548'); Skip to main content Home About Submit ALERTS / RSS Search for this keyword Advanced Search New Results BLOBFISH: Bipartite Limited Subnetworks from Multiple Observations using Breadth-First Search with Constrained Hops View ORCID Profile Tara Eicher , Marouen Ben Guebila , View ORCID Profile John Quackenbush doi: https://doi.org/10.1101/2025.03.11.642378 Tara Eicher 1 Department of Biostatistics, T.H. Chan School of Public Health, Harvard University , Boston, MA, 02115, USA Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Tara Eicher Marouen Ben Guebila 1 Department of Biostatistics, T.H. Chan School of Public Health, Harvard University , Boston, MA, 02115, USA Find this author on Google Scholar Find this author on PubMed Search for this author on this site John Quackenbush 1 Department of Biostatistics, T.H. Chan School of Public Health, Harvard University , Boston, MA, 02115, USA 2 Channing Division of Network Medicine, Brigham and Women’s Hospital , Boston, MA, 02115, USA Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for John Quackenbush For correspondence: johnq{at}hsph.harvard.edu Abstract Full Text Info/History Metrics Supplementary material Preview PDF Abstract Summary In analyzing gene regulatory network models, a common question is how members of a particular set of genes are connected. For example, one might want to explore network relationship between a set of differentially expressed genes, a gene set previously reported in the literature, or elements of one or more pathways. BLOBFISH uses a breadth-first search algorithm adapted to bipartite graphs to identify a compact subnetwork connecting the members of a pre-specified set of genes, providing a regulatory context that can shed light on specific mechanisms involved in a phenotype and its development. We demonstrate the use of BLOBFISH to extract gene regulatory subnetworks reflecting tissue specificity using publicly available data from the Genotype Tissue Expression (GTEx) project. Introduction It is common to think of biological states as being defined by specific genetic variants or patterns of expression, but we have come to recognize that the real drivers of phenotypes are complex networks of interacting cellular elements that drive the processes specific to each phenotype and that characterize the transitions between states. There are many tools for inferring networks that represent specific aspects of biological systems and these have proven their value in characterizing the relationships between genes and other entities in the context of understanding phenotypic differences ( Eicher, et al., 2020 ; Weighill, et al., 2021 ). Although unipartite networks such as gene co-expression based on correlations or partial correlations are frequently used ( Langfelder and Horvath, 2008 ), bipartite networks provide the opportunity to identify interactions between different types of cellular elements, including genes and their regulators. Examples of bipartite networks include expression quantitative trait loci (eQTL) networks ( Fagny, et al., 2017 ; Platig, et al., 2016 ), gene regulatory networks (GRNs) ( Glass, et al., 2013 ; Glass, et al., 2013 ; Kuijjer, et al., 2020 ), and multi-omic partial correlation networks ( Eicher, et al., 2023 ; Shutta, et al., 2023 ). Although networks can capture genome-scale interactions, interpreting such results can be challenging, particularly in the context of exploring a hypothesis regarding a subset of genes thought to be relevant to a phenotype under study ( Edge, et al., 2019 ). Interest in examining network relationships between a subset of “interesting” genes has motivated the development of tools to evaluate connectivity between a set of “seed” nodes, including methods based on random walks with restarts ( Chakrabarty, et al., 2021 ; Liao, et al., 2020 ) and Steiner trees ( White and Ma’ayan, 2007 ). However, most subgraph extracting methods have a stochastic component so that multiple applications to the same starting network, or changes in how the network is recorded, may lead to different results. There are also deterministic methods that can identify unique paths connecting seed nodes, including some based on depth-first traversal ( Berger, et al., 2007 ) and shortest paths ( Ho, et al., 2012 ; Keane, et al., 2015 ), but in applications such as drug targeting and pathway analysis, where biological systems often have redundancies, deterministic methods can miss multiple connecting paths that define more biologically relevant patterns of interactivity ( Lee, et al., 2023 ; Ogris, et al., 2022 ). A key hypothesis in network analysis is that networks not only differ between phenotypes but also vary among individuals within any specific phenotypic group. Methods such LIONESS ( Kuijjer, et al., 2019 ), BONOBO ( Saha, et al., 2023 ), and SWEET ( Chen, et al., 2023 ), used in conjunction with other methods, can infer networks for each individual in a population and there are a number of methods that can be used to for single-cell specific network inference (such as those reviewed by Pratapa et al. ( Pratapa, et al., 2020 )). This suggests that a useful strategy in mapping subnetworks connecting genes would be to identify robust edges that are consistent across individuals, providing greater confidence in the identified connectivity between genes. Approach We developed BLOBFISH ( B ipartite L imited Subnetworks from Multiple O bservations using B readth- Fi rst S earch with Constrained H ops) to find a robust subnetwork connecting a seed set of nodes in collections of individual sample bipartite networks to find patterns of connection consistent across observations. Conceptually, BLOBFISH is based on the idea that each node in a bipartite graph has a sphere of influence that can be obtained using breadth-first search with a user-defined constraint on the number of allowed hops between nodes such that the connectivity between two nodes represents paths to shared nodes within each node’s sphere of influence. This allows multiple paths to connect individual nodes in a way that mirrors the redundancy and shared functionality of genes known to exist in biological networks. To provide confidence in the resulting subnetworks, BLOBFISH requires that all edges in the subnetwork must have statistically significant weights when compared against a null model. Because BLOBFISH operates on bipartite graphs, all connecting paths can be found by evaluating only shared nodes equidistant from a pair of seed nodes (see Theorem 1 in Supplementary File 1). By making use of this property in addition to being deterministic, BLOBFISH provides runtime advantages over a naïve exploration of all possible paths across spheres of influence. The BLOBFISH algorithm is described as pseudocode in Supplementary File 1 together with analysis of some of its performance characteristics. BLOBFISH takes as input a collection of gene regulatory networks derived by applying a specific GRN inference method to an experimental dataset and a null network distribution by using multiple randomizations of the expression levels (or other biological measurements) and using the same network inference method to generate a collection of network models. BLOBFISH analyzes the collection of individual-sample network graphs and, for a set of seed genes, and first uses the Wilcoxon rank-sum test to estimate the significance of the inferred regulatory edges by comparing these to the null network; edges that are significant (based on a user-defined sphere of influence parameter, α, set by default to 2) are retained in a reduced network model. BLOBFISH uses a breadth-first search (BFS) to identify neighborhoods for each gene in the reduced network. BFS explores gene nodes and regulatory edges connecting them systematically starting from each of the seed genes. It explores all neighbors of the current node before moving to the next level of neighbors, ensuring that all nodes are visited in order of their distance from the source, resulting in a sphere of influence for each gene based on a user-determined parameter. The algorithm then finds all possible paths connecting the genes based on the overlap of the collective spheres of influence to create more or more subnetworks connecting the seed gene set. BLOBFISH is integrated into the netZooR R package (v1.6) ( https://github.com/netZoo/netZooR ) ( Ben Guebila, et al., 2023 ) and can be run using a call to the function RunBLOBFISH (). The additional functions PlotNetwork () and GenerateNullPANDADistribution () support plotting the subnetwork and generating the null distribution for bipartite networks generated using PANDA’s message-passing framework or those of its related methods ( Glass, et al., 2013 ; Kuijjer, et al., 2020 ; Osorio, et al., 2024 ; Sonawane, et al., 2021 ; Weighill, et al., 2022 ); the latter function could be easily modified to use other network inference methods. BLOBFISH depends on the R packages igraph and matrixTests . The script used in our analysis is available from https://github.com/QuackenbushLab/BLOBFISH_paper_scripts . Results As a test of BLOBFISH, we downloaded from the GRAND database ( Ben Guebila, et al., 2022 ) GRN models that had been inferred by applying PANDA+LIONESS to GTEx data ( Lonsdale, et al., 2013 ; Lopes-Ramos, et al., 2020 ) for five tissues (subcutaneous adipose, skeletal muscle, lung tissue, skin, and aorta). To minimize influence of age and biological sex on the gene regulatory networks, we used only networks generated for males between the ages of 20-29, resulting in n = 18 for subcutaneous adipose, n = 27 for skeletal muscle, n = 15 for lung tissue, n = 31 for skin, and n = 15 for aorta. We used 26 genes reported to be typical of skeletal muscle by Bortoluzzi et al ( Bortoluzzi, et al., 2000 ) and seven genes involved in adipogenesis ( Ou-yang and Dai, 2023 ) as seed gene sets (available in Supplementary Tables 1 and 2). We ran BLOBFISH using both the skeletal muscle and adipogenesis seed gene sets on each tissue-specific collection of bipartite gene regulatory networks using a null distribution generated using GenerateNullPANDADistribution (), α = 0.05, and a hop constraint of 2 (restricting paths between seed genes to contain a single transcription factor; full subnetworks can be found in Supplementary Tables 3-7). This provides both positive and negative controls that can be used to assess BLOBFISH’s performance. To evaluate only the tissue-specific connectivity between genes in the seed set and exclude connectivity shared between tissues, we retained only edges that were exclusive to each tissue type’s subnetwork. The results can be found in Supplementary Tables 8-12. To assess the significance of the connectivity we found among gene sets associated with skeletal muscle development and adipogenesis in the relevant tissues, we used BLOBFISH to assess these and 100 random sets of 33 (26 + 7) genes in all five tissues for which we had network models. We expect that few if any genes are expressed in only a single tissue and many genes are expressed in a large number of tissues; indeed, for each set of seed genes, we found subnetworks linking some subset of those seed genes in each of the five tissues in nearly every iteration. But we also expect phenotype-specific sets of genes to be highly connected in the relevant tissue since the some level of coordinated regulation of these genes defines, or is defined by, that tissue. Consistent with this, the mean count of transcription factors co-regulating each pair of skeletal-muscle-associated genes was highest in the skeletal-muscle-specific subnetwork and that the mean count of transcription factors co-regulating each pair of adipogenesis-associated genes was highest in the subcutaneous-adipose-specific subnetwork ( Figure 1 and Table 1 ; see Supplementary Figure 1 for the other tissue-specific subnetworks). Further, in the relevant tissue, the mean counts for tissue-specific gene sets were considerably higher (with statistically significant Z-scores) than the mean counts obtained from the random gene sets. In contrast, the transcription factor connectivity for the same adipose and muscle gene sets were essentially at background levels in lung, skin, and aorta based on the distributions for random gene sets. This suggests that BLOBFISH can extract meaningful regulatory subnetwork connections between a tissue- or disease-specific set of genes when applied to gene regulatory networks inferred in a relevant tissue using PANDA+LIONESS. Download figure Open in new tab Figure 1. Tissue-specific gene regulatory subnetworks for GTEx skeletal muscle samples for males 20-29 in (A) subcutaneous adipose and (B) skeletal muscle reveal more co-regulatory connections between skeletal-muscle-associated genes (pink) in skeletal muscle and more co-regulatory connections between adipogenesis-associated genes (gold) in subcutaneous adipose. View this table: View inline View popup Download powerpoint Table 1. The mean number of transcription factors co-regulating skeletal-muscle-associated and adipogenesis-associated genes in each tissue, compared to the mean number of transcription factors co-regulating random subsets of genes. Beyond the tissue specificity we found for connected subnetworks of tissue-relevant gene sets, one would expect that the additional genes connected to the seed set found by BLOBFISH might further help explain the phenotype that the input gene set was meant to capture. To test this, we took the BLOBFISH subnetworks for each tissue generated using the combined skeletal muscle and adipogenesis genes as seeds, and for each performed pre-ranked gene set enrichment analysis on the transcription factors and genes using the fgsea R package ( Korotkevich, et al., 2021 ) with FDR -adjusted p -value < 0.05 and gene sets from the Molecular signatures Database (MSigDB, version 2023.2) ( Liberzon, et al., 2015 ; Subramanian, et al., 2005 ); the number of edges adjacent to each transcription factor or gene was used as the input ranking score. We then compared these results to pathways enriched in each tissue using the log 2 (fold change) of the expression levels of the seed as input. The only functional class that was enriched in the subcutaneous adipose tissue subnetwork was adipogenesis, but this was not surprising given the small number of adipogenesis-relevant genes in the input (seven). In comparison, pathway analysis using expression of the seed resulted in enrichment of PPAR signaling, one step in adipogenesis ( Ghaben and Scherer, 2019 ). In the skeletal muscle network subnetwork seeded by twenty-six genes, we found enrichment for both muscle contraction and Parkinson’s Disease pathways, whereas no pathways were enriched using gene expression data for this the seed set. Impaired skeletal muscle function is a hallmark of Parkinson’s Disease ( Murphy and Lynch, 2023 ), this result provides further evidence that BLOBFISH can use tissue-specific gene regulatory networks to aggregate sets of genes linked through common regulators that share a common biological function. The results for all tissues are presented in Supplementary Tables 13-17 (for network-based analysis) and 18-21 (for expression-based analysis). Discussion A frequent question in the analysis of any biologically interesting phenotype is how subsets of genes previously identified as relevant interact with each other within the context of the regulatory processes that ultimately define each biological state. Methods that attempt to connect genes within those subsets, including methods using correlation analysis, fail to provide information on the broader regulatory context in which these genes exist. Genome-wide gene regulatory network inference can provide a broader context, but interpreting the complex connections within those networks can be challenging. BLOBFISH simplifies the problem of subnetwork identification and interpretation by using gene regulatory network models to find a minimal set of genes and transcription factors linking the elements of a candidate gene set. As such, BLOBFISH complements more general network methods such as degree-based analyses, differential targeting analysis, and statistical comparisons of network edge weights; it fills an important methodological gap by extracting meaningful subnetworks in a way that balances the generalizability of genome-wide networks with the interpretability of a focused set of regulatory processes. Acknowledgements This work was supported by the National Institutes of Health [R01HG011393, R35CA220523]. We thank Enakshi Saha, Kate Hoff-Shutta, and Kimberly Glass for support in the formulation of the null model for LIONESS networks and Viola Fanfani for support in data acquisition. Footnotes Availability and Implementation Source code is available from GitHub as part of the netZooR R package (v1.6) ( https://github.com/netZoo/netZooR ) ( Ben Guebila, et al., 2023 ). Contact johnq{at}hsph.harvard.edu References 1. ↵ Ben Guebila , M. , et al. GRAND: a database of gene regulatory network models across human conditions . Nucleic Acids Research 2022 ; 50 ( D1 ): D610 – D621 . OpenUrl CrossRef PubMed 2. ↵ Ben Guebila , M. , et al. The Network Zoo: a multilingual package for the inference and analysis of gene regulatory networks . Genome Biol 2023 ; 24 ( 1 ): 45 . OpenUrl CrossRef PubMed 3. ↵ Berger , S.I. , Posner , J.M. and Ma’ayan , A. Genes2Networks: connecting lists of gene symbols using mammalian protein interactions databases . BMC Bioinformatics 2007 ; 8 ( 1 ). 4. ↵ Bortoluzzi , S. , et al. The Human Adult Skeletal Muscle Transcriptional Profile Reconstructed by a Novel Computational Approach . Genome Research 2000 ; 10 ( 3 ): 344 – 349 . OpenUrl Abstract / FREE Full Text 5. ↵ Chakrabarty , B. , et al. Network-Based Analysis of Fatal Comorbidities of COVID-19 and Potential Therapeutics . IEEE/ACM Transactions on Computational Biology and Bioinformatics 2021 ; 18 ( 4 ): 1271 – 1280 . OpenUrl CrossRef 6. ↵ Chen , H.H. , et al. SWEET: a single-sample network inference method for deciphering individual features in disease . Brief Bioinform 2023 ; 24 ( 2 ). 7. ↵ Edge , D. , et al. Trimming the Hairball: Edge Cutting Strategies for Making Dense Graphs Usable . In, GTA3 20: The 2nd IEEE Big Data Workshop on Grpah Techniques for Adversarial Activity Analytics . Institute of Electrical and Electronics Engineers Inc .; 2019 . p. 3951 – 3958 . 8. ↵ Eicher , T. , et al. Metabolomics and Multi-Omics Integration: A Survey of Computational Methods and Resources . Metabolites 2020 ; 10 : 202 . OpenUrl CrossRef PubMed 9. ↵ Eicher , T. , et al. IntLIM 2.0: identifying multi-omic relationships dependent on discrete or continuous phenotypic measurements . Bioinformatics Advances 2023 ; 3 ( 1 ): vbad009 . OpenUrl 10. ↵ Fagny , M. , et al. Exploring regulation in tissues with eQTL networks . Proc Natl Acad Sci U S A 2017 ; 114 ( 37 ): E7841 – E7850 . OpenUrl Abstract / FREE Full Text 11. ↵ Ghaben , A.L. and Scherer , P.E. Adipogenesis and metabolic health . Nature Revies Molecular Cell Biology 2019 ; 20 ( 4 ): 242 – 258 . OpenUrl CrossRef 12. ↵ Glass , K. , et al. Passing Messages between Biological Networks to Refine Predicted Interactions . PLoS ONE 2013 ; 8 ( 5 ). 13. Glass , K. , et al. Passing messages between biological networks to refine predicted interactions . PLoS One 2013 ; 8 ( 5 ): e64832 . OpenUrl CrossRef PubMed 14. ↵ Ho , P.L. , et al. Identification of Colorectal Cancer Related Genes with mRMR and Shortest Path in Protein-Protein Interaction Network . PLoS ONE 2012 ; 7 ( 4 ). 15. ↵ Keane , H. , et al. Protein-protein interaction networks identify targets which rescue the MPP+ cellular model of Parkinson’s disease . Scientific Reports 2015 ; 5 ( 1 ). 16. ↵ Korotkevich , G. , et al. An algorithm for fast preranked gene set enrichment analysis using cumulative statistic calculation . BioRXiv 2021 . 17. ↵ Kuijjer , M.L. , et al. PUMA: PANDA Using MicroRNA Associations . Bioinformatics 2020 ; 36 ( 18 ): 4765 – 4773 . OpenUrl CrossRef PubMed 18. ↵ Kuijjer , M.L. , et al. lionessR: single sample network inference in R . BMC Cancer 2019 ; 19 ( 1 ). 19. ↵ Langfelder , P. and Horvath , S. WGCNA: an R package for weighted correlation network analysis . BMC Bioinformatics 2008 ; 9 : 559 . OpenUrl CrossRef PubMed 20. ↵ Lee , C.W. , et al. Relationship between drug targets and drug-signature networks: a network-based genome-wide landscape . BMC Medical Genomics 2023 ; 16 ( 1 ). 21. ↵ Liao , F. , et al. RWR-algorithm-based dissection of microRNA-506-3p and microRNA140-5p as radiosensitive biomarkers in colorectal cancer . Aging 2020 ; 12 ( 20 ): 20512 – 20522 . OpenUrl CrossRef PubMed 22. ↵ Liberzon , A. , et al. The Molecular Signatures Database Hallmark Gene Set Collection . Cell Systems 2015 ; 1 ( 6 ): 417 – 425 . OpenUrl CrossRef PubMed 23. ↵ Lonsdale , J. , et al. The Genotype-Tissue Expression (GTEx) project . Nature Genetics 2013 ; 45 ( 6 ): 580 – 585 . OpenUrl CrossRef PubMed 24. ↵ Lopes-Ramos , C.M. , et al. Sex Differences in Gene Expression and Regulatory Networks across 29 Human Tissues . Cell Rep 2020 ; 31 ( 12 ): 107795 . OpenUrl CrossRef PubMed 25. ↵ Murphy , K.T. and Lynch , G.S. Impaired skeletal muscle health in Parkinsonian syndromes: clinical implications, mechanisms and potential treatments . Journal of Cachexia, Sarcopenia and Muscle 2023 ; 14 ( 5 ): 1987 – 2002 . OpenUrl CrossRef 26. ↵ Ogris , C. , et al. PathwAX II: network-based pathway analysis with interactive visualization of network crosstalk . Bioinformatics 2022 ; 38 ( 9 ): 2659 – 2660 . OpenUrl CrossRef PubMed 27. ↵ Osorio , D. , et al. Population-level comparisons of gene regulatory networks modeled on high-throughput single-cell transcriptomics data . Nature Computational Science 2024 ; 4 ( 3 ): 237 – 250 . OpenUrl CrossRef PubMed 28. ↵ Ou-yang , Y. and Dai , M.-m. Screening for genes, miRNAs and transcription factors of adipogenic differentiation and dedifferentiation of mesenchymal stem cells . Journal of Orthopaedic Surgery and Research 2023 ; 18 ( 1 ). 29. ↵ Platig , J. , et al. Bipartite Community Structure of eQTLs . PLoS computational biology 2016 ; 12 ( 9 ): e1005033 . OpenUrl CrossRef 30. ↵ Pratapa , A. , et al. Benchmarking algorithms for gene regulatory network inference from single-cell transcriptomic data . Nature Methods 2020 ; 17 ( 2 ): 147 – 154 . OpenUrl CrossRef PubMed 31. ↵ Saha , E. , et al. Bayesian Optimized sample-specific Networks Obtained By Omics data (BONOBO) . BioRXiv 2023 . 32. ↵ Shutta , K.H. , et al. DRAGON: Determining Regulatory Associations using Graphical models on multi-Omic Networks . Nucleic Acids Res 2023 ; 51 ( 3 ): e15 . OpenUrl CrossRef PubMed 33. ↵ Sonawane , A.R. , et al. Constructing gene regulatory networks using epigenetic data . npj Systems Biology and Applications 2021 ; 7 ( 1 ). 34. ↵ Subramanian , A. , et al. Gene set enrichment analysis: A knowledge-based approach for interpreting genome-wide expression profiles . Proceedings of the National Academy of Sciences 2005 ; 102 ( 43 ). 35. ↵ Weighill , D. , et al. Gene Targeting in Disease Networks . Frontiers in Genetics 2021 ; 12 . 36. ↵ Weighill , D. , et al. Predicting genotype-specific gene regulatory networks . Genome Research 2022 ; 32 ( 3 ): 524 – 533 . OpenUrl Abstract / FREE Full Text 37. ↵ White , A.G. and Ma’ayan , A. Connecting Seed Lists of Mammalian Proteins Using Steiner Trees . In, Forty-First Asilomar Conference on Signals, Systems and Computers . IEEE ; 2007 . View the discussion thread. Back to top Previous Next Posted March 13, 2025. Download PDF Supplementary Material Email Thank you for your interest in spreading the word about bioRxiv. NOTE: Your email address is requested solely to identify you as the sender of this article. Your Email * Your Name * Send To * Enter multiple addresses on separate lines or separate them with commas. You are going to email the following BLOBFISH: Bipartite Limited Subnetworks from Multiple Observations using Breadth-First Search with Constrained Hops Message Subject (Your Name) has forwarded a page to you from bioRxiv Message Body (Your Name) thought you would like to see this page from the bioRxiv website. Your Personal Message CAPTCHA This question is for testing whether or not you are a human visitor and to prevent automated spam submissions. Share BLOBFISH: Bipartite Limited Subnetworks from Multiple Observations using Breadth-First Search with Constrained Hops Tara Eicher , Marouen Ben Guebila , John Quackenbush bioRxiv 2025.03.11.642378; doi: https://doi.org/10.1101/2025.03.11.642378 Share This Article: Copy Citation Tools BLOBFISH: Bipartite Limited Subnetworks from Multiple Observations using Breadth-First Search with Constrained Hops Tara Eicher , Marouen Ben Guebila , John Quackenbush bioRxiv 2025.03.11.642378; doi: https://doi.org/10.1101/2025.03.11.642378 Citation Manager Formats BibTeX Bookends EasyBib EndNote (tagged) EndNote 8 (xml) Medlars Mendeley Papers RefWorks Tagged Ref Manager RIS Zotero Tweet Widget Facebook Like Google Plus One Subject Area Bioinformatics Subject Areas All Articles Animal Behavior and Cognition (7616) Biochemistry (17625) Bioengineering (13850) Bioinformatics (41823) Biophysics (21396) Cancer Biology (18524) Cell Biology (25416) Clinical Trials (138) Developmental Biology (13350) Ecology (19858) Epidemiology (2067) Evolutionary Biology (24277) Genetics (15579) Genomics (22457) Immunology (17698) Microbiology (40278) Molecular Biology (17134) Neuroscience (88397) Paleontology (666) Pathology (2823) Pharmacology and Toxicology (4811) Physiology (7631) Plant Biology (15106) Scientific Communication and Education (2042) Synthetic Biology (4281) Systems Biology (9807) Zoology (2265)

Text is read by the "Ask this paper" AI Q&A widget below. Extraction quality varies by source — PMC NXML preserves structure cleanly, OA-HTML may include some navigation residue, and OA-PDF can have broken hyphenation. The publisher copy (via DOI) is the canonical version.

My notes (saved in your browser only)

Ask this paper AI returns verbatim quotes from the full text · source: preprint-html

Answers must be backed by verbatim quotes from this paper's full text. Hallucinated quotes are dropped automatically; if no verbatim passage answers the question, we say so. How this works

Citation neighborhood (no data yet)

We don't have any in-corpus citations linked to this paper yet. This is a recent paper (2025) — citers typically take a year or two to land, and the OpenAlex reference graph may still be filling in.

Source provenance

europepmc
last seen: 2026-05-20T01:45:00.602351+00:00
unpaywall
last seen: 2026-05-24T02:00:01.246996+00:00
License: CC-BY-NC-ND-4.0