DESeq2-MultiBatch: Batch Correction for Multi-Factorial RNA-seq Experiments

preprint OA: closed
📄 Open PDF Full text JSON View at publisher
Full text 28,081 characters · extracted from preprint-html · click to expand
DESeq2-MultiBatch: Batch Correction for Multi-Factorial RNA-seq Experiments | bioRxiv /* */ /* */ <!-- <!-- /*! * yepnope1.5.4 * (c) WTFPL, GPLv2 */ (function(a,b,c){function d(a){return"[object Function]"==o.call(a)}function e(a){return"string"==typeof a}function f(){}function g(a){return!a||"loaded"==a||"complete"==a||"uninitialized"==a}function h(){var a=p.shift();q=1,a?a.t?m(function(){("c"==a.t?B.injectCss:B.injectJs)(a.s,0,a.a,a.x,a.e,1)},0):(a(),h()):q=0}function i(a,c,d,e,f,i,j){function k(b){if(!o&&g(l.readyState)&&(u.r=o=1,!q&&h(),l.onload=l.onreadystatechange=null,b)){"img"!=a&&m(function(){t.removeChild(l)},50);for(var d in y[c])y[c].hasOwnProperty(d)&&y[c][d].onload()}}var j=j||B.errorTimeout,l=b.createElement(a),o=0,r=0,u={t:d,s:c,e:f,a:i,x:j};1===y[c]&&(r=1,y[c]=[]),"object"==a?l.data=c:(l.src=c,l.type=a),l.width=l.height="0",l.onerror=l.onload=l.onreadystatechange=function(){k.call(this,r)},p.splice(e,0,u),"img"!=a&&(r||2===y[c]?(t.insertBefore(l,s?null:n),m(k,j)):y[c].push(l))}function j(a,b,c,d,f){return q=0,b=b||"j",e(a)?i("c"==b?v:u,a,b,this.i++,c,d,f):(p.splice(this.i++,0,a),1==p.length&&h()),this}function k(){var a=B;return a.loader={load:j,i:0},a}var l=b.documentElement,m=a.setTimeout,n=b.getElementsByTagName("script")[0],o={}.toString,p=[],q=0,r="MozAppearance"in l.style,s=r&&!!b.createRange().compareNode,t=s?l:n.parentNode,l=a.opera&&"[object Opera]"==o.call(a.opera),l=!!b.attachEvent&&!l,u=r?"object":l?"script":"img",v=l?"script":u,w=Array.isArray||function(a){return"[object Array]"==o.call(a)},x=[],y={},z={timeout:function(a,b){return b.length&&(a.timeout=b[0]),a}},A,B;B=function(a){function b(a){var a=a.split("!"),b=x.length,c=a.pop(),d=a.length,c={url:c,origUrl:c,prefixes:a},e,f,g;for(f=0;f<d;f++)g=a[f].split("="),(e=z[g.shift()])&&(c=e(c,g));for(f=0;f<b;f++)c=x[f](c);return c}function g(a,e,f,g,h){var i=b(a),j=i.autoCallback;i.url.split(".").pop().split("?").shift(),i.bypass||(e&&(e=d(e)?e:e[a]||e[g]||e[a.split("/").pop().split("?")[0]]),i.instead?i.instead(a,e,f,g,h):(y[i.url]?i.noexec=!0:y[i.url]=1,f.load(i.url,i.forceCSS||!i.forceJS&&"css"==i.url.split(".").pop().split("?").shift()?"c":c,i.noexec,i.attrs,i.timeout),(d(e)||d(j))&&f.load(function(){k(),e&&e(i.origUrl,h,g),j&&j(i.origUrl,h,g),y[i.url]=2})))}function h(a,b){function c(a,c){if(a){if(e(a))c||(j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}),g(a,j,b,0,h);else if(Object(a)===a)for(n in m=function(){var b=0,c;for(c in a)a.hasOwnProperty(c)&&b++;return b}(),a)a.hasOwnProperty(n)&&(!c&&!--m&&(d(j)?j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}:j[n]=function(a){return function(){var b=[].slice.call(arguments);a&&a.apply(this,b),l()}}(k[n])),g(a[n],j,b,n,h))}else!c&&l()}var h=!!a.test,i=a.load||a.both,j=a.callback||f,k=j,l=a.complete||f,m,n;c(h?a.yep:a.nope,!!i),i&&c(i)}var i,j,l=this.yepnope.loader;if(e(a))g(a,0,l,0);else if(w(a))for(i=0;i (function(w,d,s,l,i){w[l]=w[l]||[];w[l].push({'gtm.start':new Date().getTime(),event:'gtm.js'});var f=d.getElementsByTagName(s)[0];var j=d.createElement(s);var dl=l!='dataLayer'?'&l='+l:'';j.src='//www.googletagmanager.com/gtm.js?id='+i+dl;j.type='text/javascript';j.async=true;f.parentNode.insertBefore(j,f);})(window,document,'script','dataLayer','GTM-M677548'); Skip to main content Home About Submit ALERTS / RSS Search for this keyword Advanced Search New Results DESeq2-MultiBatch: Batch Correction for Multi-Factorial RNA-seq Experiments View ORCID Profile Julien Roy , View ORCID Profile Adrian S. Monthony , View ORCID Profile Davoud Torkamaneh doi: https://doi.org/10.1101/2025.04.20.649392 Julien Roy 1 Département de phytologie, Université Laval , Québec City, Québec, Canada 2 Institut de Biologie Intégrative et des Systèmes (IBIS), Université Laval , Québec, Canada 3 Centre de recherche et d’innovation sur les végétaux (CRIV), Université Laval , Québec, Canada 4 Institut intelligence et données (IID), Université Laval , Québec, Canada Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Julien Roy Adrian S. Monthony 1 Département de phytologie, Université Laval , Québec City, Québec, Canada 2 Institut de Biologie Intégrative et des Systèmes (IBIS), Université Laval , Québec, Canada 3 Centre de recherche et d’innovation sur les végétaux (CRIV), Université Laval , Québec, Canada 4 Institut intelligence et données (IID), Université Laval , Québec, Canada Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Adrian S. Monthony Davoud Torkamaneh 1 Département de phytologie, Université Laval , Québec City, Québec, Canada 2 Institut de Biologie Intégrative et des Systèmes (IBIS), Université Laval , Québec, Canada 3 Centre de recherche et d’innovation sur les végétaux (CRIV), Université Laval , Québec, Canada 4 Institut intelligence et données (IID), Université Laval , Québec, Canada Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Davoud Torkamaneh For correspondence: davoud.torkamaneh.1{at}ulaval.ca Abstract Full Text Info/History Metrics Supplementary material Data/Code Preview PDF Summary RNA sequencing (RNA-seq) experiments frequently encounter batch effects that can significantly distort biological interpretations, particularly in complex, multifactorial studies where biological variables interact with experimental batch conditions. Existing batch correction tools primarily address technical variability and often neglect these critical interaction effects, resulting in incomplete adjustments. To address this gap, we introduce DESeq2-MultiBatch, a novel, lightweight batch correction method implemented entirely within the DESeq2 analytical framework. Unlike conventional approaches, DESeq2-MultiBatch directly leverages DESeq2’s internal model estimates to correct raw gene count data, accurately adjusting for experimental batch effects, including interactions with biological variables. Here, we demonstrate that DESeq2-MultiBatch effectively mitigates batch-related variability while preserving genuine biological differences. Benchmarking against widely used methods highlights DESeq2-MultiBatch as a robust, practical solution for improving exploratory data visualization and downstream analyses in multifactorial RNA-seq studies. Availability and implementation https://github.com/julienroyulaval/DESeq2-MultiBatch Contact julien.roy.10{at}ulaval.ca Supplementary information Supplementary data are available at Bioinformatics online. Introduction RNA sequencing (RNA-seq) has emerged as an indispensable tool in modern biology, enabling detailed analyses of gene regulation, cellular processes, and organismal responses under diverse biological conditions ( Stark, Grzelak and Hadfield 2019 ). Various computational frameworks have been developed to process RNA-seq data, each employing different statistical and bioinformatics strategies ( Costa-Silva et al. 2021 ). However, RNA-seq experiments frequently encounter batch effects, defined as sub-groups of measurements showing qualitatively different behavior across conditions due to unwanted technical variability or non-biological differences introduced during experimental preparation, sequencing, or data processing ( Goh, Wang and Wong 2017 , Leek et al. 2010 ). Although careful experimental design can mitigate these effects, practical constraints frequently necessitate multi-batch studies, making complete avoidance challenging ( Van Den Berge et al., 2019 ; Ye et al., 2023). To date, several computational strategies have been developed to address batch effects, primarily by integrating a batch factor into models of gene expression. Simple linear models, such as mean-scaling and zero-centering, fall under this class (Goh, Wang and Wong 2017). The empirical Bayes algorithm (e.g., ComBat) was among the first widely-adopted methods, effectively normalizing additive and multiplicative batch effects ( Johnson et al. 2007 ). Limma, a popular package for gene expression analysis, incorporates batch-effect removal directly into its linear model framework, streamlining analyses ( Ritchie et al. 2015 ). Recently, ComBat-seq extended the original ComBat algorithm specifically for RNA-seq data, using negative binomial regression to better handle count data typical of RNA-seq experiments ( Zhang, Parmigiani and Johnson 2020 ). Additionally, surrogate variable analysis (SVA) offers another approach by identifying part of the data associated with batch variation, estimating the effect with singular value decomposition and removing it from data via regression ( Leek 2014 , Leek and Storey 2007 ). Most recently, machine learning-based approaches have also been integrated into batch-effect detection and correction workflows, demonstrating promising results in complex scenarios ( Sprang, Andrade-Navarro and Fontaine 2022 ). Performance assessments of existing batch correction methods, conducted with both real and simulated datasets, highlight their effectiveness as highly context-dependent ( Chen et al. 2011 , Liu and Markatou 2016 ). Although many algorithms are robust to moderately confounded experimental designs, their effectiveness diminishes significantly when biological factors and batches are highly confounded, potentially leading to the loss of true biological signals ( Molania et al. 2023 , Zhou, Chi-Hau Sue and Bin Goh 2019 ). Furthermore, batch-correction techniques modifying raw count data require careful application, as they can inadvertently mask genuine biological differences, particularly in unbalanced experimental designs ( Nygaard, Rødland and Hovig 2016 ). Most existing batch correction evaluations have utilized medical or clinical datasets, thus limiting their applicability to non-model species (i.e., plants), where broader experimental designs are commonplace. RNA-seq studies in plants often involve additional layers of complexity due to physiological and environmental variables such as growth stages, genotypic differences, environmental fluctuations (e.g., temperature, humidity, and photoperiod), seasonal variations, and soil composition, each potentially interacting uniquely with batch effects. For instance, dioecious plants (e.g., XX/XY system) may exhibit sex-specific responses to environmental batch conditions, complicating effective batch correction and emphasizing the need for biologically informed experimental designs ( Dale et al. 2021 , Upton et al. 2023 ). In recent years, DESeq2 (Love et al., 2014) has become one of the most widely used tools in RNA-seq analyses. It inherently accounts for batch effects directly within its modeling framework during differential expression analysis, making it unnecessary to correct count data before modeling. This approach has the advantage of preserving raw gene expression values, ensures the interpretability of biological signals and minimizes potential distortions associated with data transformation. However, in numerous analytical workflows — particularly those involving exploratory data visualization, clustering analyses, or dimensionality reduction techniques— batch-corrected expression values are desirable, as they significantly enhance interpretability and comparability among samples. Such downstream tasks often perform best with input data where batch-induced variations have already been mitigated. To address this requirement, we present a novel batch correction method that leverages DESeq2’s internal model-based estimates to directly adjust raw count data, without relying on external correction tools or complex transformations. This approach preserves the integrity of log-fold changes between biological conditions and offers flexibility for handling complex experimental designs. Specifically, our approach effectively accommodates interaction effects, even in scenarios characterized by imbalanced or highly confounded settings. As a result, this facilitates improved data analysis and visualization, while maintaining compatibility with standard DESeq2 workflows. Implementation The simulated dataset used in this study consists of 1,000 genes across 48 samples. The dataset is designed to be computationally efficient, with confirmed scalability to larger real-life datasets. The experimental design involves two batches, modeling gene expression in dioecious plants undergoing sex-specific treatments at two distinct time points: Day 0 (vegetative) and Day 1 (early flowering). Due to sex-specific treatments to alter flower sex, male and female plants were separated across batches: Batch 1 contained female controls (n=6) and treated males (n=6), while Batch 2 included male controls (n=6) and treated females (n=6). The treatments were applied following day 0 measurements but before day 1 measurements, allowing day 0 data to serve as a baseline for controlling batch effects. Samples (n=48) were collected across two genotypes, with three biological replicates per combination of sex, treatment, genotype and time point. Two design models were implemented for batch correction analyses: a single-batch correction design ( ~ sex + day + batch + sex:day + treatment ) and a double-batch correction design ( ~ sex + day + batch + sex:day + sex:batch + treatment ). An additional, more complex model incorporating interacting factors ( ~ sex + day + batch + genotype + sex:day + sex:batch + treatment + treatment:genotype ) was also designed. Log 2 fold changes (LFC) calculated from DESeq2 were utilized to perform single and double-batch corrections, adjusting the expression levels to balance batch effects without biasing towards any specific batch. For single-batch correction, original counts for gene i , with batches A and B and days d ∈ {0, 1}, are defined as and . The DESeq2-estimated LFC between batches at day 0 is represented as LFG o . Adjusted counts for each time point, mitigating batch effects estimated at day 0, are calculated as: For double-batch correction, for any gene i , in male ( m ) or female ( f ) samples, batches labelled A and B and the days indexed as d ∈ {0, 1}, original (unadjusted) counts are defined as follows: for female samples, and and for male samples. DESeq2-estimated LFC between batches at day 0 are represented as for females and for males. To independently adjust counts for sexes at each time point, mitigating batch effects estimated at day 0, adjusted counts are calculated as: Female samples: Male samples: The GitHub repository ( https://github.com/julienroyulaval/DESeq2-MultiBatch ) provides detailed recommendations and practical strategies for performing DESeq2 analyses with complex experimental designs. It includes specific guidance on constructing design matrices, addressing imbalanced datasets, defining appropriate contrasts, and conducting multi-factorial analyses with illustrative examples. Performance of batch correction method was benchmarked against limma’s removeBatchEffects (v. 3.58.1) ( Ritchie et al. 2015 ) and ComBat-Seq (v. 3.50.0) ( Zhang, Parmigiani and Johnson 2020 ) through principal components analysis (PCA) plots (ggplot2 version 3.5.1) ( Wickham 2016 ) and heatmaps (pheatmap version 1.0.12) ( Raivo Kolde 2010 ), in double-batch correction designs ( Figure 1 , Supplementary Figures 1). All analyses were performed in RStudio (v2024.9.0.375) running R (v4.3.1). Download figure Open in new tab Fig. 1: (A) PCA plots at day 0 of uncorrected, single batch corrected, and double batch corrected data using DESeq2-MultiBatch. (B) Heatmaps of nine highly batch-affected genes in uncorrected, single batch corrected, and double batch corrected data using DESeq2-MultiBatch, with Gene 078 framed. (C) Gene expression counts for G078 in uncorrected, single batch corrected, and double batch corrected data using DESeq2-MultiBatch, ( eq.1 - 6 ) shown as arrows. (D-F) PCA plots comparing batch correction (day 0 and day 1) using DESeq2-MultiBatch, limma’s removeBatchEffects, and ComBat-seq. Results Analyses of the simulated dataset from dioecious plants showed substantial batch in uncorrected data at day 0 ( Figure 1A , Supplementary Figure 2 for all uncorrected data), primarily resulting from the experimental design. Application of single batch correction ( eq. 1 and eq. 2 ) significantly reduced batch-induced variation; however, residual differences among biologically identical groups remained evident, as demonstrated by distinct clusters, highlighting persistent batch and sex interactions ( Figure 1A ). In contrast, the sex-dependent batch-correction method, explicitly accounting for these interactions, significantly improved the clustering of biologically identical groups, effectively removing batch-associated variation while preserving inherent biological variability within-groups ( Figure 1A ). Post-correction analysis confirmed a complete elimination of differentially expressed genes between batches at day 0, separately for both males and females. Heatmap analyses of eight highly batch-affected genes further quantified correction effectiveness. Prior to any correction, clear batch-related expression patterns were observed ( Figure 1B ). Single batch correction partially reduced this variation but did not eliminate discrepancies among same-sex groups, for example in G078, which is highly affected by sex and batch interactions. Conversely, sex-dependent correction successfully normalized expression levels across batches for all selected genes, substantially reducing batch-induced variations. Gene expression counts of G078 ( Figure 1C ) show a notable discrepancy in female samples between batches A and B prior to correction, which is not seen in male samples. Correcting for a homogeneous batch effect skews the values for male samples. The sex-dependent correction method independently adjusts male and female expression levels, leading to a more precise alignment of the gene expression data between batches for each sex separately. This approach proved especially advantageous for genes whose expression levels were influenced by interaction between sex and environmental factors across batch. Benchmarking our method against established batch correction approaches shows comparable or superior performance in reducing experimental batch effects. PCA plots encompassing both time points (day 0 and day 1) showed that sex-dependent batch correction provided tighter clustering and clearer separation of biological groups ( Figures 1D ), closely aligning with results obtained from standard methods such as limma’s removeBatchEffects ( Figures 1E , Supplementary Figure 1 for heatmap) and ComBat-seq ( Figures 1F , Supplementary Figure 1 for heatmap). RNA-seq has become a fundamental technique in biological research across diverse species and experimental systems; nonetheless, analyses frequently encounter challenges due to batch effects, which obscure genuine biological signals. Although most literature on batch-effect correction algorithms primarily addresses technical batch effects originating from sample preparation, sequencing, or processing steps, complex and multifactorial studies require effective strategies to correct experimental batch effects that may involve interaction factors. Our proposed DESeq2-MultiBatch method effectively addresses this issue by explicitly modeling interaction effects within the DESeq2 analytical framework, significantly enhancing sample clustering and alignment while preserving genuine biological variability. Compared to alternative methods such as limma’s removeBatchEffect and ComBat-seq, DESeq2-MultiBatch provides a more intuitive workflow by directly modeling interaction effects without requiring complex relabeling of metadata. Additionally, unlike limma’s removeBatchEffect, which operates on variance-stabilized data, DESeq2-MultiBatch retains the ability to produce batch-corrected expression counts directly from raw data, enhancing interpretability and downstream utility. Despite its strengths, the efficacy of DESeq2-MultiBatch depends critically on accurate initial modeling of experimental conditions. Misspecification or inadequate representation of interaction factors may limit correction effectiveness and risk attenuating true biological variation. Looking forward, integrating DESeq2-MultiBatch into widely used RNA-seq analytical pipelines presents a promising avenue for enhancing the robustness and accuracy of multi-factorial RNA-seq experiments. Overall, DESeq2-MultiBatch represents a practical, accessible, and robust solution to the pervasive challenge of batch effect correction in RNA-seq analyses. Funding This work was supported by the Natural Sciences and Engineering Research Council (NSERC; RGPIN-2022-03396 to D.T.) of Canada. ASM has also been supported by a NSERC Canada Vanier Graduate Scholarship. Conflict of Interest none declared. Supporting Information Supplementary Tables Funding Natural Sciences and Engineering Research Council, https://ror.org/01h531d29 , RGPIN-2022-03396 Footnotes https://github.com/julienroyulaval/DESeq2-MultiBatch References [1]. ↵ Daniel Kliebenstein Chen , Chao , Grennan , Kay , Badner , Judith , Zhang , Dandan , Gershon , Elliot , Jin , Li , et al. , ‘ Removing Batch Effects in Analysis of Expression Microarray Data: An Evaluation of Six Batch Adjustment Methods’ , ed. by Daniel Kliebenstein , PLoS ONE , 6/ 2 ( 2011 ), e17238 OpenUrl CrossRef PubMed [2]. ↵ Costa-Silva , Juliana , Domingues Douglas S. , Menotti , David , Hungria , Mariangela , and Lopes Fabricio M , ‘Computational Methods for Differentially Expressed Gene Analysis from RNA-Seq: An Overview’ ( 2021 ) [accessed 17 February 2025 ] [3]. ↵ Dale , Renee , Oswald , Scott , Jalihal , Amogh , LaPorte , Mary-Francis , Fletcher Daniel M. , Hubbard , Allen , et al. , ‘ Overcoming the Challenges to Enhancing Experimental Plant Biology With Computational Modeling’ , Frontiers in Plant Science , 12 ( 2021 ), 687652 OpenUrl CrossRef PubMed [4]. ↵ Goh , Wilson Wen Bin , Wang , Wei , and Wong , Limsoon , ‘ Why Batch Effects Matter in Omics Data, and How to Avoid Them’ , Trends in Biotechnology , 35/ 6 ( 2017 ), 498 – 507 OpenUrl CrossRef PubMed [5]. ↵ Johnson , W. Evan , Li , Cheng , and Rabinovic , Ariel , ‘ Adjusting Batch Effects in Microarray Expression Data Using Empirical Bayes Methods’ , Biostatistics , 8/ 1 ( 2007 ), 118 – 27 OpenUrl CrossRef PubMed Web of Science [6]. ↵ Leek , Jeffrey T. , ‘ Svaseq: Removing Batch Effects and Other Unwanted Noise from Sequencing Data’ , Nucleic Acids Research , 42/ 21 ( 2014 ), e161 – e161 OpenUrl CrossRef PubMed [7]. ↵ Leek , Jeffrey T. , Scharpf Robert B. , Bravo Héctor Corrada , Simcha , David , Langmead , Benjamin , Johnson W. Evan , et al. , ‘ Tackling the Widespread and Critical Impact of Batch Effects in High-Throughput Data’ , Nature Reviews Genetics , 11/ 10 ( 2010 ), 733 – 39 OpenUrl CrossRef PubMed Web of Science [8]. ↵ Greg Gibson Leek , Jeffrey T , and Storey John D , ‘ Capturing Heterogeneity in Gene Expression Studies by Surrogate Variable Analysis’ , ed. by Greg Gibson , PLoS Genetics , 3/ 9 ( 2007 ), e161 OpenUrl CrossRef [9]. ↵ Liu , Qian , and Markatou , Marianthi , ‘ Evaluation of Methods in Removing Batch Effects on RNA-Seq Data’ , Infectious Diseases and Translational Medicine , 2016 [10]. ↵ Molania , Ramyar , Foroutan , Momeneh , Gagnon-Bartsch Johann A. , Gandolfo Luke C. , Jain , Aryan , Sinha , Abhishek , et al. , ‘ Removing Unwanted Variation from Large-Scale RNA Sequencing Data with PRPS’ , Nature Biotechnology , 41/ 1 ( 2023 ), 82 – 95 OpenUrl CrossRef PubMed [11]. ↵ Nygaard , Vegard , Rødland, Einar Andreas , and Hovig , Eivind , ‘ Methods That Remove Batch Effects While Retaining Group Differences May Lead to Exaggerated Confidence in Downstream Analyses’ , Biostatistics , 17/ 1 ( 2016 ), 29 – 39 OpenUrl CrossRef PubMed [12]. ↵ Raivo Kolde , ‘Pheatmap: Pretty Heatmaps’, 2010, 1.0.12 [accessed 7 April 2025 ] [13]. ↵ Ritchie , Matthew E. , Phipson , Belinda , Wu , Di , Hu , Yifang , Law Charity W. , Shi , Wei , et al. , ‘ Limma Powers Differential Expression Analyses for RNA-Sequencing and Microarray Studies’ , Nucleic Acids Research , 43/ 7 ( 2015 ), e47 – e47 OpenUrl CrossRef PubMed [14]. ↵ Sprang , Maximilian , Andrade-Navarro Miguel A. , and Fontaine , Jean-Fred , ‘ Batch Effect Detection and Correction in RNA-Seq Data Using Machine-Learning-Based Automated Assessment of Quality’ , BMC Bioinformatics , 23/ S6 ( 2022 ), 279 OpenUrl CrossRef PubMed [15]. ↵ Stark , Rory , Grzelak , Marta , and Hadfield , James , ‘ RNA Sequencing: The Teenage Years’ , Nature Reviews Genetics , 20/ 11 ( 2019 ), 631 – 56 OpenUrl CrossRef PubMed [16]. ↵ Upton , Racheal N. , Correr Fernando H. , Lile , Jared , Reynolds Gillian L. , Falaschi , Kira , Cook Jason P. , et al. , ‘ Design, Execution, and Interpretation of Plant RNA-Seq Analyses’ , Frontiers in Plant Science , 14 ( 2023 ), 1135455 OpenUrl CrossRef PubMed [17]. ↵ Van Den Berge , Koen , Hembach Katharina M. , Soneson , Charlotte , Tiberi , Simone , Clement , Lieven , Love Michael I. , et al. , ‘ RNA Sequencing Data: Hitchhiker’s Guide to Expression Analysis’ , Annual Review of Biomedical Data Science , 2/ 1 ( 2019 ), 139 – 73 OpenUrl CrossRef [18]. ↵ Wickham , Hadley , Ggplot2: Elegant Graphics for Data Analysis, Use R!, Second edition ( Cham , 2016 ) [19]. ↵ Zhang , Yuqing , Parmigiani , Giovanni , and Johnson , W Evan , ‘ ComBat-Seq: Batch Effect Adjustment for RNA-Seq Count Data’ , NAR Genomics and Bioinformatics , 2/ 3 ( 2020 ), qaa078 OpenUrl [20]. ↵ Zhou , Longjian , Chi-Hau Sue , Andrew, and Bin Goh , Wilson Wen , ‘ Examining the Practical Limits of Batch Effect-Correction Algorithms: When Should You Care about Batch Effects?’ , Journal of Genetics and Genomics , 46/ 9 ( 2019 ), 433 – 43 OpenUrl CrossRef View the discussion thread. Back to top Previous Next Posted April 22, 2025. Download PDF Supplementary Material Data/Code Email Thank you for your interest in spreading the word about bioRxiv. NOTE: Your email address is requested solely to identify you as the sender of this article. Your Email * Your Name * Send To * Enter multiple addresses on separate lines or separate them with commas. You are going to email the following DESeq2-MultiBatch: Batch Correction for Multi-Factorial RNA-seq Experiments Message Subject (Your Name) has forwarded a page to you from bioRxiv Message Body (Your Name) thought you would like to see this page from the bioRxiv website. Your Personal Message CAPTCHA This question is for testing whether or not you are a human visitor and to prevent automated spam submissions. Share DESeq2-MultiBatch: Batch Correction for Multi-Factorial RNA-seq Experiments Julien Roy , Adrian S. Monthony , Davoud Torkamaneh bioRxiv 2025.04.20.649392; doi: https://doi.org/10.1101/2025.04.20.649392 Share This Article: Copy Citation Tools DESeq2-MultiBatch: Batch Correction for Multi-Factorial RNA-seq Experiments Julien Roy , Adrian S. Monthony , Davoud Torkamaneh bioRxiv 2025.04.20.649392; doi: https://doi.org/10.1101/2025.04.20.649392 Citation Manager Formats BibTeX Bookends EasyBib EndNote (tagged) EndNote 8 (xml) Medlars Mendeley Papers RefWorks Tagged Ref Manager RIS Zotero Tweet Widget Facebook Like Google Plus One Subject Area Bioinformatics Subject Areas All Articles Animal Behavior and Cognition (7633) Biochemistry (17681) Bioengineering (13890) Bioinformatics (41929) Biophysics (21446) Cancer Biology (18586) Cell Biology (25492) Clinical Trials (138) Developmental Biology (13374) Ecology (19897) Epidemiology (2067) Evolutionary Biology (24308) Genetics (15606) Genomics (22497) Immunology (17736) Microbiology (40385) Molecular Biology (17175) Neuroscience (88584) Paleontology (666) Pathology (2831) Pharmacology and Toxicology (4822) Physiology (7641) Plant Biology (15149) Scientific Communication and Education (2045) Synthetic Biology (4293) Systems Biology (9822) Zoology (2271)

Text is read by the "Ask this paper" AI Q&A widget below. Extraction quality varies by source — PMC NXML preserves structure cleanly, OA-HTML may include some navigation residue, and OA-PDF can have broken hyphenation. The publisher copy (via DOI) is the canonical version.

My notes (saved in your browser only)

Ask this paper AI returns verbatim quotes from the full text · source: preprint-html

Answers must be backed by verbatim quotes from this paper's full text. Hallucinated quotes are dropped automatically; if no verbatim passage answers the question, we say so. How this works

Citation neighborhood (no data yet)

We don't have any in-corpus citations linked to this paper yet. This is a recent paper (2025) — citers typically take a year or two to land, and the OpenAlex reference graph may still be filling in.

Source provenance

europepmc
last seen: 2026-05-20T01:45:00.602351+00:00