Causes and consequences of experimental variation in Nicotiana benthamiana transient expression

preprint OA: closed
📄 Open PDF Full text JSON View at publisher
Full text 74,781 characters · extracted from preprint-html · click to expand
Causes and consequences of experimental variation in Nicotiana benthamiana transient expression | bioRxiv /* */ /* */ <!-- <!-- /*! * yepnope1.5.4 * (c) WTFPL, GPLv2 */ (function(a,b,c){function d(a){return"[object Function]"==o.call(a)}function e(a){return"string"==typeof a}function f(){}function g(a){return!a||"loaded"==a||"complete"==a||"uninitialized"==a}function h(){var a=p.shift();q=1,a?a.t?m(function(){("c"==a.t?B.injectCss:B.injectJs)(a.s,0,a.a,a.x,a.e,1)},0):(a(),h()):q=0}function i(a,c,d,e,f,i,j){function k(b){if(!o&&g(l.readyState)&&(u.r=o=1,!q&&h(),l.onload=l.onreadystatechange=null,b)){"img"!=a&&m(function(){t.removeChild(l)},50);for(var d in y[c])y[c].hasOwnProperty(d)&&y[c][d].onload()}}var j=j||B.errorTimeout,l=b.createElement(a),o=0,r=0,u={t:d,s:c,e:f,a:i,x:j};1===y[c]&&(r=1,y[c]=[]),"object"==a?l.data=c:(l.src=c,l.type=a),l.width=l.height="0",l.onerror=l.onload=l.onreadystatechange=function(){k.call(this,r)},p.splice(e,0,u),"img"!=a&&(r||2===y[c]?(t.insertBefore(l,s?null:n),m(k,j)):y[c].push(l))}function j(a,b,c,d,f){return q=0,b=b||"j",e(a)?i("c"==b?v:u,a,b,this.i++,c,d,f):(p.splice(this.i++,0,a),1==p.length&&h()),this}function k(){var a=B;return a.loader={load:j,i:0},a}var l=b.documentElement,m=a.setTimeout,n=b.getElementsByTagName("script")[0],o={}.toString,p=[],q=0,r="MozAppearance"in l.style,s=r&&!!b.createRange().compareNode,t=s?l:n.parentNode,l=a.opera&&"[object Opera]"==o.call(a.opera),l=!!b.attachEvent&&!l,u=r?"object":l?"script":"img",v=l?"script":u,w=Array.isArray||function(a){return"[object Array]"==o.call(a)},x=[],y={},z={timeout:function(a,b){return b.length&&(a.timeout=b[0]),a}},A,B;B=function(a){function b(a){var a=a.split("!"),b=x.length,c=a.pop(),d=a.length,c={url:c,origUrl:c,prefixes:a},e,f,g;for(f=0;f<d;f++)g=a[f].split("="),(e=z[g.shift()])&&(c=e(c,g));for(f=0;f<b;f++)c=x[f](c);return c}function g(a,e,f,g,h){var i=b(a),j=i.autoCallback;i.url.split(".").pop().split("?").shift(),i.bypass||(e&&(e=d(e)?e:e[a]||e[g]||e[a.split("/").pop().split("?")[0]]),i.instead?i.instead(a,e,f,g,h):(y[i.url]?i.noexec=!0:y[i.url]=1,f.load(i.url,i.forceCSS||!i.forceJS&&"css"==i.url.split(".").pop().split("?").shift()?"c":c,i.noexec,i.attrs,i.timeout),(d(e)||d(j))&&f.load(function(){k(),e&&e(i.origUrl,h,g),j&&j(i.origUrl,h,g),y[i.url]=2})))}function h(a,b){function c(a,c){if(a){if(e(a))c||(j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}),g(a,j,b,0,h);else if(Object(a)===a)for(n in m=function(){var b=0,c;for(c in a)a.hasOwnProperty(c)&&b++;return b}(),a)a.hasOwnProperty(n)&&(!c&&!--m&&(d(j)?j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}:j[n]=function(a){return function(){var b=[].slice.call(arguments);a&&a.apply(this,b),l()}}(k[n])),g(a[n],j,b,n,h))}else!c&&l()}var h=!!a.test,i=a.load||a.both,j=a.callback||f,k=j,l=a.complete||f,m,n;c(h?a.yep:a.nope,!!i),i&&c(i)}var i,j,l=this.yepnope.loader;if(e(a))g(a,0,l,0);else if(w(a))for(i=0;i (function(w,d,s,l,i){w[l]=w[l]||[];w[l].push({'gtm.start':new Date().getTime(),event:'gtm.js'});var f=d.getElementsByTagName(s)[0];var j=d.createElement(s);var dl=l!='dataLayer'?'&l='+l:'';j.src='//www.googletagmanager.com/gtm.js?id='+i+dl;j.type='text/javascript';j.async=true;f.parentNode.insertBefore(j,f);})(window,document,'script','dataLayer','GTM-M677548'); Skip to main content Home About Submit ALERTS / RSS Search for this keyword Advanced Search New Results Causes and consequences of experimental variation in Nicotiana benthamiana transient expression Sophia N. Tang , Matthew J. Szarzanowicz , Amy Lanctot , Sasilada Sirirungruang , Liam D. Kirkpatrick , Krista Drako , Simón Álamos , Lyurui Cheng , Lucas M. Waldburger , Shuying Liu , Lena Huang , Sami Kazaz , Emine Akyuz Turumtay , Edward Baidoo , Aymerick Eudes , Mitchell G. Thompson , Patrick M. Shih doi: https://doi.org/10.1101/2025.06.12.659391 Sophia N. Tang 1 Joint BioEnergy Institute , 5885 Hollis Street, Emeryville, CA 94608, USA 2 Environmental Genomics and Systems Biology Division, Lawrence Berkeley National Laboratory , Berkeley, California, USA 3 Department of Molecular and Cell Biology, University of California , Berkeley, CA 94720, USA Find this author on Google Scholar Find this author on PubMed Search for this author on this site Matthew J. Szarzanowicz 1 Joint BioEnergy Institute , 5885 Hollis Street, Emeryville, CA 94608, USA 2 Environmental Genomics and Systems Biology Division, Lawrence Berkeley National Laboratory , Berkeley, California, USA 4 Department of Plant and Microbial Biology, University of California , Berkeley, CA 94720, USA Find this author on Google Scholar Find this author on PubMed Search for this author on this site Amy Lanctot 1 Joint BioEnergy Institute , 5885 Hollis Street, Emeryville, CA 94608, USA 2 Environmental Genomics and Systems Biology Division, Lawrence Berkeley National Laboratory , Berkeley, California, USA 4 Department of Plant and Microbial Biology, University of California , Berkeley, CA 94720, USA Find this author on Google Scholar Find this author on PubMed Search for this author on this site Sasilada Sirirungruang 1 Joint BioEnergy Institute , 5885 Hollis Street, Emeryville, CA 94608, USA 2 Environmental Genomics and Systems Biology Division, Lawrence Berkeley National Laboratory , Berkeley, California, USA 4 Department of Plant and Microbial Biology, University of California , Berkeley, CA 94720, USA Find this author on Google Scholar Find this author on PubMed Search for this author on this site Liam D. Kirkpatrick 1 Joint BioEnergy Institute , 5885 Hollis Street, Emeryville, CA 94608, USA 2 Environmental Genomics and Systems Biology Division, Lawrence Berkeley National Laboratory , Berkeley, California, USA 4 Department of Plant and Microbial Biology, University of California , Berkeley, CA 94720, USA Find this author on Google Scholar Find this author on PubMed Search for this author on this site Krista Drako 1 Joint BioEnergy Institute , 5885 Hollis Street, Emeryville, CA 94608, USA 2 Environmental Genomics and Systems Biology Division, Lawrence Berkeley National Laboratory , Berkeley, California, USA 3 Department of Molecular and Cell Biology, University of California , Berkeley, CA 94720, USA Find this author on Google Scholar Find this author on PubMed Search for this author on this site Simón Álamos 1 Joint BioEnergy Institute , 5885 Hollis Street, Emeryville, CA 94608, USA 2 Environmental Genomics and Systems Biology Division, Lawrence Berkeley National Laboratory , Berkeley, California, USA 4 Department of Plant and Microbial Biology, University of California , Berkeley, CA 94720, USA Find this author on Google Scholar Find this author on PubMed Search for this author on this site Lyurui Cheng 1 Joint BioEnergy Institute , 5885 Hollis Street, Emeryville, CA 94608, USA 2 Environmental Genomics and Systems Biology Division, Lawrence Berkeley National Laboratory , Berkeley, California, USA 7 Department of Nutritional Sciences and Toxicology, University of California , Berkeley, CA 94720, USA Find this author on Google Scholar Find this author on PubMed Search for this author on this site Lucas M. Waldburger 1 Joint BioEnergy Institute , 5885 Hollis Street, Emeryville, CA 94608, USA 2 Environmental Genomics and Systems Biology Division, Lawrence Berkeley National Laboratory , Berkeley, California, USA 5 Department of Bioengineering, University of California , Berkeley, California, USA 6 Biological Systems & Engineering Division, Lawrence Berkeley National Laboratory , Berkeley, CA 94720, USA Find this author on Google Scholar Find this author on PubMed Search for this author on this site Shuying Liu 1 Joint BioEnergy Institute , 5885 Hollis Street, Emeryville, CA 94608, USA 2 Environmental Genomics and Systems Biology Division, Lawrence Berkeley National Laboratory , Berkeley, California, USA Find this author on Google Scholar Find this author on PubMed Search for this author on this site Lena Huang 1 Joint BioEnergy Institute , 5885 Hollis Street, Emeryville, CA 94608, USA 2 Environmental Genomics and Systems Biology Division, Lawrence Berkeley National Laboratory , Berkeley, California, USA Find this author on Google Scholar Find this author on PubMed Search for this author on this site Sami Kazaz 1 Joint BioEnergy Institute , 5885 Hollis Street, Emeryville, CA 94608, USA 2 Environmental Genomics and Systems Biology Division, Lawrence Berkeley National Laboratory , Berkeley, California, USA Find this author on Google Scholar Find this author on PubMed Search for this author on this site Emine Akyuz Turumtay 1 Joint BioEnergy Institute , 5885 Hollis Street, Emeryville, CA 94608, USA Find this author on Google Scholar Find this author on PubMed Search for this author on this site Edward Baidoo 1 Joint BioEnergy Institute , 5885 Hollis Street, Emeryville, CA 94608, USA Find this author on Google Scholar Find this author on PubMed Search for this author on this site Aymerick Eudes 1 Joint BioEnergy Institute , 5885 Hollis Street, Emeryville, CA 94608, USA 2 Environmental Genomics and Systems Biology Division, Lawrence Berkeley National Laboratory , Berkeley, California, USA Find this author on Google Scholar Find this author on PubMed Search for this author on this site Mitchell G. Thompson 1 Joint BioEnergy Institute , 5885 Hollis Street, Emeryville, CA 94608, USA 2 Environmental Genomics and Systems Biology Division, Lawrence Berkeley National Laboratory , Berkeley, California, USA Find this author on Google Scholar Find this author on PubMed Search for this author on this site For correspondence: pmshih{at}berkeley.edu mthompson{at}lbl.gov Patrick M. Shih 1 Joint BioEnergy Institute , 5885 Hollis Street, Emeryville, CA 94608, USA 2 Environmental Genomics and Systems Biology Division, Lawrence Berkeley National Laboratory , Berkeley, California, USA 4 Department of Plant and Microbial Biology, University of California , Berkeley, CA 94720, USA 8 Innovative Genomics Institute , Berkeley, California, USA Find this author on Google Scholar Find this author on PubMed Search for this author on this site For correspondence: pmshih{at}berkeley.edu mthompson{at}lbl.gov Abstract Full Text Info/History Metrics Supplementary material Preview PDF Abstract Infiltration of Agrobacterium tumefaciens into Nicotiana benthamiana has become a foundational technique in plant biology, enabling efficient delivery of transgenes in planta with technical ease, robust signal, and relatively high throughput. Despite transient expression’s prevalence in disciplines such as synthetic biology, little work has been done to describe and address the variability inherent in this system, a concern for experiments that rely on highly quantitative readouts. In a comprehensive analysis of N. benthamiana agroinfiltration experiments, we model sources of variability that affect transient expression. Our findings emphasize the need to validate normalization methods under the specific conditions of each study, as distinct normalization schemes do not always reduce variation either within or between experiments. Using a dataset of 1,915 plants collected over three years, we develop a model of variation in N. benthamiana transient expression, using power analysis to determine the number of individual plants required for a given effect size. Drawing on our longitudinal data, these findings inform practical guidelines for minimizing variability through strategic experimental design and power analysis, providing a foundation for more robust and reproducible use of N. benthamiana in quantitative plant biology and synthetic biology applications. Introduction Nicotiana benthamiana is a workhorse of plant molecular biology due to the high efficiency of transient Agrobacterium -mediated transformation, enabling researchers to assess gene function and observe phenotypes within days, as opposed to the months it typically takes for stable transformations 1 – 3 . N. benthamiana’ s capacity for transient expression precipitated its use to study diverse aspects of cell and molecular biology 4 , including virus-induced gene silencing 5 , subcellular protein localization 6 , biosynthetic pathway discovery and engineering 7 – 11 , and gene regulation 12 – 16 . Given the lengthy time required to generate stable transformants and the technical challenges inherent in protoplast transformation 17 , 18 , there are few viable in planta alternatives to N. benthamiana transient expression, leading to its primacy as the model of plant synthetic biology 19 , 20 . Despite its widespread use, N. benthamiana lacks substantial efforts to assess error and reproducibility, like many other systems routinely leverage in synthetic biology 21 . Nor is there a standardized way to design transient assays, and as a result, experimental design varies from publication to publication 13 , 22 – 26 . These factors obstruct our ability to model and predict variation in this model system, which is crucial for effective experimental design as has been demonstrated in the closely related Nicotiana tabacum 27 . Limited quantitative understanding of biology has routinely impeded genetic engineers in developing predictable and reliable bioproducts 28 , in comparison to the precision associated with traditional engineering disciplines 29 . For plant synthetic biology to truly be an engineering discipline, we require robust evaluation of variability and its effects on our design goals. The variability of transient expression in N. benthamiana in highly powered and longitudinal experiments has never been rigorously evaluated. Without robust statistics, researchers risk designing underpowered experiments and overlooking subtle effects. While there have been attempts to determine transgene expression variability in stable plant lines 30 , 31 , it is unclear whether these findings translate to transient expression. Transient expression variability in N. benthamiana has been primarily studied using luciferase reporters, but these studies are plagued by small sample size, lack of biological replicates, and the high noise inherent to the luciferase assay 32 – 34 . Most methods used to reduce variability in transient expression experiments have relied on using a second reporter (hereafter referred to as a normalizer) for ratiometric normalization 13 , 22 – 24 , 35 , 36 . In this approach, every tested experimental construct is co-delivered with the same constitutively expressed normalizer, under the assumption that any variation in the experimental construct’s expression that tracks with variation in the normalizer’s expression must not be due to the sequence of the reporters but rather other variables. Although this approach is widely used, whether normalizing transgene expression actually reduces and controls for variation has not been systematically examined. Here, we use fluorescence reporter assays to systematically determine the sources of variation of transient expression in N. benthamiana leaves. Using a large sample size (>1900 plants) across multiple years of independent experiments, we comprehensively capture transgene expression variation observed between plants and between independent experiments in order to model sources of error. We also complete the first systematic comparison of methods to normalize transgene expression and demonstrate whether and to what extent these methods reduce variability. Finally, we suggest best practices to mitigate variation through purposeful experimental design and statistical power analysis. Results Categorizing the sources of transient expression variation To determine sources of variability in N. benthamiana transient expression, we analyzed previously published data wherein the same GFP reporter (vector 1 of Supplementary Table 1) was agroinfiltrated in 15 independent experimental replicates using A. tumefaciens GV3101::pMP90 (hereafter GV3101) ( Fig 1A , Fig. S1) 37 . The reporter strain was infiltrated distal to the petiole of the fourth and fifth leaf from the top (leaves T4 and T5) of N. benthamiana , and three days post-infiltration, four discs were collected from each infiltrated leaf. All plants germinated at the same time and which experienced identical growing conditions and care are referred to as belonging to the same batch. In this dataset, we observed as much as a fourfold difference between experimental replicates with the lowest (teal, 2022.07.25) and highest (orange, 2023.05.30) mean fluorescence ( Fig. 1B , 1C ). Using a mixed-effects model, we attributed nearly all of the variation to fluctuations in batch-level mean GFP (23.8%) and GFP standard deviation (15.6%); plant-level mean GFP (9.9%) and GFP standard deviation (28.2%) within a given batch; and disc-level GFP standard deviation (22.3%) within a given plant ( Fig. 1D ). Though the precise percent contributions of these components varies between experimental replicates (Fig. S2), they are nonetheless all major sources of variation that should be accounted for in experimental design. The underlying factors of these sources of variation may be batch effects across the fifteen experimental replicates’ plants, non-homogenous growing conditions, and varying leaf cellular ages ( Fig. 1E ) 38 , 39 . Download figure Open in new tab Figure 1. Longitudinal assessment of transient expression identifies sources of variability in N. benthamiana fluorescence assays. A) Schematic of the transient fluorescence assay. N. benthamiana is agroinfiltrated with an A. tumefaciens strain at an OD of 0.5. The binary vector contains, from left to right border, CaMV35S2:nptII and PCM2:eGFP:At_Ubq3 oriented divergently in the T-DNA. Discs are collected from leaves 3 days post-infiltration and measured in a plate reader. B) Distributions of GFP fluorescence for 15 experimental replicates, n=64 discs from 8 separate plants, except for 2022.06.06 and 2022.06.13 which are n=40. Dates of sample collection and measurement are written YYYY.MM.DD. C) Boxplots for each plant in experimental replicates with the lowest (2022.07.25) and highest (2023.05.30) mean raw fluorescence show the median and interquartile range (IQR), and whiskers show the range of data within 1.5 IQR. Scatterplots show T4 discs in white and T5 discs in black. D) Percent contributions to observed variability as calculated from a mixed-effects model and illustrations of sources of variability. Since the experimental conditions across these 15 replicates were identical, we separately investigated other potential contributors to variation that were controlled for in that experiment. In other independent experiments, we assessed the effects of 96-well water volume, plant age, leaf infiltration site, and collection time (both time of day and time elapsed between collection and measurement). We found that water volume and plant age are negatively correlated with fluorescence (Fig. S3, S4), infiltration site significantly affects transgene expression in a leaf-and strain-dependent manner (Fig. S5), and collection time has no effect (Fig. S6, S7). Minor changes to water volume ( e.g. , evaporation, pipetting error) may have contributed to residual error in the data from Fig. 1B . However, all plants in this study were 4 weeks old at the time of infiltration and infiltrated distal to the petiole, so no variation can be attributed to differences in age or infiltration site. With these additional experiments, we have both accounted for the majority of variation in our model and now ruled out other potential sources. To demonstrate that these findings are generalizable beyond fluorescent proteins, we also quantified variation for two different metabolic pathways to produce betalain (3 experimental replicates) and 2-pyrone-4,6-dicarboxylic acid (PDC) (4 experimental replicates) 40 , 41 . The three enzymes of the betalain pathway were co-infiltrated on three separate T-DNAs or infiltrated as one T-DNA separated by self-cleaving T2A peptides (RUBY reporter) 42 . The absorbance of one of the three betalain experimental replicates was significantly different from the other two for both methods of delivery, and the greatest fold change between two replicates was about twofold for co-infiltration and about fourfold for T2A, on par with the maximal difference observed for the GFP reporter (Fig. S8, Fig. 1B-D ). For the PDC experimental replicates, yields were not significantly different after Bonferroni correction, but there was a ∼20% difference between the highest and lowest yields (Fig. S8). Multi-step metabolic pathway yields are subject to enzyme subcellular localization, substrate diffusion, and the pathway’s underlying dynamics, which may mask or exacerbate the effects of variable transgene expression. There are considerable variations in yields, specific to each pathway, and the trends observed in FP fluorescence likely translate to the variability of each component transgene in a metabolic pathway. Multiple methods of co-delivering a normalizing transgene can decrease expression variability Normalizing the expression level of a transgene of interest to that of another independent transgene is thought to control for any sources of variability independent of the tested sequences, since they should impact expression of the two transgenes equally. This practice should theoretically reduce variation both within and between experiments. However, there are many different conceivable ways the two transgenes could be delivered in N. benthamiana , and indeed normalization schemes differ between publications 13 , 22 – 26 . We systematically compared normalization schemes for transient expression using fluorescent protein (FP) reporters, whose gene expression is correlated to an easily measured phenotype, fluorescence. The normalized readout of the assay is the ratio of eGFP and mCherry fluorescence measured in a leaf disc. Designating FPs as the reporter or normalizer is arbitrary. The two expression cassettes were co-delivered in three different ways. First, we co-infiltrated a mix of two different strains of A. tumefaciens , each with a binary vector containing one FP (schemes 3-7). Second, we infiltrated single A. tumefaciens strains carrying binary vectors with a T-DNA containing both cassettes in every possible orientation, both relative to one another and to the left and right borders (schemes 8-15). Third, we infiltrated a “BiBi” strain 43 , wherein a single strain of A. tumefaciens carries two binary vectors, each with a unique FP gene and ori (schemes 16-19). All FP genes are driven by the medium strength PCM2 constitutive promoter derived from the A. thaliana HTR5 histone gene (AT4G40040) and are terminated by the A. thaliana Ubq3 terminator (Supplementary Table 1, Fig. S1) 14 . These 17 methods of co-delivery were compared to delivering eGFP (scheme 1) or mCherry (scheme 2) alone in two independent experimental replicates. Co-delivery methods have obvious ramifications for basal transgene expression levels that are consistent between both experimental replicates (Fig. S9). For both co-infiltrations and BiBis, the low copy number origin, pSa, consistently produced much lower fluorescence compared to the higher copy number origins, pVS1 or BBR1 ( Fig. 2A ) 44 . For the stacked, two-cassette T-DNAs, despite sharing the same pVS1 origin and backbone, these schemes yielded up to eight-fold difference in fluorescence depending on the cassettes’ relative orientations ( Fig. 2A , S10). Download figure Open in new tab Figure 2. Comparison of three discrete methods to deliver normalizing reporters. A) Left, categories of delivery methods: unnormalized (green or magenta), co-infiltration (yellow), same T-DNA (pink), and BiBi (blue). Center, distributions of eGFP and mCherry fluorescence, n=96 leaf discs per row. Right, cartoons showing the binary vector origin of replication, resistance marker, and orientations of FP expression cassettes in the T-DNA. All binary vector cartoons are read from left to right: ori, left border, T-DNA, right border. Origins of replication are pVS1 (diamond, black), BBR1 (circle, teal), and pSa (square, gray). Circles enclosing an X represent tOcs, a 722bp spacer in between the two expression cassettes. B) Plant coefficients of variation (CV), as calculated from the 8 discs per plant, when eGFP is treated as the reporter. All values are eGFP/mCherry CV except for scheme 1, which is GFP CV. C) Plant CVs when mCherry is treated as the reporter. All values are mCherry/eGFP CV except for scheme 2, which is mCherry CV. Normalization scheme IDs match across all subpanels. For B) and C) , an independent, one-tailed Welch’s t-test and a Bonferroni correction were conducted to determine whether the reporter/normalizer CV of a scheme is significantly less than the reporter CV for the corresponding unnormalized scheme. Asterisks indicate p-values: * < 0.05, ** < 0.01. Total OD infiltrated in all schemes is 0.5. ODs of co-infiltrated strains are 0.25 each. In the legend, “&” indicates co-infiltration, arrows indicate the direction of an expression cassette, “+” indicates BiBi, and GFP is abbreviated to “G” and mCherry to “R”. Leaves T4 and T5 of six four-week-old N. benthamiana plants were infiltrated in each experimental replicate, and four discs were collected from each infiltrated leaf. Convergent, tandem, and divergent cassettes produced the strongest, intermediate, and weakest expression, respectively (Fig. S10). The expression of one gene is affected by the orientation of the other gene, even when its own position and orientation is maintained, as with schemes 8 and 10 for eGFP or schemes 9 and 11 for mCherry (Fig. S10). The formation of a double terminator with the tOcs spacer in some cassettes may be partly responsible for increased expression, as has been shown with other binary vectors 45 , but reversing tOcs does not consistently increase fluorescence from a doubly terminated cassette over the corresponding singly terminated cassette (Fig. S10). These results suggest that gene position relative to the left and right borders and, most importantly, relative orientation strongly affect expression in multi-gene T-DNAs. Variability, as measured by coefficient of variation (CV) from all leaf discs, decreases for all normalization schemes (Fig. S11). Furthermore, all schemes have a lower CV for reporter/normalizer than for reporter (Fig. S12). The more appropriate comparison, however, is whether a scheme’s reporter/normalizer CV is lower than the corresponding unnormalized control’s reporter CV. Most schemes produce an eGFP/mCherry CV that is significantly less than scheme 1’s eGFP CV following a Bonferroni correction ( Fig. 2B ), but only scheme 3 (co-infiltration of two pVS1 binary vectors) meets this condition when mCherry is treated as the reporter ( Fig. 2C ). Such a test is conservative, and it should be noted that there is at least one scheme per co-delivery method that reduces CV by >50% compared to the unnormalized control, whether CV is calculated per plant or pooling all discs together ( Fig. 2B , 2C , S11). All co-delivery methods can offer reductions in variability, thereby increasing the statistical power of transient expression-based experiments. Inoculum densities of co-infiltrated strains affect signal strength but not variability Because the decrease in CV was the greatest and most statistically significant for co-infiltration of two pVS1 binary vectors (scheme 3), we used this scheme to explore other possible experimental variables for further reductions in variability. Additionally, co-infiltration is highly modular, and multiple T-DNAs can efficiently be delivered to each plant cell 43 , 46 . Since A. tumefaciens strains in N. benthamiana leaves can antagonize or synergize with one another depending on their densities 43 , we next determined whether the OD 600 of each strain in the co-infiltration affects the resulting CV. Each strain was added to the infiltration mix at an OD 600 of 0, 0.01, 0.1, 0.5, or 1 and combined with the other strain, also added at the same densities for a total of 24 possible combinations. Total OD 600 of the co-infiltrated mix and the OD 600 of the individual strains do not greatly nor predictably affect variability, but inoculum density of a strain dictates its total transgene expression levels. There is no discernible pattern in eGFP CV with respect to the OD 600 of the co-infiltrated strains ( Fig. 3A ), and while all CVs for the ratio of eGFP/mCherry are comparatively much lower ( Fig. 3B ), there is no one combination of ODs that is significantly superior to all others. The same trends are apparent when mCherry is treated as the reporter and eGFP as the normalizer (Fig. S13). For raw fluorescence, signal begins to saturate beyond an OD 600 of 0.5, and when one strain is held at a given OD 600 while the OD 600 of another competing strain increases, fluorescence from the fixed strain decreases ( Fig. 3C , 3D ). The primary concern when selecting OD 600 , then, should be the desired signal strength. Of the densities tested, 0.1 results in strong, measurable signal and, in agreement with previous findings, does not saturate the transgene expression capacity of the plant cell 43 , 46 . Download figure Open in new tab Figure 3. OD 600 of two co-infiltrated strains affect transgene expression strength but not variability. Raw fluorescence signal from A) eGFP and B) mCherry for all OD 600 combinations. Darker hues indicate increasing OD 600 of the competing strain, which carries the other FP. Error bars show the standard error. Matrix of all OD 600 combinations’ CV of C) eGFP fluorescence and D) ratio of eGFP/mCherry. Each condition was infiltrated into leaves T4 and T5 of six plants. Four discs were collected from each leaf for a total of n=48 leaf discs. Promoter choice determines the utility of normalization Given that the choice of promoter(s) in transient transformations affects not only signal strength but also normalization outcomes 14 , we more thoroughly explored additional promoter combinations. All transgenes in this study have hitherto been driven by a medium-strength promoter, PCM2. From a library of low, medium, and high strength constitutive promoters characterized by Zhou et al. (annotated as “PCL”, “PCM”, and “PCH,” respectively), we selected low- and high-strength promoters, PCL2 and PCH5, to test alongside PCM2. eGFP and mCherry were driven by this same set of three promoters (“same promoter set”). The eGFP binary vectors were co-infiltrated with the mCherry binary vectors in every possible combination, and all binary vectors were also infiltrated alone for a total of 15 unique infiltrations. There is no discernible pattern in eGFP CV for any of the infiltrations ( Fig. 4A ), but for eGFP/mCherry, identical promoters driving the two FP genes yield the lowest CVs ( Fig. 4B ). Outside of these pairs, normalization does not provide as large reductions in variations, if at all. In fact, for three nonidentical promoter pairs, their eGFP/mCherry CV is greater than their own eGFP CV and, for one pair, also greater than the eGFP CV of its corresponding unnormalized control ( Fig. 4A , 4B ). Similar observations are true when treating mCherry as the reporter and eGFP as the normalizer (Fig. S14). Additionally, fluorescence from a given strain diminishes the stronger a competing strain’s FP promoter is, though this trend is weaker for mCherry than it is for GFP ( Fig. 4C , 4D ). Download figure Open in new tab Figure 4. Promoters of co-infiltrated transgenes determine the efficacy of normalization. eGFP and mCherry were driven by PCL2, PCM2, or PCH5 for a total of six unique binary vectors. Log 2 raw fluorescence from A) eGFP and B) mCherry for all promoter combinations. Darker hues indicate stronger promoter of the competing strain. Error bars show the standard error. Matrix of all promoter combinations’ CV of C) eGFP fluorescence and D) ratio of eGFP/mCherry. Log 2 raw fluorescence signal from E) eGFP and F) mCherry for all promoter combinations when instead the mCherry binary vectors are driven by PCL1, PCM1, or PCH4. Darker hues indicate stronger promoter of the competing strain. Error bars show the standard error. Matrix of all promoter combinations’ CV of G) eGFP fluorescence and H) ratio of eGFP/mCherry. Conditions from the “Same Promoter Set” and “Different Promoter Set” experiments were infiltrated into leaves T4 and T5 of six plants, and four discs were collected from each leaf for a total of n=48 leaf discs. The experiments were performed independently on separate days. We then sought to clarify whether the large decrease in CV when using identical promoters is due to the similar promoter strengths or to other variables, such as shared trans factors affecting mRNA abundance. To do so, we generated another set of three binary vectors with mCherry driven by PCL1, PCM1, and PCH4 (“different promoter set”), which are the promoters in the library closest in expression to the three already tested. As with the first promoter combination experiment, the existing eGFP binary vectors were co-infiltrated with the new mCherry binary vectors in every possible combination, and all six binary vectors were also infiltrated alone. With these promoters, both the CVs of eGFP and of eGFP/mCherry follow no apparent pattern ( Fig. 4E , 4F ), but the negative trend between fluorescence signals of the two competing strains holds true, although PCH4 fits poorly in the trend ( Fig. 4G , 4H ). Several promoter pairs have higher eGFP/mCherry CVs than their own eGFP CVs and/or the eGFP CV of the unnormalized control ( Fig. 4E , 4F ), and vice versa when treating mCherry as the reporter (Fig. S14). Similarity in promoter strength, then, does not guarantee lower CVs upon normalization. Depending on the promoters used to normalize, normalization may even worsen the assay’s statistical power. Since the co-delivery comparison and the OD optimization experiments were conducted using PCM2 for every expression cassette, we had fortuitously picked the best case scenario, identical promoters. Had we chosen nonidentical promoters, all methods of co-delivery might not have decreased CV compared to the unnormalized controls. When possible, identical promoters should be used. Normalization does not yield reproducibility of absolute quantification Normalization can serve two distinct purposes: (1) decreasing within-experiment variation to improve detection of small effect sizes, or (2) decreasing between-experiment variation to allow for comparison across independent experiments. Mitigating within-experiment variation does not necessarily have an effect on between-experiment variation. To explore whether normalization makes comparisons between experimental replicates or to historical data more valid, we co-infiltrated GFP driven by PCL2 (which yielded the lowest average normalized CVs when driving both FPs ( Fig. 4 , S11)) alone and with all six mCherry binary vectors thus far generated in six independent experimental replicates. Normalization makes experimental replicates more similar to one another for most, but not all, promoter pairs ( Fig. 5A , 5B , S15). We performed one-sample Kolmogorov-Smirnov tests for every condition to determine the likelihood that a sample distribution (an individual experimental replicate) is drawn from a reference distribution (all experimental replicates, pooled). The cumulative density functions (CDFs) show that sample distributions nearly all become more comparable to the reference distribution with normalization, i.e. , the maximum vertical distance between the distributions decreases ( Fig. 5A , 5B , S15). Replicate-to-replicate, the PCL2/PCM2 promoter pair produces the most consistent distribution of GFP/mCherry values, far more reproducible than its raw eGFP fluorescences ( Fig. 5A , 5B ). The sole exception is the PCL2/PCM1 promoter pair, whose GFP/mCherry CDFs are actually less comparable to the reference distribution than its GFP CDFs are ( Fig. 5A , 5B ); there is no singular GFP/mCherry value that normalization with this promoter pair causes the data to reliably converge upon. However, this pair and PCL2/PCL2 were the only promoter pairs for which experimental replicate CVs, representing within-experiment variation, were regularly lower than the unnormalized control’s ( Fig. 5C ). Additionally, PCL2/PCL2 produces the most consistent experimental replicate CVs–it alone has an interquartile range of experimental replicate CVs narrower than the unnormalized control’s ( Fig. 5C ). Decreasing within-experiment variation, then, is not equivalent to decreasing between-experiment variation. Normalization schemes must be designed with the desired outcome in mind (minimizing within- and/or between-experiment variation) and then validated. Download figure Open in new tab Figure 5. Promoter choice affects variation between experimental replicates. A) Cumulative density functions of PCL2:eGFP alone or normalized by mCherry driven by PCL2, PCM1, or PCM2. Left: eGFP, right: eGFP/mCherry. Each experimental replicate is a unique color. The black line is the CDF for the pooled data of all six experimental replicates. The p-values of one-sample Kolmogorov-Smirnov tests appear to the right of each CDF, colored by experimental replicate. Asterisks indicate p-values: * < 0.05, ** < 0.01, *** < 0.001, and ns = not significant. B) Absolute value of every experimental replicate’s D, the greatest vertical distance between the CDF a given experimental replicate (color) and the pooled CDF (black) from A) . White boxplots indicate D values for eGFP CDFs and gray boxplots for eGFP/mCherry CDFs. C) CVs of the six experimental replicates for each condition. As in B) , white boxplots indicate eGFP and gray eGFP/mCherry. Every condition was infiltrated into leaves T4 and T5 of four plants, and four discs were collected from each leaf in all six experimental replicates for a total of n=192 leaf discs. Developing a generalizable power analysis framework of N. benthamiana transient expression To evaluate whether normalization meaningfully reduces the number of plants required to detect a given effect size, we developed a model informed by a large dataset of N. benthamiana transient expression experiments. This dataset comprises 1,813 plants infiltrated with a GFP reporter over nearly three years, spanning experiments conducted by multiple researchers and diverse conditions, including different inoculum densities and Agrobacterium strains (see Supplementary Methods 2 for details). Because this dataset accounts for historical variation across diverse experiments, the simulations trained with it will give conservative estimates of variance. Individual, well-controlled experiments may yield lower variations, but since the precise variabilitycannot be known beforehand, erring on the side of excessive rather than insufficient statistical power is preferable. We calculated the CV for each plant infiltrated with one of two Agrobacterium strains: GV3101 and the hypervirulent EHA105, which displays both elevated transgene expression and variance compared to GV3101 ( Fig. 6A ). For batches of plants for which at least 30 plants were used, we visualized the plant CVs in a CDF ( Fig. 6B solid gray line). With these per-plant and per-experiment CVs, we developed a Monte Carlo simulation of assay variability, which closely recapitulates the observed distribution of real plant CVs across the training dataset ( Fig. 6B dotted black line; Wasserstein distance = 0.023, mean ECDF difference = 0.05). Download figure Open in new tab Figure 6. Modeling variation of transgene expression in 4-week-old N. benthamiana plants. A) Per-plant CV of unnormalized GFP calculated from data compiled across many years and independent experiments. CV for a plant is calculated using all discs derived from that plant, regardless of leaf. The number of plants included appears above the violin plots. B) Cumulative density function of per-plant, unnormalized eGFP CVs. Solid gray, empirical data from 32 batches of at least 30 plants. Dotted black, Monte Carlo simulated data. C) Minimum number of simulated plants needed to detect a given effect size with the CV of unnormalized EHA105, unnormalized GV3101, or optimally normalized GV3101 assuming 95% accuracy and statistical significance (p<0.05). D) Exponential regression fit to the simulated data in C) . Dashed horizontal line indicates the arbitrary 50 plant cap, and dotted vertical lines indicate the smallest detectable effect size with 50 plants. Points represent predictions from the Monte Carlo simulations in C . Orange, EHA105. Gray, unnormalized GV3101. Teal, optimally normalized GV3101. We then simulated how variability propagates through an experiment on the per-plant and per-experiment levels. First, a batch CV is drawn from the empirical distribution shown in Fig. 6A by randomly generating a percentile and selecting the corresponding CV, which represents the average CV of plants from a hypothetical experimental replicate. Around this batch-level value, we simulate CVs of individual plants by incorporating additional noise that approximates within-experiment heterogeneity between plants. For each simulated plant, eGFP fluorescence data for eight leaf discs is generated based on the plant CV and a fixed, construct-specific mean expression. Two conditions are compared with an independent, two-tailed Student’s t -test at varying effect size differences and sample sizes ( Fig. 6C ). For each comparison, 1000 independent experimental replicates are simulated and used to calculate the probability of a successful comparison. This approach enables us to estimate the minimum number of plants needed to reliably (>95% of simulations) and significantly ( p < 0.05) distinguish between two constructs. From these calculations of plants needed for given effect sizes, we fit an exponential decay curve assuming fixed CV for three situations: unnormalized EHA105, unnormalized GV3101, and optimally normalized GV3101 (lowest CV achieved in this publication) ( Fig. 6D ). The smallest detectable effect size using 50 plants for unnormalized EHA105 was 13.7%, compared to 10.7% for unnormalized GV3101 and 10.1% for GV3101 under optimal normalization ( Fig. 6D ). While larger sample sizes can resolve even smaller differences, practical constraints limit the number of plants that can be included in an experiment, but relatively small effect sizes can be accurately distinguished with a small number of plants. Based on the Monte Carlo simulations, with n = 3, the minimum reliably detectable effect size for unnormalized GV3101 is ∼40%. Normalization is most beneficial in experiments where small effect sizes must be resolved using limited sample sizes. However, since normalization may also reduce statistical power in some cases (Fig. S16), any normalization strategy should be validated empirically prior to implementation. Discussion Here, we systematically measure expression variability in N. benthamiana agroinfiltration. The inherent noise in the transient expression of FPs is considerable (as much as fourfold difference in mean expression across experimental replicates) but mitigable through proper experimental design ( Fig. 1B ). Using a mixed-effects model, we categorize nearly all observed variation in our dataset ( Fig. 1D ). We find that multiple co-delivery methods for dual reporters can decrease variation via ratiometric normalization, and of the examined methods, co-infiltration best reduces variation, approximately halving the CV compared to no normalization ( Fig. 2 ). Neither inoculum density nor promoter strength in co-infiltrations predictably affect expression variation, but normalization efficacy is highly sensitive to promoter choice ( Fig. 3 , Fig. 4 ). Some promoter pairs may in fact increase variation or make experimental replicates less comparable, and using identical promoters is the surest and most effective way to reduce CV within experiments ( Fig. 4 , Fig. 5 ). Normalization should not be done arbitrarily but rather validated on a case-by-case basis for the co-delivery method and experimental design used, as this is absolutely necessary for results that are reproducible and robust to potential sources of variability. Though unambiguously beneficial, the use of constitutive, identical promoters is also particularly limiting given the popularity of N. benthamiana to characterize the effects of promoter identity and architecture on transcription. This problem is undoubtedly compounded in more complex experimental designs. To increase predictability and standardization of normalization methods, multi-lab efforts to quantify variation using diverse methods will be necessary. More robust transcriptomic datasets of N. benthamiana expressing diverse transgenes in distinct host strains could discourage reliance on a single, unvalidated normalizer. Additionally, multi-factor analysis of binary vector construction and expression cassette positioning could elucidate the extent to which these variables affect both expression and variability. There is little published analysis of how the design of multi-gene T-DNA structure affects the transient expression of those genes 47 . We find that convergent cassettes are far more highly expressed than tandem or divergent cassettes. Since Agrobacteria ’s VirD2 virulence protein covalently binds the right border 48 , it is thought that transgenes proximal to the right border would be protected from exonucleolytic degradation and thus more likely to remain intact inside the plant cell, but this hypothesis is not fully supported by our data ( Fig. 2A , Fig. S10). Clearly, T-DNA architecture affects transgene expression strength and variation, and a high-throughput library approach would be ideal to address the multiplicity of orientation and position combinations in multi-gene binary vectors. Determining these rules of expression and assessing them in both stable and transient systems requires further, data-intensive work. Given the lack of large, curated datasets of transient gene expression in N. benthamiana , it is likely that many published N. benthamiana experiments chose sample sizes arbitrarily based on unvalidated assumptions. Our model of the statistical power required to determine different effect sizes with high confidence shows that in cases where the expected effect size is large, it is easy to achieve the necessary sample size. For example, for effect sizes >50%, fewer than three plants are required using the GV3101 strain. For effect sizes <20%, many plants are required, to the extent that the number of plants needed may be infeasible for single experiments ( e.g. 50 plants are needed to show a 13.7% effect using EHA105). The majority of synthetic biology applications for transient expression, such as bioproduction or circuit reconstruction, require strong effects, which call for small numbers of plants. However, these results could have strong implications for subtle phenotypes, like the transformation efficiency of various Agrobacterium strains or mutants 37 , 49 , or inducible gene expression systems 47 , 50 , 51 . While the data in this work required many hundreds of plants and multiple years to collect, we were nonetheless only able to capture variation in N. benthamiana transient expression from a rather narrow perspective. All of our data are from fluorescent reporters from 4-week-old plants, with data collected three days after infiltration. We demonstrated that Agrobacterium strain, promoter choice, and T-DNA design all impact variation, but many more strains, plasmids, and expression cassette designs remain untested. There are other variables affecting Agrobacterium -mediated transformation that we did not address, such as binary vector origin of replication or T-DNA length. Furthermore, as novel Agrobacterium -independent technologies to introduce nucleic acid and proteins into plant cells mature 52 , 53 , their variability should also be estimated. It is critically important to establish whether our values of variance are broadly applicable, and future work should prioritize cross-lab validation. Even in this simple context, variation in N. benthamiana transient expression depends strongly on a host of inputs, and attempts to normalize and mitigate this variation must be individually validated. As complexity increases in synthetic biology experimental designs, this unpredictability in variation and in confidence will likely be compounded. Our results show that the choice and validation of normalization methods and data collection are critical for N. benthamiana to be a reliable platform for applications such as reconstituting complex metabolic pathways and designing large genetic circuits. As we have thoroughly demonstrated, careful, purposeful experimental design and interpretation are paramount to ensure robust and reproducible results when using this essential technique for synthetic plant biology. Methods Media, chemicals, and culture conditions Routine bacterial cultures were grown in Luria-Bertani (LB) Miller medium (BD Biosciences, USA). E. coli was grown at 37LJ°C, while A. tumefaciens was grown at 30LJ°C unless otherwise noted. Cultures were supplemented with rifampicin (100 μg/mL), kanamycin (50LJμg/L, Sigma Aldrich, USA), gentamicin (30LJμg/L, Fisher Scientific, USA), or spectinomycin (100μg/L, Sigma Aldrich, USA), when indicated. Bacterial strain and plasmid construction All bacterial strains and plasmids used in this work are listed in Supplementary Table 1. All strains and plasmids created in this work are viewable through the public instance of the Joint BioEnergy Institute (JBEI) registry: https://public-registry.jbei.org/folders/929 . All strains and plasmids created in this work can be requested from the strain archivist at JBEI with a signed material transfer agreement. Plasmids were assembled by Gibson assembly using standard protocols. Plasmids were routinely isolated using the QIAprep spin miniprep kit (Qiagen) and all primers were purchased from Integrated DNA Technologies (IDT). Plasmid sequences were verified using whole-plasmid sequencing (Primordium Labs). Agrobacterium was routinely transformed by electroporation as described previously using a 1-mm cuvette and a 2.4-kV, 25-μF, 200-Ω pulse 54 . N. benthamiana growth conditions Wild type N. benthamiana (LAB accession) plants were obtained from the in-house seed bank at the Joint BioEnergy institute. All seedlings and plants were grown at 25LJ°C in 60% humidity under long-day conditions (16LJh of light, 8LJh of darkness) of 150 μmol m −2 s −1 photosynthetically active radiation (PAR; wavelength: 400–700LJnm). As many pots as needed of Sungro Sunshine mix #4 (aggregate plus) were wetted by running excess tap water from above and allowing it to drain through. The soil was then topped with a layer of topsoil that was thoroughly wetted with a spray bottle. Using a spatula, a pinch of seeds were sprinkled evenly over the soil. Ideally, 50-100 good seedlings per pot germinate. If seeds are sown too densely, the seedlings are smaller, and having more sparse, healthy seedlings results in superior plant quality at later stages. All seedling pots were placed in a flat with 1L tapwater and covered with a hood, vents closed, in the growth room. If algal or cyanobacterial contamination grows in the water, reduce the volume of water added to the tray. After one week, flats (as many as needed) were filled with 18 3.11“ x 3.11“ x 2.25“ Traditional Inserts pots (Greenhouse Megastore). These pots were filled to the top with Sungro Sunshine mix #4 (aggregate plus), supplemented with 1.5 Tbsp Osmocote (14-14-14) pellets per 4L soil, and then 3L of tap water was added to the flat. The soil was allowed to soak up the water for 2-3 hours, and then any excess was drained off and the pots broken apart. Small holes were made in each pot’s soil, and the germinated seedlings were transplanted into individual pots. The root of the seedling must not be damaged during transplantation. The block of soil from a seedling pot can be removed and placed on its side to facilitate removing seedlings from soil without causing damage. Flats were covered with a hood, vents closed, in the growth room. After one week, all the vents were opened to allow the hood to slowly equilibrate to the ambient conditions in the growth room. Five days later, the hoods were removed. Two days later, each flat was watered with tap water supplemented with Peter’s Professional (20-20-20) at 1 tsp per 4L water. After five days, the pots were rearranged into a checkerboard pattern within the flats to maximize the amount of space per plant, decreasing the density from 18 plants per flat to 9 plants per flat. Each flat was also watered with 1L water. Three days later, plants were infiltrated. A highly detailed protocol of N. benthamiana growth and care is provided in Supplemental Methods 1. Agroinfiltration of N. benthamiana Generated binary vectors were transformed into A. tumefaciens strain GV3101 via electroporation 54 . BiBi strains were generated by growing a liquid culture of single transformants to saturation, pelleting and washing thrice with ice cold 10% glycerol, resuspending in 100ul water, and electroporating the second binary vector into the cells. Selected transformants were inoculated in liquid media with appropriate selection the night before the experiment. A. tumefaciens strains were grown until OD 600 between 0.8-1.2, centrifuged for 10 min at 4000 g, and resuspended in infiltration buffer (10 mM MgCl2, 10 mM MES, and 200 μM acetosyringone, pH 5.6) to achieve the desired OD 600 . Cultures were induced for 1 h at room temperature on a rocking shaker. Leaves T4 and T5 of 4-week-old N. benthamiana plants were syringe infiltrated with the A. tumefaciens suspensions. After infiltration, N. benthamiana plants were maintained in the same growth conditions as described above with 1L tap water per tray. Three days post infiltration, four 6-mm leaf discs per infiltrated leaf were hole punched. The leaf discs were placed abaxial side up on 350 μL of water in black, 360-μL 96 well Costar Assay Plates with clear flat bottoms (Corning). eGFP (Ex.λ = 488 nm, Em.λ = 520 nm) and mCherry (Ex.λ = 587 nm, Em.λ = 615 nm) fluorescences were measured using a Synergy 4 microplate reader (Bio-tek). Gain was set at 100 and read height at 10.5 mm. RUBY extraction and quantification Leaves T4 and T5 of 4-week N. benthamiana were co-infiltrated with equal amounts of three strains (carrying vectors 2-4 from Supplementary Table 1) on side of the leaf and infiltrated with one strain (carrying vector 5 from Supplementary Table 5) on the other. Total OD 600 for both delivery methods was 0.5, and the infiltrated spots were not touching. Leaf tissues infiltrated with RUBY constructs were excised with a razor blade from the leaf 5 dpi, frozen in liquid nitrogen, and lyophilized for 2 d. Tissues were then weighed to record dry weights and homogenized with metal beads in a PowerLyzer at 1000 g for 2 min. 80 μL of 20% methanol per mg of dry weight was added to each sample. Samples were then centrifuged at 15,000 rcf for 5 min, and 100 μl of the supernatant and diluted with an additional 500 μl of water. Absorbances at λ = 538 nm of 300 μl of the diluted extracts in black, 360-μL 96 well Costar Assay Plates with clear flat bottoms (Corning) were measured in a Syngery 4 microplate reader (Bio-tek). 2-pyrone-4,6-dicarboxylic acid (PDC) extraction and quantification The entirety of leaves T4 and T5 of 4-week old N. benthamiana were infiltrated with 0.2 OD 600 of each of the five enzymes in the PDC pathway (total OD 600 = 1). At 5 dpi, both leaves were frozen in liquid nitrogen together and lyophilized for 2 d. Leaves were then ball-milled and extracted with 80% (v/v) methanol-water as solvent as previously described 40 . Metabolites were analyzed using an HPLC-ESI-TOF-MS as previously described and quantified with a 6-point calibration curve of PDC standard 40 , 41 . Statistical analysis Mixed effects model and Monte Carlo simulations were run using R (v4.2.0) and the following packages: tidyverse (v2.0.0) 55 , transport (v0.14.6), car (v3.1.3), lme4 (v1.1.31) 56 , and performance (v0.13.0) 57 . All other analyses and figures were generated with Python (v3.11.4) and the following packages: jupyterlab (v4.0.3) 58 , pandas (v2.3.3), numpy (v2.3.3) 59 , seaborn (v0.13.2), matplotlib (v3.10.6), scipy (v1.16.1) 60 , and statsmodels (v0.14.5). Data availability All code related to this study is publicly available on GitHub (github.com/shih-lab/benthi_variation). Contributions P.M.S. and M.G.T. conceptualized the initial study. M.G.T., S.A., L.M.W., and S.N.T. designed experiments. S.N.T., K.D., and A.C. generated plasmids and strains. S.N.T, S.S., L.D.K., S.L., M.G.T., M.J.S., K.D., L.H., S.K., E.A.T, A.E., E.E., and A.L. performed experiments. M.J.S. performed mixed-effect modeling and Monte Carlo simulations, and S.N.T. completed all other data analysis. S.N.T. wrote the draft manuscript. All authors discussed the results, reviewed the article, and approved the final article. Ethics declarations M.G.T., M.J.S., and P.M.S. have financial interest in BasidioBio. PMS also has financial interest in Totality Biosciences. Acknowledgements We would like to thank Dr. Tyler Backman and Dr. Hector Garcia-Martin for their invaluable advice on statistics, and to all members of the Shih lab for their helpful discussions. We also thank Konami for facilitating discussion of expression cassette orientation via Dance Dance Revolution artwork. BioRender was used to generate figures 1 ( https://biorender.com/kh6zx0s ), 2 ( https://BioRender.com/2vhubua ), S1 ( https://biorender.com/82xc4es ), S8 ( https://biorender.com/4ila5ts ), and S9 ( https://biorender.com/w0f87at ). This material is based upon work supported by the National Science Foundation Graduate Research Fellowship under Grant No. DGE 2146752. This work was part of the DOE Joint BioEnergy Institute ( https://www.jbei.org ) supported by the U. S. Department of Energy, Office of Science, Office of Biological and Environmental Research, supported by the U.S. Department of Energy, Energy Efficiency and Renewable Energy, Bioenergy Technologies Office, through contract DE-AC02-05CH11231 between Lawrence Berkeley National Laboratory and the U.S. Department of Energy. The funders had no role in manuscript preparation or the decision to publish. The views and opinions of the authors expressed herein do not necessarily state or reflect those of the United States Government or any agency thereof. Neither the United States Government nor any agency thereof, nor any of their employees, makes any warranty, expressed or implied, or assumes any legal liability or responsibility for the accuracy, completeness, or usefulness of any information, apparatus, product, or process disclosed, or represents that its use would not infringe privately owned rights. The United States Government retains and the publisher, by accepting the article for publication, acknowledges that the United States Government retains a nonexclusive, paid-up, irrevocable, worldwide license to publish or reproduce the published form of this manuscript, or allow others to do so, for United States Government purposes. The Department of Energy will provide public access to these results of federally sponsored research in accordance with the DOE Public Access Plan ( http://energy.gov/downloads/doe-public-access-plan ). Footnotes Our updated preprint has a more comprehensive model of the sources of variation in Nicotiana benthamiana transient expression assays. References 1. ↵ Yang , S.-J. , Carter , S. A. , Cole , A. B. , Cheng , N.-H. & Nelson , R. S. A natural variant of a host RNA-dependent RNA polymerase is associated with increased susceptibility to viruses by Nicotiana benthamiana . Proc Natl Acad Sci USA 101 , 6297 – 6302 ( 2004 ). OpenUrl Abstract / FREE Full Text 2. Kapila , J. , De Rycke , R. , Van Montagu , M. & Angenon , G. An Agrobacterium-mediated transient gene expression system for intact leaves . Plant Sci . 122 , 101 – 108 ( 1997 ). OpenUrl CrossRef Web of Science 3. ↵ Grimsley , N. , Hohn , B. , Hohn , T. & Walden , R. “Agroinfection,” an alternative route for viral infection of plants by using the Ti plasmid . Proc Natl Acad Sci USA 83 , 3282 – 3286 ( 1986 ). OpenUrl Abstract / FREE Full Text 4. ↵ Schöb , H. , Kunz , C. & Meins , F. Silencing of transgenes introduced into leaves by agroinfiltration: a simple, rapid method for investigating sequence requirements for gene silencing . Mol. Gen. Genet . 256 , 581 – 585 ( 1997 ). OpenUrl CrossRef PubMed Web of Science 5. ↵ Ruiz , M. T. , Voinnet , O. & Baulcombe , D. C. Initiation and maintenance of virus-induced gene silencing . Plant Cell 10 , 937 – 946 ( 1998 ). OpenUrl Abstract / FREE Full Text 6. ↵ Chakrabarty , R. et al. PSITE vectors for stable integration or transient expression of autofluorescent protein fusions in plants: probing Nicotiana benthamiana-virus interactions . Mol. Plant Microbe Interact . 20 , 740 – 750 ( 2007 ). OpenUrl CrossRef PubMed Web of Science 7. ↵ Irmisch , S. et al. Discovery of UDP-Glycosyltransferases and BAHD-Acyltransferases Involved in the Biosynthesis of the Antidiabetic Plant Metabolite Montbretin A . Plant Cell 30 , 1864 – 1886 ( 2018 ). OpenUrl Abstract / FREE Full Text 8. Wood , C. C. et al. A leaf-based assay using interchangeable design principles to rapidly assemble multistep recombinant pathways . Plant Biotechnol. J . 7 , 914 – 924 ( 2009 ). OpenUrl CrossRef PubMed Web of Science 9. Martin , L. B. B. et al. Complete biosynthesis of the potent vaccine adjuvant QS-21 . Nat. Chem. Biol . 20 , 493 – 502 ( 2024 ). OpenUrl CrossRef PubMed 10. Calgaro-Kozina , A. et al. Engineering plant synthetic pathways for the biosynthesis of novel antifungals . ACS Cent. Sci . 6 , 1394 – 1400 ( 2020 ). OpenUrl PubMed 11. ↵ Nett , R. S. , Lau , W. & Sattely , E. S. Discovery and engineering of colchicine alkaloid biosynthesis . Nature 584 , 148 – 153 ( 2020 ). OpenUrl CrossRef PubMed 12. ↵ Jores , T. et al. Synthetic promoter designs enabled by a comprehensive analysis of plant core promoters . Nat. Plants 7 , 842 – 855 ( 2021 ). OpenUrl PubMed 13. ↵ Hummel , N. F. C. et al. The trans-regulatory landscape of gene networks in plants . Cell Syst . 14 , 501 – 511 .e4 ( 2023 ). OpenUrl PubMed 14. ↵ Zhou , A. et al. A suite of constitutive promoters for tuning gene expression in plants . ACS Synth. Biol . 12 , 1533 – 1545 ( 2023 ). OpenUrl CrossRef PubMed 15. Brophy , J. A. N. et al. Synthetic genetic circuits as a means of reprogramming plant roots . Science 377 , 747 – 751 ( 2022 ). OpenUrl CrossRef PubMed 16. ↵ Belcher , M. S. et al. Design of orthogonal regulatory systems for modulating gene expression in plants . Nat. Chem. Biol . 16 , 857 – 865 ( 2020 ). OpenUrl CrossRef PubMed 17. ↵ Wu , F.-H. et al. Tape-Arabidopsis Sandwich - a simpler Arabidopsis protoplast isolation method . Plant Methods 5 , 16 ( 2009 ). OpenUrl CrossRef PubMed 18. ↵ Yoo , S.-D. , Cho , Y.-H. & Sheen , J. Arabidopsis mesophyll protoplasts: a versatile cell system for transient gene expression analysis . Nat. Protoc . 2 , 1565 – 1572 ( 2007 ). OpenUrl CrossRef PubMed Web of Science 19. ↵ Morey , K. & Khakhar , A. Exploring the frontier of rapid prototyping technologies for plant synthetic biology and what could lie beyond . New Phytol . 242 , 903 – 908 ( 2024 ). OpenUrl CrossRef PubMed 20. ↵ Bally , J. et al. The Rise and Rise of Nicotiana benthamiana: A Plant for All Reasons . Annu. Rev. Phytopathol . 56 , 405 – 426 ( 2018 ). OpenUrl CrossRef PubMed 21. ↵ Lux , M. W. , Strychalski , E. A. & Vora , G. J. Advancing reproducibility can ease the “hard truths” of synthetic biology . Synth Biol (Oxf) 8 , ysad014 ( 2023 ). OpenUrl CrossRef PubMed 22. ↵ Zhou , X. , Mehta , S. & Zhang , J. Genetically encodable fluorescent and bioluminescent biosensors light up signaling networks . Trends Biochem. Sci . 45 , 889 – 905 ( 2020 ). OpenUrl CrossRef PubMed 23. Khosla , A. , Rodriguez-Furlan , C. , Kapoor , S. , Van Norman , J. M. & Nelson , D. C. A series of dual-reporter vectors for ratiometric analysis of protein abundance in plants . Plant Direct 4 , e00231 ( 2020 ). OpenUrl 24. ↵ Rattan , R. , Alamos , S. , Szarzanowicz , M. , Markel , K. & Shih , P. M. Predictable modulation of plant root development using engineered cytokinin regulators . BioRxiv ( 2024 ) doi: 10.1101/2024.12.06.627221 . OpenUrl Abstract / FREE Full Text 25. Morffy , N. et al. Identification of plant transcriptional activation domains . Nature 632 , 166 – 173 ( 2024 ). OpenUrl CrossRef PubMed 26. ↵ Xu , P. et al. Interplay between Agrobacterium T-DNA and backbone DNA in transgenic plant cells . Transgenic Res . 34 , 1 ( 2024 ). OpenUrl PubMed 27. ↵ Buyel , J. F. & Fischer , R. Predictive models for transient protein expression in tobacco (Nicotiana tabacum L.) can optimize process time, yield, and downstream costs . Biotechnol. Bioeng . 109 , 2575 – 2588 ( 2012 ). OpenUrl CrossRef PubMed 28. ↵ Lopatkin , A. J. & Collins , J. J. Predictive biology: modelling, understanding and harnessing microbial complexity . Nat. Rev. Microbiol . 18 , 507 – 520 ( 2020 ). OpenUrl CrossRef PubMed 29. ↵ Covert , M. W. , Gillies , T. E. , Kudo , T. & Agmon , E. A forecast for large-scale, predictive biology: Lessons from meteorology . Cell Syst . 12 , 488 – 496 ( 2021 ). OpenUrl PubMed 30. ↵ Breyne , P. , Gheysen , G. , Jacobs , A. , Van Montagu , M. & Depicker , A. Effect of T-DNA configuration on transgene expression . Mol. Gen. Genet . 235 , 389 – 396 ( 1992 ). OpenUrl CrossRef PubMed 31. ↵ Bhattacharyya , M. K. , Stermer , B. A. & Dixon , R. A. Reduced variation in transgene expression from a binary vector with selectable markers at the right and left T-DNA borders . The Plant Journal ( 1994 ). 32. ↵ Bashandy , H. , Jalkanen , S. & Teeri , T. H. Within leaf variation is the largest source of variation in agroinfiltration of Nicotiana benthamiana . Plant Methods 11 , 47 ( 2015 ). OpenUrl CrossRef PubMed 33. Vazquez-Vilar , M. et al. GB3.0: a platform for plant bio-design that connects functional DNA elements with associated biological data . Nucleic Acids Res . 45 , 2196 – 2209 ( 2017 ). OpenUrl PubMed 34. ↵ Moyle , R. L. et al. An optimized transient dual luciferase assay for quantifying microrna directed repression of targeted sequences . Front. Plant Sci . 8 , 1631 ( 2017 ). OpenUrl CrossRef PubMed 35. ↵ Cazzonelli , C. I. & Velten , J. Analysis of RNA-mediated gene silencing using a new vector (pKNOCKOUT) and an in plantaAgrobacterium transient expression system . Plant Mol. Biol. Rep . 22 , 347 – 359 ( 2004 ). OpenUrl CrossRef 36. ↵ Hellens , R. P. et al. Transient expression vectors for functional genomics, quantification of promoter activity and RNA silencing in plants . Plant Methods 1 , 13 ( 2005 ). OpenUrl CrossRef PubMed 37. ↵ Thompson , M. et al. Genetically refactored Agrobacterium-mediated transformation . BioRxiv ( 2023 ) doi: 10.1101/2023.10.13.561914 . OpenUrl Abstract / FREE Full Text 38. ↵ Huang , Y. W. , Hu , C. C. , Tsai , C. H. , Lin , N. S. & Hsu , Y. H. Chloroplast Hsp70 Isoform Is Required for Age-Dependent Tissue Preference of Bamboo mosaic virus in Mature Nicotiana benthamiana Leaves . Mol. Plant Microbe Interact . 30 , 631 – 645 ( 2017 ). OpenUrl CrossRef PubMed 39. ↵ Sheludko , Y. V. , Sindarovska , Y. R. , Gerasymenko , I. M. , Bannikova , M. A. & Kuchuk , N. V. Comparison of several Nicotiana species as hosts for high-scale Agrobacterium-mediated transient expression . Biotechnol. Bioeng . 96 , 608 – 614 ( 2007 ). OpenUrl CrossRef PubMed Web of Science 40. ↵ Lin , C.-Y. et al. In-planta production of the biodegradable polyester precursor 2-pyrone-4,6-dicarboxylic acid (PDC): Stacking reduced biomass recalcitrance with value-added co-product . Metab. Eng . 66 , 148 – 156 ( 2021 ). OpenUrl CrossRef PubMed 41. ↵ Eudes , A. et al. Production of hydroxycinnamoyl anthranilates from glucose in Escherichia coli . Microb. Cell Fact . 12 , 62 ( 2013 ). OpenUrl CrossRef PubMed 42. ↵ He , Y. , Zhang , T. , Sun , H. , Zhan , H. & Zhao , Y. A reporter for noninvasively monitoring gene expression and plant transformation . Hortic. Res . 7 , 152 ( 2020 ). OpenUrl PubMed 43. ↵ Alamos , S. et al. Quantitative dissection of Agrobacterium T-DNA expression in single plant cells reveals density-dependent synergy and antagonism . Nat. Plants ( 2025 ) doi: 10.1038/s41477-025-01996-w . OpenUrl CrossRef 44. ↵ Szarzanowicz , M. J. et al. Binary vector copy number engineering improves Agrobacterium-mediated transformation . Nat. Biotechnol . 43 , 1708 – 1716 ( 2025 ). OpenUrl PubMed 45. ↵ Diamos , A. G. & Mason , H. S. Chimeric 3’ flanking regions strongly enhance gene expression in plants . Plant Biotechnol. J . 16 , 1971 – 1982 ( 2018 ). OpenUrl CrossRef PubMed 46. ↵ Carlson , E. D. , Rajniak , J. & Sattely , E. S. Multiplicity of the Agrobacterium Infection of Nicotiana benthamiana for Transient DNA Delivery . ACS Synth. Biol . 12 , 2329 – 2338 ( 2023 ). OpenUrl CrossRef PubMed 47. ↵ Kallam , K. et al. Tunable control of insect pheromone biosynthesis in Nicotiana benthamiana . Plant Biotechnol. J . 21 , 1440 – 1453 ( 2023 ). OpenUrl CrossRef PubMed 48. ↵ Dürrenberger , F. , Crameri , A. , Hohn , B. & Koukolíková-Nicola , Z. Covalently bound VirD2 protein of Agrobacterium tumefaciens protects the T-DNA from exonucleolytic degradation . Proc Natl Acad Sci USA 86 , 9154 – 9158 ( 1989 ). OpenUrl Abstract / FREE Full Text 49. ↵ Lopez-Agudelo , J. C. et al. Rhizobium rhizogenes A4-derived strains mediate hyper-efficient transient gene expression in NicotianaLJbenthamiana and other solanaceous plants . Plant Biotechnol. J . ( 2025 ) doi: 10.1111/pbi.70083 . OpenUrl CrossRef 50. ↵ Garcia-Perez , E. et al. A copper switch for inducing CRISPR/Cas9-based transcriptional activation tightly regulates gene expression in Nicotiana benthamiana . BMC Biotechnol . 22 , 12 ( 2022 ). OpenUrl CrossRef PubMed 51. ↵ Larsen , B. et al. Highlighter: An optogenetic system for high-resolution gene expression control in plants . PLoS Biol . 21 , e3002303 ( 2023 ). OpenUrl CrossRef PubMed 52. ↵ Demirer , G. S. et al. High aspect ratio nanomaterials enable delivery of functional genetic material without DNA integration in mature plants . Nat. Nanotechnol . 14 , 456 – 464 ( 2019 ). OpenUrl CrossRef PubMed 53. ↵ Demirer , G. S. , Zhang , H. , Goh , N. S. , González-Grandío , E. & Landry , M. P. Carbon nanotube-mediated DNA delivery without transgene integration in intact plants . Nat. Protoc . 14 , 2954 – 2971 ( 2019 ). OpenUrl CrossRef PubMed 54. ↵ Kámán-Tóth , E. , Pogány , M. , Dankó , T. , Szatmári , Á. & Bozsó , Z. A simplified and efficient Agrobacterium tumefaciens electroporation method . 3 Biotech 8 , 148 ( 2018 ). OpenUrl 55. ↵ Wickham , H. et al. Welcome to the tidyverse . JOSS 4 , 1686 ( 2019 ). OpenUrl CrossRef 56. ↵ Bates , D. , Mächler , M. , Bolker , B. & Walker , S. Fitting linear mixed-effects models using lme4 . J. Stat. Softw . 67 , 1 – 48 ( 2015 ). OpenUrl CrossRef PubMed 57. ↵ Lüdecke , D. , Ben-Shachar , M. , Patil , I. , Waggoner , P. & Makowski , D. performance: An R Package for Assessment, Comparison and Testing of Statistical Models . JOSS 6 , 3139 ( 2021 ). OpenUrl CrossRef 58. ↵ Perez , F. & Granger , B. E. IPython: A System for Interactive Scientific Computing . Comput. Sci. Eng . 9 , 21 – 29 ( 2007 ). OpenUrl CrossRef PubMed 59. ↵ van der Walt , S. , Colbert , S. C. & Varoquaux , G. The NumPy Array: A Structure for Efficient Numerical Computation . Comput. Sci. Eng . 13 , 22 – 30 ( 2011 ). OpenUrl CrossRef PubMed 60. ↵ Virtanen , P. et al. SciPy 1.0: fundamental algorithms for scientific computing in Python . Nat. Methods 17 , 261 – 272 ( 2020 ). OpenUrl CrossRef PubMed View the discussion thread. Back to top Previous Next Posted November 20, 2025. Download PDF Supplementary Material Email Thank you for your interest in spreading the word about bioRxiv. NOTE: Your email address is requested solely to identify you as the sender of this article. Your Email * Your Name * Send To * Enter multiple addresses on separate lines or separate them with commas. You are going to email the following Causes and consequences of experimental variation in Nicotiana benthamiana transient expression Message Subject (Your Name) has forwarded a page to you from bioRxiv Message Body (Your Name) thought you would like to see this page from the bioRxiv website. Your Personal Message CAPTCHA This question is for testing whether or not you are a human visitor and to prevent automated spam submissions. Share Causes and consequences of experimental variation in Nicotiana benthamiana transient expression Sophia N. Tang , Matthew J. Szarzanowicz , Amy Lanctot , Sasilada Sirirungruang , Liam D. Kirkpatrick , Krista Drako , Simón Álamos , Lyurui Cheng , Lucas M. Waldburger , Shuying Liu , Lena Huang , Sami Kazaz , Emine Akyuz Turumtay , Edward Baidoo , Aymerick Eudes , Mitchell G. Thompson , Patrick M. Shih bioRxiv 2025.06.12.659391; doi: https://doi.org/10.1101/2025.06.12.659391 Share This Article: Copy Citation Tools Causes and consequences of experimental variation in Nicotiana benthamiana transient expression Sophia N. Tang , Matthew J. Szarzanowicz , Amy Lanctot , Sasilada Sirirungruang , Liam D. Kirkpatrick , Krista Drako , Simón Álamos , Lyurui Cheng , Lucas M. Waldburger , Shuying Liu , Lena Huang , Sami Kazaz , Emine Akyuz Turumtay , Edward Baidoo , Aymerick Eudes , Mitchell G. Thompson , Patrick M. Shih bioRxiv 2025.06.12.659391; doi: https://doi.org/10.1101/2025.06.12.659391 Citation Manager Formats BibTeX Bookends EasyBib EndNote (tagged) EndNote 8 (xml) Medlars Mendeley Papers RefWorks Tagged Ref Manager RIS Zotero Tweet Widget Facebook Like Google Plus One Subject Area Plant Biology Subject Areas All Articles Animal Behavior and Cognition (7629) Biochemistry (17660) Bioengineering (13881) Bioinformatics (41910) Biophysics (21436) Cancer Biology (18576) Cell Biology (25480) Clinical Trials (138) Developmental Biology (13368) Ecology (19887) Epidemiology (2067) Evolutionary Biology (24302) Genetics (15598) Genomics (22482) Immunology (17726) Microbiology (40360) Molecular Biology (17163) Neuroscience (88534) Paleontology (666) Pathology (2830) Pharmacology and Toxicology (4821) Physiology (7637) Plant Biology (15129) Scientific Communication and Education (2045) Synthetic Biology (4290) Systems Biology (9817) Zoology (2269)

Text is read by the "Ask this paper" AI Q&A widget below. Extraction quality varies by source — PMC NXML preserves structure cleanly, OA-HTML may include some navigation residue, and OA-PDF can have broken hyphenation. The publisher copy (via DOI) is the canonical version.

My notes (saved in your browser only)

Ask this paper AI returns verbatim quotes from the full text · source: preprint-html

Answers must be backed by verbatim quotes from this paper's full text. Hallucinated quotes are dropped automatically; if no verbatim passage answers the question, we say so. How this works

Citation neighborhood (no data yet)

We don't have any in-corpus citations linked to this paper yet. This is a recent paper (2025) — citers typically take a year or two to land, and the OpenAlex reference graph may still be filling in.

Source provenance

europepmc
last seen: 2026-05-20T01:45:00.602351+00:00