Differential functions of upstream and intronic HOT regions shape dlg-1 transcription and C. elegans development

preprint OA: gold
📄 Open PDF Full text JSON View at publisher
Full text 39,403 characters · extracted from preprint-html · click to expand
Differential functions of upstream and intronic HOT regions shape dlg-1 transcription and C. elegans development | bioRxiv /* */ /* */ <!-- <!-- /*! * yepnope1.5.4 * (c) WTFPL, GPLv2 */ (function(a,b,c){function d(a){return"[object Function]"==o.call(a)}function e(a){return"string"==typeof a}function f(){}function g(a){return!a||"loaded"==a||"complete"==a||"uninitialized"==a}function h(){var a=p.shift();q=1,a?a.t?m(function(){("c"==a.t?B.injectCss:B.injectJs)(a.s,0,a.a,a.x,a.e,1)},0):(a(),h()):q=0}function i(a,c,d,e,f,i,j){function k(b){if(!o&&g(l.readyState)&&(u.r=o=1,!q&&h(),l.onload=l.onreadystatechange=null,b)){"img"!=a&&m(function(){t.removeChild(l)},50);for(var d in y[c])y[c].hasOwnProperty(d)&&y[c][d].onload()}}var j=j||B.errorTimeout,l=b.createElement(a),o=0,r=0,u={t:d,s:c,e:f,a:i,x:j};1===y[c]&&(r=1,y[c]=[]),"object"==a?l.data=c:(l.src=c,l.type=a),l.width=l.height="0",l.onerror=l.onload=l.onreadystatechange=function(){k.call(this,r)},p.splice(e,0,u),"img"!=a&&(r||2===y[c]?(t.insertBefore(l,s?null:n),m(k,j)):y[c].push(l))}function j(a,b,c,d,f){return q=0,b=b||"j",e(a)?i("c"==b?v:u,a,b,this.i++,c,d,f):(p.splice(this.i++,0,a),1==p.length&&h()),this}function k(){var a=B;return a.loader={load:j,i:0},a}var l=b.documentElement,m=a.setTimeout,n=b.getElementsByTagName("script")[0],o={}.toString,p=[],q=0,r="MozAppearance"in l.style,s=r&&!!b.createRange().compareNode,t=s?l:n.parentNode,l=a.opera&&"[object Opera]"==o.call(a.opera),l=!!b.attachEvent&&!l,u=r?"object":l?"script":"img",v=l?"script":u,w=Array.isArray||function(a){return"[object Array]"==o.call(a)},x=[],y={},z={timeout:function(a,b){return b.length&&(a.timeout=b[0]),a}},A,B;B=function(a){function b(a){var a=a.split("!"),b=x.length,c=a.pop(),d=a.length,c={url:c,origUrl:c,prefixes:a},e,f,g;for(f=0;f<d;f++)g=a[f].split("="),(e=z[g.shift()])&&(c=e(c,g));for(f=0;f<b;f++)c=x[f](c);return c}function g(a,e,f,g,h){var i=b(a),j=i.autoCallback;i.url.split(".").pop().split("?").shift(),i.bypass||(e&&(e=d(e)?e:e[a]||e[g]||e[a.split("/").pop().split("?")[0]]),i.instead?i.instead(a,e,f,g,h):(y[i.url]?i.noexec=!0:y[i.url]=1,f.load(i.url,i.forceCSS||!i.forceJS&&"css"==i.url.split(".").pop().split("?").shift()?"c":c,i.noexec,i.attrs,i.timeout),(d(e)||d(j))&&f.load(function(){k(),e&&e(i.origUrl,h,g),j&&j(i.origUrl,h,g),y[i.url]=2})))}function h(a,b){function c(a,c){if(a){if(e(a))c||(j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}),g(a,j,b,0,h);else if(Object(a)===a)for(n in m=function(){var b=0,c;for(c in a)a.hasOwnProperty(c)&&b++;return b}(),a)a.hasOwnProperty(n)&&(!c&&!--m&&(d(j)?j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}:j[n]=function(a){return function(){var b=[].slice.call(arguments);a&&a.apply(this,b),l()}}(k[n])),g(a[n],j,b,n,h))}else!c&&l()}var h=!!a.test,i=a.load||a.both,j=a.callback||f,k=j,l=a.complete||f,m,n;c(h?a.yep:a.nope,!!i),i&&c(i)}var i,j,l=this.yepnope.loader;if(e(a))g(a,0,l,0);else if(w(a))for(i=0;i (function(w,d,s,l,i){w[l]=w[l]||[];w[l].push({'gtm.start':new Date().getTime(),event:'gtm.js'});var f=d.getElementsByTagName(s)[0];var j=d.createElement(s);var dl=l!='dataLayer'?'&l='+l:'';j.src='//www.googletagmanager.com/gtm.js?id='+i+dl;j.type='text/javascript';j.async=true;f.parentNode.insertBefore(j,f);})(window,document,'script','dataLayer','GTM-M677548'); Skip to main content Home About Submit ALERTS / RSS Search for this keyword Advanced Search New Results Differential functions of upstream and intronic HOT regions shape dlg-1 transcription and C. elegans development View ORCID Profile Cristina Tocchini , View ORCID Profile Fanny Eggeler , Palmer Bassett , View ORCID Profile Susan E. Mango doi: https://doi.org/10.1101/2025.06.13.659077 Cristina Tocchini 1 Biozentrum, University of Basel , 4056 Basel, Switzerland Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Cristina Tocchini For correspondence: c.tocchini{at}unibas.ch susan.mango{at}unibas.ch Fanny Eggeler 1 Biozentrum, University of Basel , 4056 Basel, Switzerland Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Fanny Eggeler Palmer Bassett 1 Biozentrum, University of Basel , 4056 Basel, Switzerland Find this author on Google Scholar Find this author on PubMed Search for this author on this site Susan E. Mango 1 Biozentrum, University of Basel , 4056 Basel, Switzerland Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Susan E. Mango For correspondence: c.tocchini{at}unibas.ch susan.mango{at}unibas.ch Abstract Full Text Info/History Metrics Supplementary material Data/Code Preview PDF Abstract High occupancy target (HOT) regions, genomic sites bound by many transcription factors, are found across eukaryotes, but their physiological roles remain unclear. We characterized two HOT regions in the Caenorhabditis elegans dlg-1 locus containing transcription start sites: one upstream the coding sequence and one in the first intron. The upstream region is essential for proper transcription and proper animal development, while the intronic region modestly enhances transcription in epidermal cells. Our findings reveal the functions of HOT regions in animal development, expanding the repertoire of gene regulation strategies in C. elegans . Background Precise regulation of gene expression is crucial for orchestrating complex developmental processes. Transcriptional control relies on a series of regulatory elements located within promoters or in distant genomic regions containing enhancers or repressors ( 1 ). In Caenorhabditis elegans , transcriptional regulation mainly relies on regulatory sequences within promoters, in the close proximity to a gene’s coding sequence (CDS). High occupancy target (HOT) regions are genomic sites bound by unusually large numbers of transcription factors ( 2 , 3 ). HOT regions have been identified across the C. elegans genome and may coincide with enhancer elements, promoters and transcription start sites (TSS) that commonly activate transcription ubiquitously ( 2 , 4 , 5 ). The contribution of HOT regions to transcriptional regulation in a physiological context remains poorly understood. Here, we dissect the regulatory landscape of the dlg-1/Discs large locus during embryonic morphogenesis ( 6 , 7 ). Previously published genomic data revealed multiple candidate regulatory elements for the dlg-1 gene ( 2 , 5 , 8 ). We focused our attention on two HOT regions marked by strong peaks of RNA Polymerase II (PolII) revealed by chromatin immuno-precipitation and sequencing (ChIP-seq), and containing TSS ( 5 , 9 , 10 ): one located upstream the CDS, and one in the first intron. Notably, the upstream HOT region is located more than four kilo-bases (Kb) away the CDS, and the one in the first intron contains enhancer sites, too. Long distances between TSS and CDS are likely allowed by widespread trans-splicing in C. elegans . Approximately 70% of genes, including dlg-1 , receive an SL1 spliced leader that removes the 5′ portion of the primary transcript, thereby decoupling TSS position from mature 5′ UTR structure ( 11 ). By analyzing single-copy integrated transcriptional reporters and CRISPR-generated deletion strains, we clarified the roles of the two HOT regions in the dlg-1 locus during development. Specifically, a subdomain within the conserved region in the upstream HOT region is sufficient for wild-type transcriptional levels in all dlg-1 -positive cells, and is required for normal development. The HOT region in the first intron possesses weak transcriptional capabilities that are restricted to epidermal cells, and are not essential for development. Together, our findings describe the physiological relevance of HOT regions containing TSS and/or enhancer sites and how they control general and selective gene expression in C. elegans . This study provides a physiological example of regulatory strategies used in C. elegans transcriptional regulation. Results and discussion We focused our analysis of transcriptional regulation on the dlg-1 locus, which is expressed in diverse tissues ( 6 , 7 ). The dlg-1 promoter has been originally defined as a seven-kilobase (Kb) sequence that stretches from the CDS of the gene upstream on the minus DNA strand, dpyd-1 , to the SL1 (believed to be also the TSS) of the dlg-1 gene on the plus DNA strand ( 12 ) ( Figure 1A and S1A). More recently, different promoters and TSS have been identified in the dlg-1 locus ( 2 , 5 , 8 ). In analyzing the seven-Kb sequence upstream the dlg-1 CDS, we identified a genomic region highly conserved among the Caenorhabditis species (Figure S1A). This region is bound by several transcription factors (TFs) suggestive of a high occupancy target (HOT) region ( 2 , 3 ) (Figure S1B). Large-scale studies aiming to identify HOT regions indeed picked up this genomic site as a HOT region and promoter of dlg-1 ( 2 , 5 , 10 ). This HOT site also contains polymerase II peaks during embryogenesis (Figure S1C), confirming its role as a promoter ( 9 ). Controversially, C. elegans sequences that dictate correct expression levels and patterning are usually located within a few hundred base-pairs (bp) from a gene’s CDS ( 3 , 13 – 15 ). The conserved region is positioned approximately four Kb from the CDS of dlg-1 and is overlapping and bordered by chromatin marks typically found in enhancers. Specifically, it is enriched in acetylated lysine 27 (H3K27ac) and mono- and di-methylated lysine 4 of histone H3 (H3K4me1/2), and depleted from tri-methylated lysine 4 of histone H3 (H3K4me3) (Figure S1D) ( 5 , 16 ). Indeed, this genomic region has been predicted an enhancer site ( 5 ). Cohesins have been shown to organize the DNA in a way that active enhancers make contacts in the 3D space forming “fountains” detectable in Hi-C data ( 17 , 18 ). Although the presence of a fountain at this locus remains to be determined during embryogenesis, ARC-C data showed the putative HOT region interacts with other DNA sequences, including the first intron of dlg-1 ( 1 ). Download figure Open in new tab Figure 1. A small sequence within the upstream HOT region is the man driver of dlg-1 transcription. A . Schematic representation of the dlg-1 locus: black, exons (thick lines) and introns/UTR (thin lines); cyan, the first long intron; light grey, distal-most sequence of the upstream region to the CDS (Distal); dark purple, sequence in and around the upstream HOT region (uHOT); dark grey, proximal-most sequence of the upstream region (Proximal). Scale bar: 1 Kb. B . Upper-right side: schematic representation of the transgenic constructs used in this figure: H2B::mNG (mNG) coding sequence containing three synthetic introns (green) and a tbb-2 3’UTR (white) were under the control of upstream regions with different lengths (white). The fluorescent images are from live C. elegans embryos (outlined by dashed lines) at the comma stage and corresponding zoom-ins (squared boxes). The three seam cell nuclei used for quantitation are highlighted in the zoom-ins with dashed lines. A reference nucleus to identify the same measured nuclei in all the conditions is highlighted with an asterisk. The transgene expressed in the exemplifying embryos are stated above each image and accompanied with a small schematic. Scale bars: 10 µm (whole embryo) and 5 µm (zoom-in). C . Bar plot with error bars (standard deviation) normalized to the FL. Each dot represents the maximum fluorescent intensity of a seam cell nucleus. ns: not significant; ***: p < 0.01. For raw data, see Table S1. D , F . Upper-right side: schematic representations of the types of transgenic constructs used in these panels: H2B::mNG (mNG) coding sequence containing three synthetic introns (green) and a tbb-2 3’UTR (white) were under the control of portions of the upstream HOT region (purple, D) or the first intron (cyan, F) followed by a minimal Δpes-10 promoter (MINp, orange). The fluorescent images are from live C. elegans embryos (outlined by dashed lines) at the comma stage and corresponding zoom-ins (squared boxes) of the three seam cell nuclei used for quantitation (smaller dashed lines depict nuclei boundaries). A reference cell to identify the same three seam cells measured in all the conditions in highlighted with an asterisk. The transgenes expressed in the embryos are stated above each image and accompanied with a small schematic. Scale bars: 10 µm (whole embryo) and 5 µm (zoom-in). E , G . Bar plot with error bars (standard deviation) normalized to the FL. Each dot represents the maximum fluorescent intensity of a seam cell nucleus (three nuclei per embryo). ns: not significant; ***: p < 0.01. For raw data, see Table S1. We hypothesized the upstream HOT region is the main driver of dlg-1 transcriptional regulation. To test this idea, we generated three single-copy, integrated transcriptional reporters carrying a histone H2B sequence fused to an mNeon-Green (mNG) fluorescent protein under the transcriptional control of the following dlg-1 upstream regions: a full-length sequence (FL) and two deletion sequences spanning from the beginning (uHOT) or the end (Short) of the HOT region until the dlg-1 CDS ( Figure 1B,C ). Live imaging and quantitation analyses showed minor and insignificant differences between the FL and the uHOT reporters regarding cell-type specificity ( Figure 1B ) and levels of expression (FL mean = 1.00, STDEV = 0.26; uHOT mean = 0.93, STDEV = 0.22; Figure 1C ), and recapitulated that of the endogenous dlg-1 gene ( 6 , 7 ). The Short reporter, containing nearly four Kb upstream the CDS and containing three other dlg-1 promoters ( 5 ), showed a dramatic reduction in expression levels compared to FL and uHOT (Short mean = 0.29, STDEV = 0.08; Figure 1B,C ). This reduction was observed in most of the cells where endogenous dlg-1 is normally expressed ( Figure 1B and S2). Only developing epidermal cells were still transcriptionally active, as shown previously with an extrachromosomal dlg-1 transcriptional reporter with truncated upstream region from the CDS ( 19 ). smFISH experiments showed that the transcriptional control mediated by the upstream HOT region was specific to dlg-1 , as the nearby dpyd-1 locus was expressed sporadically (Figure S2). Together, these analyses demonstrate that the upstream HOT region is necessary to (i) increase majorly dlg-1 expression in developing epidermal cells, and (ii) allow dlg-1 expression in a broader range of cell types, such as neuronal and pharyngeal precursors. We conclude that the upstream HOT region constitutes a key regulatory sequence for correct expression levels and patterning of dlg-1 . To understand the sufficiency and determine which portion of the upstream HOT region was important for its function in gene expression strength and patterning, we selected four small regions within and surrounding the upstream conserved region (uHOT1 = 406 bp; uHOT2 = 185 bp; uHOT3 = 332 bp; uHOT4 = 374 bp) ( Figure 1A,D,E ). Each region was paired with the minimal promoter Δpes-10 (MINp) ( Figure 1D ), commonly used to assess the functionality of candidate regulatory sequences in the context of transcription ( 20 ) and generated four transcriptional reporters. As previously described, we performed live imaging and fluorescence quantitation on these reporters to assess the levels and pattern of expression dictated by each sequence. Among the four synthetic promoters designed, only uHOT2 and uHOT3 were permissive for transcription (FL mean = 1.00, STDEV = 0.19; uHOT1 mean = 0.02, STDEV = 0.05; uHOT2 mean = 0.10, STDEV = 0.08; uHOT3 mean = 0.94, STDEV = 0.35; uHOT4 mean = −0.01, STDEV = 0.02; Figure 1D,E ). The uHOT2 reporter showed scattered and variable expression that differed significantly in expression levels compared to the FL. The uHOT3 reporter showed patterning ( Figure 1D ) and expression levels ( Figure 1E ) comparable to the FL reporter. These data suggest that a small conserved sequence of 330 bp, which lies more than four Kb from the CDS, is a strong driver and main promoter of dlg-1 transcription during embryonic morphogenesis. We found a second region within the first long intron of dlg-1 was also enriched for TF binding sites ( 3 ) (Figure S1B) and H3K4me1/2 chromatin modifications ( 13 ) (Figure S1D). Indeed the first intron has been reported to be a HOT region and contain promoter and enhancer sites ( 5 ). Long first introns have been shown to frequently contain regulatory regions used for transcription, such as enhancers ( 21 – 23 ). The enhancers located in introns can drive gene expression in patterns that are distinct from, yet complementary to, those found in the gene’s promoter ( 13 ). To test if the first intron contributed to dlg-1 transcriptional control, we generated two single-copy integrated lines where the first intron was either paired with a minimal promoter Δpes-10 (INT1) or inserted in the FL transgene within the H2B sequence, acting as an actual intron (FL-INT1) ( Figure 1F ). The reporter INT1 was created to test the transcriptional abilities of intron 1 alone, whereas the reporter FL-INT1 was engineered to determine if the first intron was changing the transcriptional capabilities of the upstream region ( Figure 1F,G ). We found that the fluorescence expression driven by the INT1 reporter was confined to developing epidermal cells ( Figure 1F , S3) and minimal (13% of the FL; Mean FL = 1.00, STDEV FL = 0.19; Mean INT1 = 0.13, STDEV INT1 = 0.02; Figure 1G and S3), suggesting that this sequence plays a marginal role in dlg-1 transcription. Interestingly, quantitation analyses on the FL-INT1 reporter showed a slight, but significant increase (+15%) in fluorescence intensity compared to the reference FL reporter in the tested cells (Mean INT1 = 1.15, STDEV INT1 = 0.22; Figure 1G ). This result supports the idea of enhancers providing additive effect to gene transcription. We conclude that dlg-1 intron 1 complements the main promoter, albeit weakly, in a subset of cells. To clarify the impact of the two HOT regions during normal development, we generated two CRISPR lines derived from a strain with dlg-1 tagged endogenously with a GFP sequence at the end of its CDS. The first line had the upstream HOT region removed (Δ-uHOT). Specifically, it spanned from bp 5,475,070 to 5,475,709 on chromosome X and removed HOT2 and HOT2 sequences. The second line had the first intron of dlg-1 (spanning from bp 5,479,783-5,480,664 on chromosome X) substituted with a short synthetic intron of fifty-one bp (synt-INT1). We chose this synthetic intron as it is commonly employed in fluorescent reporter sequences to optimize their translation in C. elegans . Live imaging analyses showed a marked reduction to 46% (STDEV = 19) of DLG-1-GFP levels in Δ-uHOT compared to wild-type (wt) at the junction of embryonic epithelial cells - seam cells ( Figure 2A,B and S4A). Furthermore, Δ-uHOT junctions presented gaps along their perimeter in these and other epithelial cells (Figure S4A,B). Single molecule fluorescent in situ hybridization (smFISH) experiments on fixed samples revealed these defects to be likely caused by a general reduction in dlg-1 mRNA levels in all embryonic cells where dlg-1 is normally expressed ( Figure 2C and S1B). Such reductions in mRNA and protein levels determined severe although not fully penetrant developmental defects. Such defects include: reduced body (two days after L4 stage: wt mean = 1.19 mm; Δ-uHOT mean = 0.79 mm - Figure S4C,D) and brood sizes (wt mean = 164; Δ-uHOT mean = 28 - Figure S4E), and embryonic lethality or larval arrest (L1 stage) (survival to adult stage wt = 99.9%; Δ-uHOT = 3.9% - Figure S4F). To note, embryos managed to finish embryogenesis but die immediately before or shortly after hatching. This phenotype differs from both full knock-out of dlg-1 where embryos survive until shortly after mid-embryogenesis (2-fold stage) ( 12 ) and its knock-down where animals develop normally, only at a slower pace ( 24 ). These results show that deletion of the upstream HOT region causes a reduction in dlg-1 mRNA and consequently DLG-1-GFP protein levels in embryonic cells where dlg-1 is normally expressed, leading to defects in junctional integrity and overall development. We conclude that the upstream HOT region is required for correct junction formation, epithelial integrity and normal animal development. Live imaging analyses on the synt-INT1 strain compared to wild-type (wt) did not reveal any differences at protein level (wt mean = 1.00, STDEV = 0.31; synt-INT1 mean = 1.03, STDEV = 0.30 - Figure 2D ) or distribution of DLG-1-GFP in embryonic seam cells ( Figure 2E ), where intron 1 is permissive of transcription ( Figure 1F and S3). Likewise, smFISH experiments did not show differences at level and distribution of dlg-1 mRNA ( Figure 2F ). In line with these findings, synt-INT1 showed no evident phenotypes at any stage of development compared to wt. These data show that the replacement of the long intron 1 of dlg-1 with a short synthetic intron does not alter mRNA or protein levels or distribution in embryonic seam cells. These results suggest that intron 1 is not required for dlg-1 expression or function in cells where it however is permissive of transcription. Download figure Open in new tab Figure 2. Deletion of the dlg-1 upstream HOT region, but not intron 1, determines reduction at the mRNA and protein levels. A,D . Fluorescent images of zoom-ins on epidermal cells of live C. elegans embryos at the comma stage. The fluorescence comes from the GFP paired to endogenous DLG-1 in wild-type (wt, upper panel) or deletion strain for the upstream HOT region (Δ-uHOT). Scale bar: 5 µm. B , E . Bar plot with error bars (standard deviation) normalized to the wt. In ( B ) comparison of wild-type (wt, gray) to the deletion strain for the upstream HOT region (Δ, pink). In ( E ) comparison of wild-type (wt, gray) to the substitution strain for the first intron with a synthetic one (synt, light-blue). Each dot represents the maximum fluorescent intensity of a junction shared between two seam cells (five junctions per embryo – posterior-most ones). ns: not significant; ***: p < 0.01. For raw data, see Table S1. C , F . Fluorescent images of zoom-ins on epidermal cells of fixes samples of C. elegans embryos at the comma stage. Upper panels, wild-type strain (wt); lower panels, deletion strain for the upstream HOT region (Δ-uHOT, C ) or substitution strain for the first intron with a synthetic one (synt-INT1, F ). Panels from left to right: smFISH signal from dlg-1 mRNA using probes complementary to exon region (magenta); smFISH signal from dlg-1 pre-mRNA using probes complementary to intron regions (cyan); antibody stain signal from GFP fused to DLG-1 (yellow); and merges. Scale bar: 5 µm. In summary, we described the roles of two key regulatory HOT regions in the dlg-1 locus in modulating gene expression and development in the C. elegans embryo: a conserved portion of an upstream HOT region located over four Kb upstream of the CDS (HOT3), and another HOT region included in first long intron. HOT regions in C. elegans have been predominantly associated with promoters and were often considered non-functional or simply reflective of accessible chromatin. Our data provide clear functional evidence that the upstream HOT region can instead act as main driver of transcription and key for normal development. Specifically, we found that a 330 bp fragment within HOT3 is sufficient to drive strong and spatially patterned expression in embryonic cells, closely resembling the endogenous dlg-1 expression profile. Deletion of the key regulatory sequence in the upstream HOT region determines a partial loss-of-function phenotype, mainly causing late embryonic lethality and L1 arrest. Nevertheless, such phenotypes are probably not the sole result of reduction in dlg-1 mRNA, and consequently DLG-1 protein levels, as they are more severe than in other known mutants in which levels are affected, but the CDS of dlg-1 is not ( 24 ). The upstream HOT region interacts with other genomic regions ( 1 ) and its depletion might affect gene expression of other genes beyond dlg-1 itself. We also showed that the first intron acts additively with the upstream region to boost gene expression exclusively in developing epidermal cells in the context of transcriptional reporters. Despite that, exchanging the intron 1 with a synthetic one in the endogenous locus has not effect at the protein level, suggesting additional (co- or post-transcriptional) regulations to be in place to coordinate the translational output. The presence of shared TF binding both HOT/enhancer regions, HOT3 and the first intron of dlg-1 , suggests that regulatory elements far upstream the CDS and intronic regions can function cooperatively. This discovery challenges previous reports that HOT regions are functionally isolated modules, and instead suggest a possible cooperative transcriptional regulation logic. Conclusions Together, our findings illustrate how non-canonical regulatory elements (distal and intronic HOT regions) are integrated to fine-tune gene expression in a cell-type-specific manner during development. These results help to clarify the functional potential of HOT regions in C. elegans and expand our understanding of how promoter and enhancers contribute to precise spatiotemporal control of gene expression in compact genomes like the one of C. elegans . Methods Nematode culture C. elegans strains were maintained as previously described ( 25 ) at 20°C. Embryos were imaged at the comma stage. For a detailed list of transgenic lines used in this study, see Table S1. Generation of transgenic lines Transgenes carrying the different promoters analyzed in this study (amplified from N2 lysate) were fused to an H2B sequence (amplified from N2 lysate) paired to an mNG sequence through a flexible linker (amplified from LP598 lysate), and a tbb-2 3’UTR (amplified from N2 lysate). These sequences were assembled (NEBuilder® HiFi DNA Assembly Cloning Kit, New England BioLabs, cat#E5520) in the pCFJ150 vector and inserted into the ttTi5605 locus on chromosome II of the mosSCI strain EG6699 ( 26 ). NEB® 10-beta Competent E. coli (High Efficiency) (NEB, cat#C3019) competent cells were used for transformation. Full plasmid sequencing from Microsynth was used to confirm the sequences were correct. Plasmids were purified with MIDI preps (NucleoBond Xtra Midi Plus (Macherey - Nagel, cat#740412.10) and single-copy integrated lines were generated following the mosSCI protocol ( 26 ). For a detailed list of plasmids used in this study, see Table S1. Upstream HOT site deletion and synthetic intron 1 replacement lines were obtained using the CRISPR/Cas9 technique, following a previously described protocol ( 27 ). For a complete list of reagents (crRNA, repair oligos, and genotyping/sequencing primers), see Table S1. smFISH smFISH experiments were performed as previously described ( 7 , 24 , 28 ). For a full list of smFISH probes, see Table S1. A widefield microscope FEI “MORE” with total internal reflection fluorescence (TIRF), equipped with a Hamamatsu ORCA flash 4.0 cooled sCMOS camera, and a Live Acquisition 2.5 software were used for capturing smFISH images. Images were deconvolved with the Huygens software and processed in OMERO ( https://www.openmicroscopy.org/omero/ ). All figures were assembled in Adobe Illustrator ( https://www.adobe.com/ ). Live imaging: microscopy, quantitation, and analysis Live imaging was performed on embryos at the comma stage. Embryos were washed from plates with 1 ml of water, collected into Eppendorf tubes, and spun-down (“short”) for 5 seconds in a table centrifuge. After removing the supernatant, embryos were resuspended in M9 buffer and transferred onto poly-L-lysine-coated slides (Thermo Scientific, cat#ER-308B-CE24). A coverslip was placed on the sample and embryos were imaged immediately. A widefield ZEISS Axio Imager M2 equipped with a ZEISS Colibri LED light source, a Hamamatsu ORCA flash 4.0 camera, and ZEN 2.6 software (blue edition) was used for capturing images for live imaging of C. elegans embryos. Fluorescence signal quantitation of nuclear (from H2B-mNG) and junctional (from DLG-1-GFP) signals in the different transgenic lines was performed using Fiji, where the maximum intensity was quantified. Statistical analyses were performed using R software (R Core Team, 2021; https://www.R-project.org/ ). The ggplot2 package (Wickham, 2016; https://ggplot2.tidyverse.org ) was used to generate bar plots with error bars (standard deviation) and dot plots with box plots. Each dot represents the normalized value to the corresponding seam cell nucleus or junction. Statistical differences were determined using a t -test. The clustered column chart was created with Microsoft Excel. Declarations Ethics approval and consent to participate Not applicable. Consent for publication Not applicable. Availability of data and materials All data are available in the described sources in the Methods. Competing interests The authors declare that they have no competing interests. Funding The study has been partially funded by the Forschungsfonds (Excellent Junior Researcher) from the University of Basel (U.570.1040) from CT and the Swiss National Science Foundation (310030_197713) from SEM. Authors’ contribution Conception of the work (CT and SEM); design of the work (CT); acquisition and analysis (CT, FE and PB); interpretation of data (CT); drafted the work (CT); revised the work (SEM). All authors have read and approved the current version of this manuscript and have agreed to its submission for publication. Acknowledgments We thank current and previous lab members of the Mango group for scientific discussions, the Imaging Core Facility (IMCF) of the Biozentrum for technical support, and WormBase. A particular thank to Dr. Camila Pulido for reading and giving comments to the manuscript. Some strains were provided by the CGC, which is funded by the NIH Office of Research Infrastructure Programs (P40 OD010440). Funder Information Declared University of Basel, https://ror.org/02s6k3f65 , U.570.1040 Swiss National Science Foundation, https://ror.org/00yjd3n13 , SNF 310030_197713 , 320030-227954 Footnotes Modified introduction with added references. Fig. 1 and 2 merged. Additional figure 2 and supplemental. Additional author added. https://zenodo.org/records/16762430 References 1. ↵ Huang N , Seow WQ , Appert A , Dong Y , Stempor P , Ahringer J. Accessible Region Conformation Capture (ARC-C) gives high-resolution insights into genome architecture and regulation . Genome Res . 2022 Feb ; 32 ( 2 ): 357 – 66 . OpenUrl Abstract / FREE Full Text 2. ↵ Chen RAJ , Stempor P , Down TA , Zeiser E , Feuer SK , Ahringer J. Extreme HOT regions are CpG-dense promoters in C. elegans and humans . Genome Res . 2014 Jul ; 24 ( 7 ): 1138 – 46 . OpenUrl Abstract / FREE Full Text 3. ↵ Gerstein MB , Lu ZJ , Van Nostrand EL , Cheng C , Arshinoff BI , Liu T , et al. Integrative Analysis of the Caenorhabditis elegans Genome by the modENCODE Project . Science . 2010 Dec 24 ; 330 ( 6012 ): 1775 – 87 . OpenUrl Abstract / FREE Full Text 4. ↵ Van Nostrand EL , Kim SK . Integrative analysis of C. elegans modENCODE ChIP-seq data sets to infer gene regulatory interactions . Genome Res . 2013 Jun ; 23 ( 6 ): 941 – 53 . OpenUrl Abstract / FREE Full Text 5. ↵ Jänes J , Dong Y , Schoof M , Serizay J , Appert A , Cerrato C , et al. Chromatin accessibility dynamics across C. elegans development and ageing . eLife . 2018 Oct 26 ; 7 : e37344 . OpenUrl CrossRef PubMed 6. ↵ Bossinger O , Klebes A , Segbert C , Theres C , Knust E. Zonula Adherens Formation in Caenorhabditis elegans Requires dlg-1, the Homologue of the Drosophila Gene discs large . Developmental Biology . 2001 Feb ; 230 ( 1 ): 29 – 42 . OpenUrl CrossRef PubMed Web of Science 7. ↵ Tocchini C , Rohner M , Guerard L , Ray P , Von Stetina SE , Mango SE . Translation-dependent mRNA localization to Caenorhabditis elegans adherens junctions . Development . 2021 Dec 15 ; 148 ( 24 ): dev200027 . OpenUrl CrossRef PubMed 8. ↵ Serizay J , Dong Y , Jänes J , Chesney M , Cerrato C , Ahringer J. Distinctive regulatory architectures of germline-active and somatic genes in C. elegans . Genome Res . 2020 Dec ; 30 ( 12 ): 1752 – 65 . OpenUrl Abstract / FREE Full Text 9. ↵ Hsu HW , Liao CP , Chiang YC , Syu RT , Pan CL . C. elegans flamingo FMI-1 controls dendrite self-avoidance through F-actin assembly . Development . 2020 Jan 1 ; dev.179168 . 10. ↵ Kruesi WS , Core LJ , Waters CT , Lis JT , Meyer BJ . Condensin controls recruitment of RNA polymerase II to achieve nematode X-chromosome dosage compensation . eLife [Internet] . 2013 Jun 18 [cited 2025 Jul 25]; 2 . Available from: https://elifesciences.org/articles/00808 11. ↵ Blumenthal T. WormBook . Trans-splicing and operons in C elegans . : 1 – 11 . 12. ↵ McMahon L , Legouis R , Vonesch JL , Labouesse M. Assembly of C. elegans apical junctions involves positioning and compaction by LET-413 and protein aggregation by the MAGUK protein DLG-1 . Journal of Cell Science . 2001 Jun 15 ; 114 ( 12 ): 2265 – 77 . OpenUrl Abstract / FREE Full Text 13. ↵ Fuxman Bass JI , Tamburino AM , Mori A , Beittel N , Weirauch MT , Reece-Hoyes JS , et al. Transcription factor binding to Caenorhabditis elegans first introns reveals lack of redundancy with gene promoters . Nucleic Acids Research . 2014 Jan 1 ; 42 ( 1 ): 153 – 62 . OpenUrl CrossRef PubMed 14. Ronald H. A. Plasterk Gaudet J , Muttumu S , Horner M , Mango SE . Whole-Genome Analysis of Temporal Gene Expression during Foregut Development . Ronald H. A. Plasterk , editor. PLoS Biol . 2004 Oct 19 ; 2 ( 11 ): e352 . OpenUrl CrossRef PubMed 15. ↵ Copenhaver GP Zhong M , Niu W , Lu ZJ , Sarov M , Murray JI , Janette J , et al. Genome-Wide Identification of Binding Sites Defines Distinct Functions for Caenorhabditis elegans PHA-4/FOXA in Development and Environmental Response . Copenhaver GP , editor. PLoS Genet . 2010 Feb 19 ; 6 ( 2 ): e1000848 . OpenUrl CrossRef PubMed 16. ↵ Spicuglia S , Vanhille L. Chromatin signatures of active enhancers . Nucleus . 2012 Mar ; 3 ( 2 ): 126 – 31 . OpenUrl CrossRef PubMed Web of Science 17. ↵ Isiaka BN , Semple JI , Haemmerli A , Thapliyal S , Stojanovski K , Das M , et al. Cohesin forms fountains at active enhancers in C. elegans [Internet] . Genomics ; 2023 [cited 2025 Jun 12]. Available from: http://biorxiv.org/lookup/doi/10.1101/2023.07.14.549011 18. ↵ Kim J , Wang H , Ercan S. Cohesin organizes 3D DNA contacts surrounding active enhancers in C. elegans [Internet] . Genomics ; 2023 [cited 2025 Jun 12]. Available from: http://biorxiv.org/lookup/doi/10.1101/2023.09.18.558239 19. ↵ Sheffield M , Loveless T , Hardin J , Pettitt J. C. elegans Enabled Exhibits Novel Interactions with N-WASP, Abl, and Cell-Cell Junctions . Current Biology . 2007 Oct ; 17 ( 20 ): 1791 – 6 . OpenUrl CrossRef PubMed Web of Science 20. ↵ Fire A , Harrison SW , Dixon D. A modular set of lacZ fusion vectors for studying gene expression in Caenorhabditis elegans . Gene . 1990 Jan ; 93 ( 2 ): 189 – 98 . OpenUrl CrossRef PubMed Web of Science 21. ↵ Christoffels A Bradnam KR , Korf I. Longer First Introns Are a General Property of Eukaryotic Gene Structure . Christoffels A , editor. PLoS ONE . 2008 Aug 29 ; 3 ( 8 ): e3093 . OpenUrl CrossRef PubMed 22. Hardin JD Brabin C , Appleford PJ , Woollard A. The Caenorhabditis elegans GATA Factor ELT-1 Works through the Cell Proliferation Regulator BRO-1 and the Fusogen EFF-1 to Maintain the Seam Stem-Like Fate . Hardin JD , editor. PLoS Genet . 2011 Aug 4 ; 7 ( 8 ): e1002200 . OpenUrl CrossRef PubMed 23. ↵ Jorgensen EM , Mango SE . The art and design of genetic screens: Caenorhabditis elegans . Nat Rev Genet . 2002 May 1 ; 3 ( 5 ): 356 – 69 . OpenUrl CrossRef PubMed Web of Science 24. ↵ Ketting RF Tocchini C , Mango SE . An adapted MS2-MCP system to visualize endogenous cytoplasmic mRNA with live imaging in Caenorhabditis elegans . Ketting RF , editor. PLoS Biol . 2024 Mar 1 ; 22 ( 3 ): e3002526 . OpenUrl CrossRef PubMed 25. ↵ Brenner S. The genetics of Caenorhabditis elegans . Genetics . 1974 May ; 77 ( 1 ): 71 – 94 . OpenUrl Abstract / FREE Full Text 26. ↵ Frøkjær-Jensen C , Wayne Davis M , Hopkins CE , Newman BJ , Thummel JM , Olesen SP , et al. Single-copy insertion of transgenes in Caenorhabditis elegans . Nat Genet . 2008 Nov ; 40 ( 11 ): 1375 – 83 . OpenUrl CrossRef PubMed Web of Science 27. ↵ Ghanta KS , Ishidate T , Mello CC . Microinjection for precision genome editing in Caenorhabditis elegans . STAR Protocols . 2021 Sep ; 2 ( 3 ): 100748 . OpenUrl PubMed 28. ↵ Tsanov N , Samacoits A , Chouaib R , Traboulsi AM , Gostan T , Weber C , et al. smiFISH and FISH-quant – a flexible single RNA detection approach with super-resolution capability . Nucleic Acids Res . 2016 Dec 15 ; 44 ( 22 ): e165 – e165 . OpenUrl CrossRef PubMed View the discussion thread. Back to top Previous Next Posted August 14, 2025. Download PDF Supplementary Material Data/Code Email Thank you for your interest in spreading the word about bioRxiv. NOTE: Your email address is requested solely to identify you as the sender of this article. Your Email * Your Name * Send To * Enter multiple addresses on separate lines or separate them with commas. You are going to email the following Differential functions of upstream and intronic HOT regions shape dlg-1 transcription and C. elegans development Message Subject (Your Name) has forwarded a page to you from bioRxiv Message Body (Your Name) thought you would like to see this page from the bioRxiv website. Your Personal Message CAPTCHA This question is for testing whether or not you are a human visitor and to prevent automated spam submissions. Share Differential functions of upstream and intronic HOT regions shape dlg-1 transcription and C. elegans development Cristina Tocchini , Fanny Eggeler , Palmer Bassett , Susan E. Mango bioRxiv 2025.06.13.659077; doi: https://doi.org/10.1101/2025.06.13.659077 Share This Article: Copy Citation Tools Differential functions of upstream and intronic HOT regions shape dlg-1 transcription and C. elegans development Cristina Tocchini , Fanny Eggeler , Palmer Bassett , Susan E. Mango bioRxiv 2025.06.13.659077; doi: https://doi.org/10.1101/2025.06.13.659077 Citation Manager Formats BibTeX Bookends EasyBib EndNote (tagged) EndNote 8 (xml) Medlars Mendeley Papers RefWorks Tagged Ref Manager RIS Zotero Tweet Widget Facebook Like Google Plus One Subject Area Genetics Subject Areas All Articles Animal Behavior and Cognition (7635) Biochemistry (17691) Bioengineering (13892) Bioinformatics (41937) Biophysics (21452) Cancer Biology (18588) Cell Biology (25504) Clinical Trials (138) Developmental Biology (13378) Ecology (19899) Epidemiology (2067) Evolutionary Biology (24320) Genetics (15609) Genomics (22506) Immunology (17736) Microbiology (40394) Molecular Biology (17181) Neuroscience (88605) Paleontology (666) Pathology (2832) Pharmacology and Toxicology (4824) Physiology (7641) Plant Biology (15156) Scientific Communication and Education (2045) Synthetic Biology (4294) Systems Biology (9825) Zoology (2271)

Text is read by the "Ask this paper" AI Q&A widget below. Extraction quality varies by source — PMC NXML preserves structure cleanly, OA-HTML may include some navigation residue, and OA-PDF can have broken hyphenation. The publisher copy (via DOI) is the canonical version.

My notes (saved in your browser only)

Ask this paper AI returns verbatim quotes from the full text · source: preprint-html

Answers must be backed by verbatim quotes from this paper's full text. Hallucinated quotes are dropped automatically; if no verbatim passage answers the question, we say so. How this works

Citation neighborhood (no data yet)

We don't have any in-corpus citations linked to this paper yet. This is a recent paper (2025) — citers typically take a year or two to land, and the OpenAlex reference graph may still be filling in.

Source provenance

europepmc
last seen: 2026-05-20T01:45:00.602351+00:00
unpaywall
last seen: 2026-06-27T06:33:11.484959+00:00