Repression ofCADM1transcription by HPV type 18 is mediated by three-dimensional rearrangement of promoter-enhancer interactions

preprint OA: closed
📄 Open PDF Full text JSON View at publisher
Full text 94,949 characters · extracted from preprint-html · click to expand
Repression of CADM1 transcription by HPV type 18 is mediated by three-dimensional rearrangement of promoter-enhancer interactions | bioRxiv /* */ /* */ <!-- <!-- /*! * yepnope1.5.4 * (c) WTFPL, GPLv2 */ (function(a,b,c){function d(a){return"[object Function]"==o.call(a)}function e(a){return"string"==typeof a}function f(){}function g(a){return!a||"loaded"==a||"complete"==a||"uninitialized"==a}function h(){var a=p.shift();q=1,a?a.t?m(function(){("c"==a.t?B.injectCss:B.injectJs)(a.s,0,a.a,a.x,a.e,1)},0):(a(),h()):q=0}function i(a,c,d,e,f,i,j){function k(b){if(!o&&g(l.readyState)&&(u.r=o=1,!q&&h(),l.onload=l.onreadystatechange=null,b)){"img"!=a&&m(function(){t.removeChild(l)},50);for(var d in y[c])y[c].hasOwnProperty(d)&&y[c][d].onload()}}var j=j||B.errorTimeout,l=b.createElement(a),o=0,r=0,u={t:d,s:c,e:f,a:i,x:j};1===y[c]&&(r=1,y[c]=[]),"object"==a?l.data=c:(l.src=c,l.type=a),l.width=l.height="0",l.onerror=l.onload=l.onreadystatechange=function(){k.call(this,r)},p.splice(e,0,u),"img"!=a&&(r||2===y[c]?(t.insertBefore(l,s?null:n),m(k,j)):y[c].push(l))}function j(a,b,c,d,f){return q=0,b=b||"j",e(a)?i("c"==b?v:u,a,b,this.i++,c,d,f):(p.splice(this.i++,0,a),1==p.length&&h()),this}function k(){var a=B;return a.loader={load:j,i:0},a}var l=b.documentElement,m=a.setTimeout,n=b.getElementsByTagName("script")[0],o={}.toString,p=[],q=0,r="MozAppearance"in l.style,s=r&&!!b.createRange().compareNode,t=s?l:n.parentNode,l=a.opera&&"[object Opera]"==o.call(a.opera),l=!!b.attachEvent&&!l,u=r?"object":l?"script":"img",v=l?"script":u,w=Array.isArray||function(a){return"[object Array]"==o.call(a)},x=[],y={},z={timeout:function(a,b){return b.length&&(a.timeout=b[0]),a}},A,B;B=function(a){function b(a){var a=a.split("!"),b=x.length,c=a.pop(),d=a.length,c={url:c,origUrl:c,prefixes:a},e,f,g;for(f=0;f<d;f++)g=a[f].split("="),(e=z[g.shift()])&&(c=e(c,g));for(f=0;f<b;f++)c=x[f](c);return c}function g(a,e,f,g,h){var i=b(a),j=i.autoCallback;i.url.split(".").pop().split("?").shift(),i.bypass||(e&&(e=d(e)?e:e[a]||e[g]||e[a.split("/").pop().split("?")[0]]),i.instead?i.instead(a,e,f,g,h):(y[i.url]?i.noexec=!0:y[i.url]=1,f.load(i.url,i.forceCSS||!i.forceJS&&"css"==i.url.split(".").pop().split("?").shift()?"c":c,i.noexec,i.attrs,i.timeout),(d(e)||d(j))&&f.load(function(){k(),e&&e(i.origUrl,h,g),j&&j(i.origUrl,h,g),y[i.url]=2})))}function h(a,b){function c(a,c){if(a){if(e(a))c||(j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}),g(a,j,b,0,h);else if(Object(a)===a)for(n in m=function(){var b=0,c;for(c in a)a.hasOwnProperty(c)&&b++;return b}(),a)a.hasOwnProperty(n)&&(!c&&!--m&&(d(j)?j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}:j[n]=function(a){return function(){var b=[].slice.call(arguments);a&&a.apply(this,b),l()}}(k[n])),g(a[n],j,b,n,h))}else!c&&l()}var h=!!a.test,i=a.load||a.both,j=a.callback||f,k=j,l=a.complete||f,m,n;c(h?a.yep:a.nope,!!i),i&&c(i)}var i,j,l=this.yepnope.loader;if(e(a))g(a,0,l,0);else if(w(a))for(i=0;i (function(w,d,s,l,i){w[l]=w[l]||[];w[l].push({'gtm.start':new Date().getTime(),event:'gtm.js'});var f=d.getElementsByTagName(s)[0];var j=d.createElement(s);var dl=l!='dataLayer'?'&l='+l:'';j.src='//www.googletagmanager.com/gtm.js?id='+i+dl;j.type='text/javascript';j.async=true;f.parentNode.insertBefore(j,f);})(window,document,'script','dataLayer','GTM-M677548'); Skip to main content Home About Submit ALERTS / RSS Search for this keyword Advanced Search New Results Repression of CADM1 transcription by HPV type 18 is mediated by three-dimensional rearrangement of promoter-enhancer interactions Karen Campos-León , Jack Ferguson , Thomas Günther , C. David Wood , Steven W. Wingett , Selin Pekel , Christy S Varghese , Csilla Varnai , Michelle West , View ORCID Profile Andrew Beggs , Adam Grundhoff , Boris Noyvert , Sally Roberts , View ORCID Profile Joanna L Parish doi: https://doi.org/10.1101/2024.08.16.608206 Karen Campos-León 1 Department of Cancer and Genomic Sciences, College of Medicine and Health, University of Birmingham , Birmingham, B15 2TT Find this author on Google Scholar Find this author on PubMed Search for this author on this site Jack Ferguson 1 Department of Cancer and Genomic Sciences, College of Medicine and Health, University of Birmingham , Birmingham, B15 2TT Find this author on Google Scholar Find this author on PubMed Search for this author on this site Thomas Günther 2 Leibniz Institute of Virology , Hamburg, Germany Find this author on Google Scholar Find this author on PubMed Search for this author on this site C. David Wood 3 School of Life Sciences, University of Sussex , Brighton, BN1 9QG Find this author on Google Scholar Find this author on PubMed Search for this author on this site Steven W. Wingett 4 The Babraham Institute, Babraham Research Campus , Cambridge CB22 3AT Find this author on Google Scholar Find this author on PubMed Search for this author on this site Selin Pekel 1 Department of Cancer and Genomic Sciences, College of Medicine and Health, University of Birmingham , Birmingham, B15 2TT Find this author on Google Scholar Find this author on PubMed Search for this author on this site Christy S Varghese 1 Department of Cancer and Genomic Sciences, College of Medicine and Health, University of Birmingham , Birmingham, B15 2TT Find this author on Google Scholar Find this author on PubMed Search for this author on this site Csilla Varnai 1 Department of Cancer and Genomic Sciences, College of Medicine and Health, University of Birmingham , Birmingham, B15 2TT Find this author on Google Scholar Find this author on PubMed Search for this author on this site Michelle West 3 School of Life Sciences, University of Sussex , Brighton, BN1 9QG Find this author on Google Scholar Find this author on PubMed Search for this author on this site Andrew Beggs 1 Department of Cancer and Genomic Sciences, College of Medicine and Health, University of Birmingham , Birmingham, B15 2TT Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Andrew Beggs Adam Grundhoff 2 Leibniz Institute of Virology , Hamburg, Germany Find this author on Google Scholar Find this author on PubMed Search for this author on this site Boris Noyvert 1 Department of Cancer and Genomic Sciences, College of Medicine and Health, University of Birmingham , Birmingham, B15 2TT 5 Birmingham CRUK Centre, University of Birmingham Find this author on Google Scholar Find this author on PubMed Search for this author on this site Sally Roberts 1 Department of Cancer and Genomic Sciences, College of Medicine and Health, University of Birmingham , Birmingham, B15 2TT Find this author on Google Scholar Find this author on PubMed Search for this author on this site Joanna L Parish 1 Department of Cancer and Genomic Sciences, College of Medicine and Health, University of Birmingham , Birmingham, B15 2TT 6 National Institute of Health Research, Biomedical Research Centre, University of Birmingham Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Joanna L Parish For correspondence: j.l.parish{at}bham.ac.uk Abstract Full Text Info/History Metrics Preview PDF ABSTRACT Upon infection, human papillomavirus (HPV) manipulates host cell gene expression to create an environment that is supportive of a productive and persistent infection. The virus-induced changes to the host cell’s transcriptome are thought to contribute to carcinogenesis. Here, we show by RNA-sequencing that oncogenic HPV18 episome replication in primary human foreskin keratinocytes (HFKs) drives host transcriptional changes that are consistent between multiple HFK donors. We have previously shown that HPV18 episome replication in HFKs results in post-transcriptional stabilisation of the host chromatin insulation protein CTCF. Since CTCF is an important regulator of host cell transcription via coordination of epigenetic boundaries and long-range chromosomal interactions, we hypothesised that HPV18-induced stabilisation of CTCF may contribute to host transcription reprogramming. Analysis of CTCF binding in the host cell genome by ChIP-Seq revealed that while the total number of CTCF binding sites is not altered by the virus, there are a sub-set of CTCF binding sites that are either enriched or depleted of CTCF. Many of these altered sites are clustered within regulatory elements of differentially expressed genes, including the tumour suppressor gene cell adhesion molecule 1 ( CADM1 ), which supresses epithelial cell growth and invasion. We show that HPV18 establishment results in reduced CTCF binding at the CADM1 promoter and upstream enhancer. Loss of CTCF binding is coincident with epigenetic repression of CADM1, in the absence of CpG hypermethylation, while adjacent genes including the transcriptional regulator ZBTB16 are activated. These data indicate that the CADM1 locus is subject to topological rearrangement following HPV18 establishment. We tested this hypothesis using 4C-Seq (circular chromosome confirmation capture-sequencing) and show that HPV18 establishment causes a loss of long-range chromosomal interactions between the CADM1 transcriptional start site and the upstream transcriptional enhancer. These data show that HPV18 manipulates host cell promoter-enhancer interactions to drive transcriptional reprogramming that may contribute to HPV-induced disease progression. AUTHOR SUMMARY Infection with oncogenic HPV is the cause of numerous cancer types, which generally arise after persistent HPV infection. Upon infection, HPV alters the gene expression profile of infected cells to facilitate virus replication and persistence. Multiple mechanisms of HPV-induced host cell reprogramming have been previously suggested. Here, we show that HPV infection induces rearrangement of specific genomic loci by altering the chromatin binding of the host cell protein CTCF, an important regulator of chromatin architecture. Loss of CTCF binding to a cluster of binding sites at the CADM1 locus on chromosome 11 is coincident with epigenetic reprogramming and disruption of long-range chromatin interactions, resulting in transcriptional repression of CADM1 . Our data show that repression of CADM1 is an early event in HPV-driven disease, preceding hypermethylation of the CADM1 transcriptional promoter that is frequently observed in HPV-driven cancers, demonstrating a novel mechanism of HPV-induced host cell transcriptional reprogramming. INTRODUCTION Oncogenic human papillomavirus (HPV) infection is the cause of most cervical cancers and a significant proportion of other anogenital and oropharyngeal cancers [ 1 ]. HPVs exclusively infect the undifferentiated basal keratinocytes of squamous epithelia and gain access to these cells via micro-abrasions [ 2 ]. Most infections are resolved by host immune activation but in some cases, the virus avoids immune detection and establishes a persistent infection, a strong risk factor for cancer development. Virus-mediated transcriptional manipulation of the host is an important facet in the maintenance of persistent oncogenic HPV infection. This family of viruses have evolved intricate mechanisms to induce transcriptional changes in the host to evade immune detection and support persistent infection. Several studies have identified gene sets that are transcriptionally deregulated following oncogenic HPV establishment in primary keratinocytes including down-regulation of immune defence-related genes and altered expression of genes important for epithelial cell structure and differentiation [ 3 – 6 ]. However, the mechanisms that drive HPV-induced host transcriptional reprogramming and how these changes contribute to cancer development remain unclear. HPV oncogenes E6 and E7 modulate the activity of numerous histone modifying and chromatin-remodelling enzymes leading to epigenetic regulation of viral and host chromatin (reviewed by [ 7 ]). Epigenetic modulation of host chromatin is associated with both HPV infection and HPV-driven carcinogenesis and multiple mechanisms have been proposed. HPV E6 and E7 can modulate the activity of both histone acetyltransferases (HATs) and histone deacetylases (HDACs) resulting in host transcriptional reprogramming [ 8 , 9 ]. In addition, HPV E7 drives a global decrease in H3K27Me3 abundance via induction of KDM6A and KDM6B lysine 27-specific demethylases resulting in host cell transcriptional reprogramming via homeobox gene activation [ 10 , 11 ]. HPV replication in primary keratinocytes also induces hypermethylation of CpG dinucleotides in the host genome, directly impacting gene expression [ 12 , 13 ]. This is at least in part through up-regulation of DNA methyltransferase 1 (DNMT1) via the action of the viral oncoproteins E6 and E7 [ 14 , 15 ]. Longitudinal models of HPV-driven primary cell immortalisation have demonstrated that initial promoter hypermethylation is targeted rather than randomly distributed sites in the host genome [ 12 ] and that sequential increases in hypermethylation of specific promoters correlates with disease progression [ 12 , 13 ]. While oncogenic HPV drives a distinct pattern of host transcriptional reprogramming through targeted epigenetic modulation of gene loci [ 16 , 17 ], how these changes are directed is not known. In addition, whether the histone-mediated epigenetic alteration of host transcription observed in models of HPV infection promotes CpG methylation at CpG islands (CGIs) commonly hypermethylated in HPV-driven cancers remains unanswered. We have previously demonstrated that HPV18 targets the ubiquitously expressed host protein CCCTC-binding factor (CTCF) to attenuate viral gene expression via the establishment of a CTCF-Yin Yang 1 (YY1)-dependent epigenetically repressed chromatin loop between the viral enhancer and the E2 encoding early gene region [ 18 , 19 ]. CTCF is a zinc finger DNA binding protein that binds to tens of thousands of genomic sites to regulate epigenetic boundaries, nucleosome positioning, and long-range chromatin interactions termed topologically associated domains (TADs). CTCF is frequently mutated in numerous cancer types [ 20 ] and isolated somatic mutations in CTCF binding sites have been identified in tumours [ 21 , 22 ]. Disruption of CTCF binding has been shown to have profound effects on gene expression within specific gene loci associated with oncogenic transformation [ 23 , 24 ]. While CTCF is an important regulator of HPV gene expression, it is unknown whether HPV infection alters the cellular function of this key transcriptional regulator. Here, using a physiological model of HPV18 episome replication and maintenance in primary human foreskin keratinocytes [ 19 , 25 , 26 ] we show that HPV establishment alters the binding footprint of CTCF at discrete cellular loci. Disruption of CTCF binding clusters within specific cellular loci including the CADM1 (cell adhesion molecule 1; a major regulator of cell adhesion, also known as tumour suppressor in lung cancer 1; TSLC1) locus correlates with epigenetic rearrangement and differential gene expression within these loci. We show that loss of CTCF binding at the CADM1 transcription start site (TSS) and upstream enhancer elements results in topological rearrangement of promoter-enhancer interaction and provides a mechanism for CADM1 transcriptional repression following HPV establishment. In cervical carcinogenesis, CADM1 silencing by promoter hypermethylation is a frequent event in the progression from high grade cervical dysplasia to cancer. Our data show that repression of CADM1 expression occurs early in the replication cycle of HPV18, not by promoter hypermethylation but via alteration of CTCF-dependent promoter-enhancer interaction and localised epigenetic rearrangement. Repression of CADM1 as a major regulator of cell adhesion may be a key event in virus replication and in HPV-induced carcinogenesis mediated by different virus-induced mechanisms. RESULTS Establishment of HPV18 in primary keratinocytes induces alteration of the host cell transcriptome Global gene expression changes induced by HPV18 transfection and establishment in primary HFKs were measured by RNA-sequencing (RNA-Seq) of polyA+ selected mRNA. HFK cultures harvested from six individual donors were transfected with recircularised HPV18 genomes to establish persistent episomal replication. HFK donor cells and matched HPV18 episome-containing lines (HFK-HPV18) were cultured in monolayer on γ-irradiated J2 fibroblasts in serum containing media and the cellular transcriptome was analysed in cells below passage 5 (representing ∼ 20-25 population doublings) to ensure episomal replication of HPV18 genomes, as confirmed by Southern blot analysis of each donor ( Figure. S1A and [ 27 , 28 ]). Although we were able to identify virus-host fusion transcripts in all six donor lines analysed, these were detected at very low abundance (< 0.3 % of total fragments mapped to the HPV18 genome; Table.S1 ), further confirming minimal transcriptionally active viral integrants. In addition, alignment of HPV18 derived transcripts confirmed expression of early transcripts that are predominantly spliced at E6*I and E1^E4 major splice sites and terminate at the early polyA+ signal downstream of E5, typical of episomal HPV transcription ( Fig. S1B ). Download figure Open in new tab Supplemental Figure S1: HPV18 DNA is maintained as extrachromosomal episomes in HFK-HPV18 cultures. (A) Southern blot analysis of DNA extracted from HFK-HPV18 donors 3, 4, 5 and 6. Samples digested with Hindlll show open circle (OC) and supercoiled (SC) forms, whereas digestion with EcoRI linearises the HPV18 episomes as linear (L) forms. Southern blot analysis of donors 1 and 2 was previously described [47, 48]. (B) Alignment of HPV18 transcripts identified by RNA-Seq to the linearized HPV18 genome (annotated below) for HFK-HPV18 donors 1-6. Image created using Integrated Genome Viewer. Download figure Open in new tab Supplemental Figure S2: Differential gene expression analysis following HPV18 replication establishment. Volcano plot of gene expression profiles obtained from differential gene expression analysis of donor matched HFK in comparison to HFK-HPV18 (donors 1-6). Thresholds of Log2FC = 1 and adjusted p-value = 0.05 are indicated by the dotted lines. Significantly altered genes are indicated by red dots. Download figure Open in new tab Supplemental Figure S3: HPV18 genome replication results in significantly reduced CADM1 gene expression. Alignment of RNA-Seq data to the CADM1 open reading frame (exons indicated below the image) in HFK donors 1-6 before and after HPV18 genome replication establishment. Paired tracks for each donor are group scaled as indicated on the right. Dotted line indicates truncation of the tracks within the large intron between exon 1-2. Image created using Integrated Genome Viewer. Principal component analysis (PCA) of regularized log (rlog) transformed RNA-Seq data revealed distinct clustering of HFK and HFK-HPV18 samples with a clear difference in PCA1 following HPV18 episome establishment in all six HFK donors ( Fig. 1A ; p = 0.039), and PC2 showing the differences between the replicates. Differential gene expression (DGE) analysis revealed 976 host genes with 2 or more fold change in gene expression and adjusted p < 0.05 following HPV18 establishment in all six donors. Of these genes, 628 were upregulated ( Fig. S2 and Table.S2 ) and 348 were downregulated ( Fig. S2 and Table.S3 ). Unsupervised hierarchical clustering of the top 50 most up regulated and down regulated genes revealed a remarkably consistent alteration of host cell gene expression in all six HFK donors, suggesting that genes are specifically targeted by HPV18 regardless of host cell genetic background ( Fig. 1B ). Download figure Open in new tab Fig. 1: HPV18 establishment in primary HFKs induces a distinctive pattern of host differential gene expression. (A) Two main principal components of rlog transformed RNA-Seq data from six primary HFK cultures (circles) and isogenic HPV18-genome containing lines (triangles). The six individual donors are shown in different colours. Separation of the 2 groups of samples is shown by the ellipses denoting 95% confidence intervals for each group. Statistical significance of separation was calculated using a permutation test (ClusterSignificance package); p = 0.039. (B) Heatmap of unsupervised hierarchical clustering of the top 50 most significantly upregulated and 50 most significantly down regulated genes between HFK (aqua) and HPV18 (orange) samples. Relative low gene expression is shown in blue and high gene expression shown in red as detailed in the legend. (C) Gene set enrichment analysis of differential expression of genes following HPV18 establishment using the Molecular Signature Hallmarks database. Directional response in expression of gene sets is indicated and significance of gene set terms (corrected for multiple testing) is given on the x-axis, showing only the terms significant at FDR = 0.01. To determine the biological pathways that are transcriptionally altered following HPV18 establishment, we performed gene set enrichment analysis (GSEA) using the Molecular Signatures Database (MSigDB) and Hallmark gene set ( http://www.gsea-msigdb.org/ ). A total of 16 pathways were significantly enriched (FDR < 0.01) including up-regulation of E2F targets and G2M checkpoint and down-regulation of immune response pathways (interferon alpha and gamma responses) and the unfolded protein response. Other notable pathways were both up- and down-regulated including epithelial to mesenchymal transition (EMT), mitotic spindle, apoptosis, immune signalling pathways (TNFα signalling via NFκB and IL-6 JAK-STAT3 signalling) and hypoxia ( Fig. 1C ). HPV18 alters CTCF binding site occupancy in the host cell genome To discover novel mechanisms of HPV18-driven host cell gene expression changes, we opted to identify potential changes to host cell chromatin architecture by mapping differential CTCF binding. CTCF is an important regulator of host cell gene expression, partially through the stabilisation of promoter-enhancer interactions and the insulation of epigenetic boundaries [ 29 ], and we therefore hypothesised that alteration of CTCF activity could drive HPV-mediated host gene expression changes. We and others have previously reported that oncogenic HPV establishment resulted in a significant increase in CTCF protein level [ 30 , 31 ] that was not due to transcriptional upregulation of CTCF [ 30 ], suggesting that changes to CTCF protein function or turnover could be altered by HPV. We therefore hypothesised that HPV18 replication could induce a change in the distribution of CTCF binding within the human genome and that this might contribute to the altered gene expression observed. To test this, we analysed CTCF binding distribution by chromatin immunoprecipitation-sequencing (ChIP-Seq) in two independent HFK donor lines (donors 3 and 4). CTCF-bound peaks were identified using Model-based Analysis of ChIP-Seq (MACS) in each HFK donor before and after HPV18 establishment. While no difference in the total number of CTCF-bound peaks was observed following HPV18 establishment (HFK_3 n = 62125; HFK_4 n = 40988; HFK-HPV18_3 n = 59704, HFK-HPV18_4 n = 41105; p = 0.53), differential peak analysis revealed a subset of peaks differentially bound following HPV18 establishment (>log2FC +/-0.5, p<0.005) ( Fig. 2A and B, Table.S4 ). In total, 396 peaks were significantly reduced in CTCF binding and 504 peaks were significantly increased in the two donors tested. Annotation of all CTCF peaks identified by genomic feature revealed a similar distribution within the human genome as previously described [ 32 ] with most peaks within genebody (40 %) or intergenic regions (41 %). In addition, 14 % of peaks were within proximal and distal promoter regions and less than 5 % of peaks were within gene deserts ( Fig. 2C , Table.S4 ). Interestingly, the distribution of differentially bound peaks in HFK-HPV18 compared to HFK showed a bias towards gene desert regions, particularly in the peaks that were significantly reduced following HPV18 establishment where 19.4 % of differentially accessible CTCF peaks were found within gene deserts ( Fig. 2C ). Download figure Open in new tab Fig. 2: HPV18 induces differential host CTCF binding in primary HFKs. CTCF-bound peak were identified by ChIP-Seq analysis in two independent HFK donors. Significantly enriched peaks were identified using MACs (version 1.4.3) with a p-value cut-off of 1×10 -5 . Heatmaps of CTCF peaks that were significantly down- (A) or up-regulated (B) in HPV positive cells with a log2 fold change cutoff of −1 and +1, respectively. Heatmaps are sorted according to decreasing CTCF ChIP-Seq signal in HFKs. Normalized CTCF signal intensities are illustrated by white/blue to orange color gradient ranging from 0 to 5. (C) Pie charts showing the genomic features associated with all CTCF peaks identified (total) and the peaks significantly reduced (Diff Peaks Down) or increased in magnitude (Diff peaks Up). Genomic feature annotations were obtained using the diffReps tool. HPV18-induced alteration of CTCF binding frequently occurs in clusters associated with differential gene expression To determine whether HPV18-induced differential CTCF binding in the human genome contributes to any of the observed host transcriptional changes, we integrated RNA-Seq analysis of DGE with CTCF ChIP-Seq data. The distance of genes that were altered at least 2-fold (up and down) from the nearest at least 2-fold differentially bound CTCF peak was calculated. This analysis revealed that of the 976 genes that were differentially expressed (|log 2 FC| >1.0 or <-1.0 and adjusted p-value <0.05), 107 (11 %) of these genes were within 100Kb of differentially bound CTCF sites ( Table.S5 ). This represents a 1.5-fold enrichment (p = 2.3 × 10⁻⁵, Hypergeometric test) compared to the 7.5% (1,688 out of 22,598) of all genes included in the differential expression analysis. Interestingly, there appeared to be close clustering of multiple differential CTCF peaks within distinct genomic loci, suggesting that these loci have undergone epigenetic and/or topological rearrangement following HPV18 episome establishment. To identify all loci with multiple differentially bound CTCF peaks and corresponding differential expression we used the bedtools cluster function to identify differential CTCF peak clusters based on the distance between differentially bound peaks. In total, eight genomic loci were identified which contained 12 or more differentially bound CTCF sites. Seven of these loci contained at least one significantly differentially expressed gene ( Tables 1 and S6 ). This analysis identified a region on chromosome 11 which contains a cluster of 20 differentially bound CTCF binding sites ( Fig. 3A ). As this was the highest number of differentially bound CTCF peaks within a distinct genomic locus following HPV18 establishment, we decided to focus our investigation and downstream experiments on this genomic locus. The cell adhesion molecule 1 ( CADM1) and zinc finger and BTB domain 16 ( ZBTB16 ; also known as promyelocytic leukaemia zinc finger, PLZF ) genes are located within this locus. Notably the expression of CADM1 is significantly reduced in our RNA-Seq data ( Fig. 3B and Table S3 ; Log2FC = −3.1, p = 2.83e-06), which was validated by qRT-PCR using three independent primer sets ( Fig. 3B ) and CADM1 protein expression was significantly reduced in HFK-HPV18 in comparison to isogenic HFK cultures ( Fig. 3C ). Conversely, ZBTB16 mRNA was significantly increased in both our RNA-Seq data sets ( Fig. 3D and Table S2 ; Log2FC = 4.43, p = 7.06 x 10 -29 ) which was validated by qRT-PCR using two independent primer sets ( Fig. 3D ). Unfortunately, we were unable to detect ZBTB16 protein in our cultures by western blotting as a suitable antibody is not available. Nonetheless, our integrated analysis of differential gene expression and differential CTCF binding peaks have identified a genomic locus on chromosome 11 which contains a cluster of CTCF binding sites that are significantly reduced in CTCF abundance which is coincident with profound locus-specific gene expression changes. Download figure Open in new tab Fig. 3: HPV18-induced redistribution of a distinct CTCF binding cluster correlates with altered gene expression at the CADM1 locus. (A) Circos plot of Chromosome 11 (Chr11) showing differentially expressed genes (DGE; regularized log2 fold change cutoff (Log2FC) = 1; outer circle), significantly different CTCF peaks obtained by ChIP-seq analysis (inner circle), and clusters of differential CTCF sites with a maximum distance of 1M base pairs (middle circle). (B) CADM1 mRNA expression from RNA-Seq data (left panel) and qRT-PCR with primers designed to amplify exons (Ex) 1-2, exons 2-3 and exons 4-5 of CADM1 (right panel). Data are the mean and standard deviation of six independent HFK donors. Statistical significance was calculated using a paired T-test *p < 0.05 (left) and a one sample T-test with theoretical mean of 1 *** p < 0.001, **** p < 0.0001 (right). (C) CADM1 protein expression was analysed by western blotting. A representative image is shown on the left. Protein levels were quantified using ImageJ and normalized to b-actin and expression in the corresponding HFK donor (untransfected). Data are the mean and standard deviation and statistical significance was calculated using a one sample T-test with theoretical mean of 100, p = 0.048. (D) ZBTB16 mRNA expression from RNA-Seq data (left panel) and qRT-PCR with primers designed to amplify exons 1-2 and exons 1-3 (right panel). Data are the mean and standard deviation of six independent HFK donors. Statistical significance was calculated using a paired T-test, p < 0.02 (left) and a one sample T-test with theoretical mean of 1 *p < 0.05 (right). The genomic location of differential CTCF binding peaks identified in ChIP-Seq datasets was identified using the bedtools cluster function (v2.26.0) with a maximum distance of 1 Mbp. The coordinates and number of differential CTCF binding peaks (up or down) within the cluster are indicated along with the genes located within the cluster (red, significantly reduced expression; green, significantly increased expression; black, no change). HPV18 genome establishment induced epigenetic reprogramming of the CADM1 gene locus To elucidate the molecular basis of HPV18-induced CADM1 transcriptional repression, we analysed chromatin structure by mapping histone post-translational modifications (PTMs) known to be associated with transcriptionally active (H3K4Me3 and H3K27Ac) and inactive (H3K27Me3) loci alongside a mark of transcription progression (H3K36Me3). Active promoters are generally enriched in H3K4Me3 while enhancers often have H3K4Me1/3 and H3K27Ac enrichment (reviewed by [ 33 ]). Analysis of these histone marks at the CADM1 promoter and upstream enhancer (annotated in www.enhanceratlas.org ) demonstrated that enrichment of H3K4Me3 at the CADM1 promoter, and H3K4Me3 and H3K27Ac marks within the upstream enhancer are notably reduced following HPV18 establishment ( Fig. 4 ). In contrast, the CADM1 locus is devoid of repressive H3K27Me3 modifications in primary keratinocytes, the abundance of which is increased following HPV18 establishment, indicating specific epigenetic repression of CADM1 expression ( Fig. 4 ). Interestingly, epigenetic alteration of the CADM1 locus was coincident with epigenetic rearrangement of the neighbouring ZBTB16 gene locus but in contrast to CADM1 , the ZBTB16 locus was increased in activating histone marks H3K4Me3 and H3K27Ac and decreased in H3K27Me3 following HPV18 establishment. These epigenetic alterations to the CADM1/ZBTB16 loci are consistent with HPV18-induced local rearrangement resulting in repression of CADM1 and activation of ZBTB16 expression. Download figure Open in new tab Fig. 4: HPV18 establishment induces epigenetic rearrangement of the CADM1 locus. ChIP-Seq analysis of histone modifications (H3K4Me3, dark green; H3K27Ac, light green; H3K36Me3, purple; H3K27Me3, red) and CTCF (black) in primary HFK donor 3 before (HFK) and after establishment of HPV18 episome replication (HPV+). Significantly differentially enriched peaks (p < 0.0001) were identified using MACS and indicated by the coloured blocks below the ChIP-Seq traces. Differential gene expression (DGE) from RNA-Seq analysis is shown in the lower track alongside annotation of CADM1 and ZBTB16 gene positions. The transcriptional promoter (P) and enhancer elements (E) of CADM1 obtained from ENCODE are indicated. The epigenetic changes observed within the CADM1/ZBTB16 locus were consistent in HFK donor 4. HPV18 establishment induces topological rearrangement of the CADM1 locus The significant reduction of CADM1 transcription and upregulation of ZBTB16 following HPV18 establishment in all six independent primary keratinocyte cultures indicates a specific and targeted mechanism of HPV-induced host transcriptional reprogramming. This, combined with the loss of CTCF at the CADM1 TSS and within the upstream enhancer elements, and the dramatic alteration of epigenetic marks within the CADM1/ZBTB16 locus, led us to hypothesise that HPV18 establishment in primary keratinocytes induces CTCF-dependent topological rearrangement of this locus and contributes to the observed epigenetic reprogramming. To test this hypothesis, we first analysed the CTCF binding peaks identified by ChIP-Seq to map the location, core sequence (presence of primary motif only or primary and secondary motif [ 34 ]) and orientation (sense or anti-sense) of the CTCF binding sites within the CADM1 TSS and upstream enhancer element. We identified three CTCF binding sites at the CADM1 TSS; sites 1 and 2 contain the primary CTCF binding motif only and were in the anti-sense orientation, facing towards the CADM1 gene. Conversely, CTCF binding site 3 at the CADM1 TSS contains the primary and secondary motifs, indicating this site is higher affinity, and is orientated in the sense direction towards the upstream CADM1 transcriptional enhancer ( Fig. 5A and B ). None of the CTCF binding peaks identified at the CADM1 TSS were found to be significantly altered in CTCF binding by HPV establishment in the two HFK donors tested ( Fig. 4 ). However, we also mapped four further CTCF binding sites, termed sites 4, 5, 6 and 7 situated upstream of the CADM1 enhancer at −230 kb, −365 kb, −408 kb and −486 kb in relation to the CADM1 TSS, respectively. All these CTCF binding sites contain the primary and secondary motifs suggesting they are high affinity binding sites that may contribute to the stabilisation of long-range chromatin interactions [ 35 ]. Notably, the upstream CTCF binding sites 4-7 were all significantly reduced in CTCF binding following HPV18 establishment (site 4, p = 0.0044; site 5, p = 0.002; site 6, p = 3.3e -8 ; site 7, p = 2.97e -8 ). CTCF binding sites 5 and 7 were found to be orientated in the sense direction, orientated away from the CADM1 TSS, whereas sites 4 and 6 were orientated in the anti-sense direction, towards the CADM1 TSS. We therefore predicted that CTCF-mediated chromatin looping could be facilitated between convergent CTCF sites 3 and either sites 4 or 6, which could bring the previously annotated distal enhancer element at position Chr11:115492940-115637600 ( www.enhanceratlas.org ) in close physical proximity to the CADM1 TSS to stimulate transcription. Download figure Open in new tab Fig. 5: HPV18 establishment induces topological rearrangement of the CADM1 locus. (A) CTCF bound regions at the CADM1 TSS and upstream transcriptional enhancer were identified from ChIP-Seq data and CTCF binding site identified based on similarity to previously determined binding motif [ 73 ]. Binding site number is indicated and corresponds to the binding site annotation in (B). Direction is shown as sense (S) or antisense (AS) alongside the nucleotide position (kb) in relation to the CADM1 TSS. Primary and secondary CTCF binding motifs are indicated in bold and underlined. CpG dinucleotides within the annotated binding sites are indicated in red. (B) Chromatin interactions with the CADM1 transcriptional start site at Chr11:115375845-115376296 (viewpoint indicted in blue) were analyzed by 4C in two independent HFK donors before and after HPV18 episome establishment. Annotated enhancer elements (grey boxes). The position and orientation of mapped reads was determined using the Probe Trend Plot feature of SeqMonk and shows relative read density over restriction fragments generated by Dpn II and Bfa I digest, correcting to the largest datastore (depth indicated in legends; rainbow). Subtraction of normalised read counts of HFK-HPV18 minus HFK for each donor was calculated and shown below the 4C-Seq tracks for each donor. Green indicates a gain in interaction whereas purple indicates a loss. To determine whether cis- or trans-interactions exist between the CADM1 TSS and any other genomic region in the cellular genome we used circular, chromatin conformation capture (4C) followed by next generation sequencing (4C-Seq). The experiment was designed to capture chromatin interactions with a viewpoint region containing the CADM1 TSS (Chr11:115375845-115376296) created by restriction digest with Dpn II and Bfa I. Analysis of chromatin interactions in two independent primary keratinocyte donors revealed interactions between the CADM1 TSS and the upstream enhancer element in both HFK donors tested ( Fig. 5B ). Notably, in the presence of HPV18 genome replication, the interaction between the CADM1 TSS and upstream enhancer element was reduced, indicated by the dominance of purple bars in the HFK-HPV18 subtraction analysis. This reduced interaction between the CADM1 TSS and upstream enhancer elements was observed across both donors tested, although the overall effect in donor 4 is less pronounced than in donor 3. HPV18-induced loss of CADM1 promoter-enhancer interactions precedes CpG hypermethylation of the CADM1 locus It has previously been shown that CADM1 expression is significantly reduced in HPV-driven cancers [ 36 , 37 ] and this reduced expression correlates with hypermethylation of CpG islands at the CADM1 TSS [ 38 ]. We therefore sought to determine whether the reduced CADM1 expression and alterations to promoter-enhancer interactions were due to CpG hypermethylation at the CADM1 TSS. This is particularly important since the CTCF binding sites present within the CADM1 TSS (binding sites 1-3) each contain multiple CG dinucleotides, methylation of which would inhibit CTCF binding [ 39 ]. The enrichment of CpG methylation at the CADM1 locus and surrounding genes was determined by adaptive Nanopore sequencing, which allows the direct detection of methylated cytosines at CpG sites without the need for bisulphite conversion [ 40 ]. Visualisation of CpG methylation within our region of interest (Chr11:112,500,000-117,500,000) in HPV18 genome containing HFKs (donors 3, 4 and 5) revealed a distinct area of predominantly unmethylated DNA at the CADM1 locus, which was flanked by regions of higher CpG methylation up- and down-stream ( Fig. 6A ). While the mean percentage CpG methylation in each donor at the CADM1 TSS was low (donor 3 26.76 %; donor 4, 21.76 %; donor 5, 15.25 %), the abundance of CpG methylation detected at the neighbouring gene APOA5 was significantly higher (donor 3, 75.4 %; donor 4, 46.98 %; donor 5, 76.23 %; p < 0.0001, Fig. 6B ). These results suggest that the strong repression of CADM1 expression by HPV18 genome replication in primary HFKs is not due to increased CpG methylation of the CADM1 TSS, as previously demonstrated in HPV-driven cancers. Download figure Open in new tab Figure. 6: Low abundance of CpG methylation at the CADM1 locus following establishment of HPV18 replication. Methylation at CpG dinucleotides was determined by adaptive Nanopore sequencing in donors 3, 4 and 5. (A) Histogram of aligned reads (depth 0-25 counts) is shown, CpG dinucleotides are coloured by 5 mC modified CpG (blue indicates unmethylated and red indicates methylated cytosines). The position of genes within the region shown are indicated at the top. CpG islands of >300 bp were identified using Encode and indicated by the green bars below the Figure. (B) Regions of interest at the CADM1 TSS (i) and APOA5 TSS (ii), as depicted on (A) are shown. (C) Violin plots showing the distribution of % CpG methylation at CpG dinucleotides at the CADM1 TSS (blue) and the APOA5 TSS (orange). Data median are indicated by the bold dotted line and quartiles by fine dotted lines. % CpG methylation is significantly higher in the APOA5 TSS than the CADM1 TSS in all three donors tested (p < 0.0001, student’s T-Test). DISCUSSION The establishment of persistent oncogenic HPV replication and in vitro immortalisation of primary keratinocytes is facilitated by manipulation of the host transcriptome to alter the immune response to infection and drive a rebalancing of cellular growth and differentiation. Studies of HPV-induced transcription manipulation of the host in physiological models of oncogenic HPV replication have defined key events in HPV establishment and host cell immortalisation [ 3 , 4 , 6 , 41 ]. Comparison of differential gene expression following HPV16-mediated in vitro immortalisation of primary cervical keratinocytes has previously revealed a strong concordance with aberrant gene expression in HPV-driven cervical cancers [ 3 ]. It has also been shown that HPV positive tumours have a distinct pattern of differential gene expression, mostly driven by E6/E7 expression, compared to HPV-tumours at the same anatomical site and a consistent pattern of aberrant gene expression is noted in HPV+ tumours from distinct anatomical sites [ 42 ]. These findings provide strong evidence that HPV-driven host transcription reprogramming is important for persistent HPV replication as well as initiation of tumourigenesis and subsequent maintenance of tumour growth. In this study we use a panel of six genetically distinct primary HFKs to define gene expression changes that occur following in vitro establishment of HPV18 episome maintenance replication. RNA-Seq analysis revealed a robust and consistent pattern of differential gene expression across HFK donors. Comparison of the gene expression changes that occur in all six HFK donors reveals a discrete subset of significantly altered genes; a total of 628 genes were upregulated and 348 genes downregulated. A lower number (228) of genes were differentially expressed upon establishment of HPV18 episomes in HFKs and analysed using a microarray assay [ 43 ]. Of these, 44 matched the differentially expressed genes in our study, with all 44 being regulated in the same direction. A similar number of genes were also identified in HPV16-mediated immortalisation of HFKs, using a similar method to that used in this study, with some overlap with the differentially expressed genes identified in our study (e.g. UHCL1 , RNF212, and NEFH ) [ 44 ]. We hypothesised that the mechanisms driving HPV-manipulation of host gene expression in our model of productive infection are likely to be different to the less dynamic mechanisms of sustained aberrant gene expression observed in HPV-driven cancers. GSEA highlighted pathways targeted by HPV18 consistent with previous reports, including E2F signalling, G 2 /M checkpoint response and various immune signalling pathways identified in HPV18 replication models [ 43 ] or overexpression of HPV18 E6/E7 [ 45 ]. Notably, some of the gene expression changes we observed in our pre-disease model of HPV replication are also known to occur with high frequency in HPV-driven cancers. For example, CADM1 expression was reduced in all six HFK donors following HPV18 replication establishment. This gene has been shown to be strongly downregulated in HPV+ cancers (REF) [ 36 – 38 ]. We now show that HPV18-induced repression of CADM1 transcription is an early event in HPV-driven pathogenesis and occurs prior to virus-induced cell transformation. We and others have previously shown that oncogenic HPV establishment in primary keratinocytes results in a post-transcriptional increase in CTCF protein abundance [ 18 , 31 ]. CTCF plays a key role in the regulation of HPV and host transcription through the regulation of epigenetic chromatin status and stabilisation of long-range chromatin interactions, often between promoter and enhancer elements to drive transcription [ 18 , 19 , 46 ]. To determine whether HPV manipulation of CTCF function is in part responsible for HPV18-induced differential host gene expression, we performed ChIP-Seq analysis to map CTCF binding sites and key epigenetic marks in the host genome following HPV18 establishment in two independent HFK donors. While the overall number of CTCF binding peaks did not change, the distribution of a sub-set of CTCF bound peaks was significantly altered; 900 distinct CTCF peaks displayed a significant gain (n = 504) or loss (n = 396) of CTCF binding with an apparent bias in loss of binding within gene desert/intergenic regions. Integration of the differentially bound CTCF peaks with differential gene expression data identified gene loci that contained clusters of differentially bound CTCF peaks coincident with significant changes to gene expression. Notably, the CADM1/ZBTB16 gene locus contained 20 differentially bound CTCF sites predominantly located up-stream of the CADM1 gene body including within the upstream transcriptional enhancer of CADM1 . General loss of CTCF binding in this region in HFKs with replicating HPV18 genomes was coincident with increased ZBTB16 expression and decreased CADM1 expression in all six HFK donors tested. The loss of CTCF binding in this region was also coincident with altered epigenetic status within the CADM1 TSS and upstream enhancer from an active to repressed chromatin state. In the two donors analysed, HPV18 replication caused a loss of active chromatin marks H3K4Me3 and H3K27Ac and gain of repressive H3K27Me3 within the CADM1 TSS and upstream enhancer. Whether this alteration of epigenetic marks is a cause or consequence of CTCF binding disruption at this locus is not yet clear. However, CTCF binding is important for epigenetic insulation between active and inactive gene regions [ 47 ]. It is therefore possible that initial disruption of CTCF binding upstream of the CADM1 gene removes epigenetic insulation from the neighbouring repressed gene region thus allowing the spread of repressive H3K27Me3 marks into the CADM1 locus causing a downregulation of CADM1 expression, a hypothesis we are currently testing. Binding of CTCF to target sites can be disrupted by methylation of CpG dinucleotides within the binding footprint [ 48 ]. Notably, it has also been shown that downregulation of CADM1 in HPV-driven cancer is due to hypermethylation of a CpG island at the CADM1 TSS [ 36 , 37 , 49 ] and that sequential hypermethylation at the CADM1 TSS correlates with HPV-driven cancer stage [ 12 , 13 , 38 ]. To determine whether HPV18-induced disruption of CTCF binding at the CADM1 locus could be due to increased CpG methylation of these binding sites, particularly within the upstream transcriptional enhancer, we mapped binding sites by comparison of the genomic sequences within the binding footprints identified in our ChIP-Seq data with the defined CTCF binding motif ( Jasper.com ). While the CTCF binding sites at the CADM1 TSS each contained multiple CpG dinucleotides and therefore CTCF binding at these sites could be sensitive to increased CpG methylation, the upstream sites (4, 5 and 6) did not contain CpG dinucleotides. HPV18-induced loss of CTCF binding at sites 4, 5 and 6 in the CADM1 enhancer is therefore not predicated in alterations in CpG methylation. To determine whether loss of CTCF binding at sites 1, 2 and 3, situated at the CADM1 TSS was due to HPV18-induced hypermethylation of the CADM1 TSS, we analysed CpG methylation levels by Oxford Nanopore sequencing. These experiments revealed a distinct area of hypomethylated DNA at the CADM1 locus that was flanked by hypermethylated regions in HPV18-genome containing HFKs harvested from three individual donors. These results are consistent with a previous study which assessed CpG hypermethylation within 14 key genes, including CADM1 , in a model of E6/E7-driven primary keratinocyte immortalisation. Only a small increase in CpG methylation between HPV-controls and cells harvested between 14-20 passages after E6/E7-mediated immortalisation was observed, and no difference in the level of CpG methylation was detected at the CADM1 promoter [ 13 ]. We therefore conclude that the rearrangement of CTCF binding and altered epigenetic regulation of the CADM1 locus is a pre-cursor to hypermethylation of the CADM1 promoter frequently observed in HPV-driven cancers. Interestingly, a high proportion of CpG islands contain TSSs and it is generally accepted that unmethylated CpG islands act as a nucleation site for the recruitment of histone modifying enzymes such as KDM2A which facilitates enrichment of histone H3 lysine 4 tri-methylation (H3K4Me3) thereby maintaining an active chromatin state [ 50 , 51 ]. The mechanisms of de novo methylation of CpG islands are not fully understood but a strong correlation with loss of H3K4Me3 and a gain of polycomb repressive complex (PRC)-catalysed histone modifications including histone H3 lysine 27 trimethylation (H3K27Me3), creating a repressed chromatin state has been observed [ 51 ]. Evidence suggests that this PRC-mediated H3K27Me3 enrichment is a pre-requisite for de novo CpG island methylation in embryonic development and in cancer [ 52 ] and creates a constitutively silent chromatin state. In summary, we have shown that replication of HPV18 in primary HFKs isolated from six independent donors causes a consistent pattern of differential gene expression in the host cell. Integration of RNA-Seq data with CTCF ChIP-Seq data revealed that many of the significantly altered genes map to genomic loci that contain discrete clusters of differentially bound CTCF sites. The CADM1 locus on chromosome 11 contains 20 differentially bound CTCF binding sites, 19 of which display a significant reduction of CTCF binding in cells with persistently replicating HPV18 genomes. This loss of CTCF binding is coincident with a switch in epigenetic mark enrichment, from an active to inactive chromatin state, and with reduced CADM1 expression, but not with increased CpG hypermethylation as has been described in HPV-driven cancers. We have demonstrated that rearrangement of CTCF binding induced a structural change upstream of the CADM1 genebody, such that physical contacts between the transcriptional enhancer and CADM1 TSS are disrupted. Although other studies have shown that CADM1 expression negatively correlates with HPV-driven cancer stage, we now provide evidence that CADM1 gene expression is targeted by oncogenic HPV prior to cellular transformation, suggesting that CADM1 repression is an important early event in HPV establishment. Functionally, CADM1 is a member of the immunoglobulin superfamily of transmembrane glycoproteins. The extracellular domain mediates interactions of the keratinocyte with extracellular matrix and neighbouring cells including dendritic cells, NK and CD8+ T cells, while the intracellular domain contains protein 4.1-binding and PDZ-binding motifs which, upon binding intracellular partners, regulates cell motility. HPV-mediated repression of CADM1 is therefore likely to be important in persistence of infection by altering both epithelial tissue integrity and immune cell attraction and activation within the lesion. MATERIALS AND METHODS Primary keratinocyte culture and transfection The transfection of normal primary foreskin keratinocytes (HFKs) harvested from neonatal foreskin epithelia (HSE ethical approval number 06/Q1702/45) with recircularized HPV18 genomes was performed in S. Roberts’ laboratory as previously described [ 19 , 53 ]. To eliminate donor-specific effects, primary cells from six foreskin donors were used: five isolated in house and one commercially available (Lonza). RNA Sequencing Primary HFKs and HPV18-transfected isogenic lines (1 x 10 5 ) were cultured on γ - irradiated J2 fibroblasts in epidermal growth factor containing E medium [ 25 ] in 10 cm dishes until 80% confluent. J2 fibroblasts were then removed and HFKs harvested by trypsinisation. Cells were pelleted, washed with PBS, snap frozen and stored at –80 °C. RNA was extracted using the RNeasy Mini Kit following the manufacturer’s protocol (Qiagen) and DNase I treated. Libraries were prepared using TruSeq Stranded mRNA Library Prep kit for NeoPrep (Illumina) using 100 ng total RNA. Libraries were pooled and run as 75 cycle pair end reads on a NextSeq 550 (Illumina) using a high output flow cell. Sequencing reads were aligned to GRCh37 human genome merged with HPV18 genome (AY262282.1) using STAR aligner (v2.5.2b) [ 54 ]. Reads mapping to genes were counted by the same software. Normalisation of read counts and differential expression analysis between HFK and HPV18 samples was performed with DESeq2 (v.1.26.0) R Bioconductor package [ 55 ], taking into account the paired sample design of the experiment. Gene set enrichment analysis was done using GAGE (v.2.36.0) R Bioconductor package [ 56 ] with MSigDB gene set database. The computations were performed on the CaStLeS infrastructure ( http://doi.org/10.5281/zenodo.3250616 ) at the University of Birmingham. The PlotPCA function in DESeq2 was used to calculate the principal components of rlog transformed RNA-Seq expression data of the 500 most variable genes. The ClusterSignificance [ 57 ] R Bioconductor package was used to evaluate statistical significance of group separation compared to permuted data. The P-value was calculated using 10 4 permutations. Chromatin immunoprecipitation (ChIP) and next generation sequencing 1-2 x 10 7 cells were fixed in 1% formaldehyde for 3 mins at room temperature, quenched in 0.25 M glycine and washed in ice cold PBS. Chromatin was immunoprecipitated with 2-10 μg of antibody specific for CTCF (Cell Signaling #D31H2-XP) and histone modifications H3K4Me3 (Upstate: #04-745), H3K27Ac (Abcam: ab4729), H3K36Me3 (Cell Signaling: 4909S) and H3K27Me3 (Upstate: #07-449) as previously described [ 58 ]. ChIP and respective input samples were used for generation of ChIP-Seq libraries as described [ 59 ]. Briefly, 2-10 ng DNA was used in conjunction with the NEXTflex Illumina ChIP-Seq library prep kit (Cat# 5143-02) as per the manufacturer’s protocol. Samples were sequenced on a HiSeq 2500 system (Illumina) using single read (1 x 50) flow cells. Sequencing data was aligned to the GRCh37 human genome using Bowtie [ 60 ] with standard settings and the -m1 option set to exclude multi mapping reads [ 58 ]. Differential ChIP-seq analysis CTCF enriched sites (CTCF peaks) on the human genome were called in all samples using MACS1.4 [ 61 ]. Peaks were first filtered to be present in at least two samples and were subsequently merged into a stringent CTCF peak set using the Bioconductor R package DiffBind (v3.6.5)[ 62 , 63 ]. Differential sites from CTCF ChIP replicates were detected and annotated with diffReps [ 64 ] using presets of negative binomial statistics and nucleosome size detection mode parameters. Differential sites were then reported if overlapping with the stringent peak set to exclude background detection. Normalized heatmap visualization of differential sites (log2 cutoff −1 or 1) was generated with EaSeq (v1.1.1) [ 65 ]. Differential CTCF peaks were then clustered using the bedtools cluster function (v2.26.0) [ 66 ] with a maximum distance of 1 Mbp. Differential ChIP-seq analysis of post-translational histone modifications was performed similarly to CTCF using diffReps [ 64 ] with negative binomial detection presets for replicates. Differential sites for activating histone modifications (H3K4Me3 and H3K27Ac) were detected with “peak” mode presets while broader differential regions of the repressive mark H3K27Me3 and the transcription-associated mark H3K36Me3 were detected with “block” mode presets. Integration of RNA-seq and ChIP-seq data Differentially expressed genes and differential CTCF binding site clusters as well as sites of differential histone modifications were associated using the bedtools closest function (v2.26.0) [ 66 ]. Circos plot visualization of differentially expressed genes, individual differential CTCF binding sites and CTCF clusters was generated with Circos (v0.69-6) [ 67 ]. Quantitative reverse transcriptase PCR (qRT-PCR) DNase I treated RNA (3 µg) was used for random primed cDNA synthesis using Superscript® III (Invitrogen) according to the manufacturer’s instructions. qPCR was performed with 40 cycles of 95 °C, 30 s; 60 °C, 60 s; 72 °C, 40 s followed by a thermal dissociation curve for QC analysis using a Stratagene Mx3005P detection system with SyBr Green incorporation and the primers listed in Table 2 . View this table: View inline View popup Table 1: Cluster analysis of differentially bound CTCF binding peaks. View this table: View inline View popup Table 2: qRT-PCR Primers. View this table: View inline View popup Download powerpoint Table 3: 4C Primers. Western blotting and antibodies Cells were lysed in urea lysis buffer (8 M Urea, 100 mM Tris-HCl, pH 7.4, 14 mM β-mercaptoethanol, protease inhibitors) and protein concentration determined by Bradford assay. Equal amounts of protein were separated by SDS-PAGE and western blotting carried out using conventional methods. CADM1 protein was detected using SynCAM Rabbit polyclonal antibody (Abcam #ab3910; 1:1000), CTCF detected with Active Motif (#61311; 1:1000), GAPDH with Santa Cruz antibody (#0411; 1:5000) and β-actin detected with Sigma antibody (#A5441; 1:5000). Circularised chromosome conformation capture (4C-seq) 4C-Seq was carried out in three independent primary HFK donors and isogenic HPV18 transfected lines using a previously described protocol [ 68 , 69 ]. CADM1 promoter interacting fragments were captured using a 451 bp Dpn II fragment containing the CADM1 promoter, prior to digestion with Bfa I. Cells were passed through a 70 µm filter, counted and 1 x 10 7 cells were fixed in 2 % formaldehyde/10 % FCS in PBS for 10 mins at RT before quenching with 0.125 M glycine on ice. Cells were pelleted by centrifugation at 400 x g for 8 mins at 4 °C and resuspended in 5 mL ice cold lysis buffer (50 mM Tris-HCl, pH 7.5, 150 mM NaCl, 5 mM EDTA, 0.5 % NP-40, 1 % Triton-X-100, 1x protease inhibitor cocktail (Roche)) and incubated on ice for 10 mins. Nuclei were pelleted at 750 x g for 5 mins at 4 °C and snap frozen before storage at –80 °C. Primary digestion and ligation Pellets were resuspended in 500 µL 1x Dpn II restriction enzyme buffer (NEB) containing 0.3 % SDS and incubated at 37 °C with shaking at 900 rpm. Triton-X-100 was added to a final concentration of 0.625 % and the samples incubated for a further 1 hr at 37 °C with shaking at 900 rpm. 200 U of Dpn II was then added and samples incubated at 37 °C for 4 hrs with shaking at 900 rpm. A further 200 U of Dpn II was added and samples digested overnight at 37 °C with shaking and a final 200 U Dpn II was then added for a final 4 hrs to ensure complete digestion. Following restriction enzyme inactivation, digestion efficiency was determined by agarose gel electrophoresis following Proteinase K digestion of undigested and digested aliquots. Proximity ligation was carried out at 16 °C overnight by the addition of 1x ligase buffer to 7 mL and 10 µL T4 DNA Ligase (NEB) and ligation efficiency determined by agarose gel electrophoresis following Proteinase K digestion of an aliquot. Proteinase K was added to a final concentration of 40 µg/mL and samples incubated overnight at 65 °C to reverse crosslinks. 40 µg/mL RNase A was added and samples incubated at 37 °C for 45 mins before extraction with phenol-chloroform-isoamylalcohol (24:24:1) and ethanol precipitation. Pellets were resuspended in 150 µL 10 mM Tris-HCl, pH 7.5. Secondary digestion and ligation To 150 µL of each sample, 50 µL 10x restriction enzyme buffer, 50 U of Bfa I enzyme and 250 µL ddH 2 0 were added and samples incubated overnight at 37 °C. Digestion efficiency was determined as previously described and restriction enzyme heat inactivated before samples were made up to 14 mL with 1x ligase buffer and 20 µL ligase added. Ligation was carried out at 16 °C overnight. DNA was ethanol precipitated and samples purified using a QIAquick PCR purification kit (Qiagen) and eluted in 150 µL Tris-HCl, pH 7.5. PCR amplification of 4C template Captured fragments were amplified by inverse PCR using primers that amplify outwards from the bait region ( Table 2 ). Forward primers included a 5’ overhang containing the Illumina P5 sequence adapter and a unique ‘barcode’ sequence and encompassed the primary Dpn II restriction site within the CADM1 promoter bait. The common reverse primer included a 5’ overhang containing the Illumina P7 sequence adapter and were designed to bind less than 100 bps from the secondary Bfa I restriction site in the CADM1 promoter bait. PCR was carried out using 11.2 µL Expand Long Template Polymerase (Roche) with 3.2 µg template, 1.12 nmol of P5 and P7 primers, 0.2 mM dNTPs in an 800 µL reaction divided into 16 PCR tubes for 2 min 94 °C, 29 cycles of 10 s 94 °C, 1 min 55°C and 3 mins 68 °C, followed by 5 mins at 68 °C. The reactions were pooled and purified using a High Pure PCR Product Purification Kit (Roche). 4C libraries generated from each sample (2 independent HFK donors; HPV18- and HPV18+) with were amplified with sense a primer containing an Illumina P5 adapter (adapter) and unique TSBC barcode (italics) and a common primer containing a P7 Illumina adapter (underlined). CADM1 -specific viewpoint priming sites are indicated in bold. Sequencing, demultiplexing and mapping The samples underwent 101 base pair, single-end sequencing on a HiSeq 2500, to generate FASTQ files using standard Illumina base-calling pipeline software. The samples were combined in one sequencing lane and so required demultiplexing post-sequencing. The library construction positioned the barcodes “in-line” with the target sequences and comprised the first 6 bases of each read. A custom Perl script was used to perform the demultiplexing, which identified FASTQ reads containing expected barcode sequences. The custom script performed additional validation by selecting only reads that conformed to the library design, by selecting for reads that contained a fixed sequence (TGAGCATACCCTCCTCGATC) immediately adjacent to the barcode. Furthermore, sequences which read-through immediately into the bait sequence (TTCTAGAGGGGAAGAAAATAAGTA) were discarded. The FASTQ files were evaluated for sequence quality using FastQC ( https://www.bioinformatics.babraham.ac.uk/projects/fastqc/ ). We confirmed that the reads contained human DNA and were free from likely sources of genetic contamination using FastQ Screen v0.14.0 [ 70 ]. Prior to mapping, the FASTQ files were quality trimmed with Trim Galore v0.6.2 ( https://www.bioinformatics.babraham.ac.uk/projects/trim_galore/ ), using Cutadapt v1.18 [ 71 ]. This step removed low-quality and adapter sequences. The resulting FASTQ files were mapped against human genome assembly GRCh37 using Bowtie2 (v2.3.2) with default mapping parameters. Validating read position and orientation In accordance with our experimental protocol, canonical 4C ligations should generate reads derived from genomic regions adjacent to Dpn II cut sites. Moreover, forward reads should map preferentially to the 5’ end of Dpn II fragments, while reads in the reverse orientation should map to the 3’ ends. In contrast, reads should not exhibit such positional and orientation biases with respect to Bfa I cut sites. To confirm these expectations, in silico Dpn II/ Bfa I genome digestions were performed on human genome GRCh37 FASTA files with the Digester script from HiCUP v0.7.2 [ 72 ]. The position and orientation of the mapped reads were determined using the genome browser SeqMonk ( https://www.bioinformatics.babraham.ac.uk/projects/seqmonk/ ). After importing the BAM files (generated by mapping FASTQ files with Bowtie 2) and the HiCUP-generated genome digest file into SeqMonk, the “Probe Trend Plot” feature of SeqMonk calculated the relative read density over every restriction fragment in the genome. SeqMonk was also used to quantitate the number of mapped reads aligning to each restriction fragment (or contiguous merged restriction fragments). 4C Subtractive Quantitation Analysis Read quantitation comparisons were performed using the bioinformatics tool SeqMonk. Firstly, the SeqMonk pipeline “Even Coverage Probe Generator” was run, using default parameters, to create tiled windows across the Human GrCh37 reference genome. These windows varied in length, so that each one contained the same number of reads (when pooling reads across all the datasets). As expected, this pipeline produced smaller windows proximal to the 4C bait, with these window lengths increasing steadily with distance from the bait. The number of reads per window was then re-quantitated for each dataset and, to enable direct comparisons between datasets, the read counts were normalised by library size. This normalisation step effectively sets the total number of reads to be the same for each dataset. SeqMonk was then used to subtract the normalised read count for every window in the pre-infection control dataset from its corresponding window in the relevant post-infection sample dataset. This paired control/sample subtraction step was repeated for every patient. The results were displayed by SeqMonk as a bar chart adjacent to the associated genome annotation. Adaptive Nanopore Sequencing and CpG methylation analysis Sequencing was carried out on genomic DNA extracted from HFK-HPV18 donors 3, 4 and 5 using a Qiagen Blood DNA extraction kit. Approximately 1 µg DNA was prepared using the Oxford Nanopore LSK109 library preparation protocol according to manufacturer’s instructions. 150 fmol of completed library was sequenced on Nanopore Minion flowcells using R9.4.1 chemistry using an adaptive sampling protocol. The contigs of the GRCh38 reference genome and HPV18 genomes were merged and used to provide a custom genome for the adaptive sampling. A custom BED file targeting the regions of interest (ROI, available on request) was designed according to adaptive sampling parameters and used to control the sequencing run. The adaptive sampling run was set to “enrich” and the flowcells run for 72 hours, with supplemental flush and reload if necessary. Data was basecalled using Dorado 0.6 using the R9.4.1 methylation specific model ( [email protected] ) with 5 mC and 5 hmC calling switched on. This was then aligned to the custom GRCh38+HPV16/18 reference genome using minimap 2.12 (parameters: -ax map-ont), sorted and indexed with Samtools 1.16. BAM files were inspected manually with IGV v2.16 with methylation tagging visibility switched on. SUPPLEMENTAL TABLE LEGENDS Table S1: RNA Sequencing Analysis. Table shows total number of reads per sample alongside number of uniquely mapped reads, reads mapped to the HPV18 genome (AY262282.1) and the number of HPV-host fusion transcripts identified. Table S2: Genes upregulated in HFK-HPV18 compared to HFK. Mean sequencing counts in HFK and HFK-HPV18 are shown alongside log2 FC in gene expression and adjusted p value for each gene identified. Table S3: Genes downregulated in HFK-HPV18 compared to HFK. Mean sequencing counts in HFK and HFK-HPV18 are shown alongside log2 FC in gene expression and adjusted p value for each gene identified. Table S4: ChIP-Seq analysis of CTCF bound chromatin regions. Total CTCF binding peaks identified is given in the first tab. The second tab shows peaks that were differentially bound between HFK and HFK-HPV18 (mean of two donors). Data show the chromosomal location of identified peaks alongside the peak height, log2FC (up or down), neighbouring gene and genomic feature. Table S5: Integration of differential gene expression and differential CTCF peak annotation. RNA-Seq data (blue) and ChIP-Seq data (green) were integrated to determine the distance of genes (red) that were altered at least 2-fold (up and down) from the nearest at least 2-fold differentially bound CTCF peak. Table S6: Cluster analysis of CTCF binding sites. The bedtools cluster function was used to identify all loci with multiple differentially bound CTCF peaks (tab 1), integrated with corresponding differential expression (tab 2). Acknowledgements This work was funded by grants from the Medical Research Council awarded to JLP (MR/R022011/1, MR/T015985/1 and MR/N023498/1). Work from BN was funded through the Cancer Research UK Birmingham Centre award C17422/A25154. Research was carried out at the National Institute for Health and Care Research (NIHR) Birmingham Biomedical Research Centre (BRC). The funders had no role in study design, data collection and interpretation, or the decision to submit the work for publication. We thank Dr. Joseph Spitzer and his patients for the collection and donation of foreskin tissue. REFERENCES 1. ↵ de Martel C , Georges D , Bray F , Ferlay J , Clifford GM . Global burden of cancer attributable to infections in 2018: a worldwide incidence analysis . Lancet Glob Health . 2020 ; 8 ( 2 ): e180 – e90 . Epub 20191217. doi: 10.1016/S2214-109X(19)30488-7 . PubMed PMID: 31862245 . OpenUrl CrossRef PubMed 2. ↵ Moody CA , Laimins LA . Human papillomavirus oncoproteins: pathways to transformation . Nat Rev Cancer . 2010 ; 10 ( 8 ): 550 – 60 . doi: 10.1038/nrc2886 . PubMed PMID: 20592731 . OpenUrl CrossRef PubMed Web of Science 3. ↵ Wan F , Miao X , Quraishi I , Kennedy V , Creek KE , Pirisi L . Gene expression changes during HPV-mediated carcinogenesis: a comparison between an in vitro cell model and cervical cancer . Int J Cancer . 2008 ; 123 ( 1 ): 32 – 40 . doi: 10.1002/ijc.23463 . PubMed PMID: 18398830 . OpenUrl CrossRef PubMed Web of Science 4. ↵ Kang SD , Chatterjee S , Alam S , Salzberg AC , Milici J , van der Burg SH , et al. Effect of Productive Human Papillomavirus 16 Infection on Global Gene Expression in Cervical Epithelium . J Virol . 2018 ; 92 ( 20 ). Epub 20180926. doi: 10.1128/JVI.01261-18 . PubMed PMID: 30045992 . OpenUrl Abstract / FREE Full Text 5. Israr M , Rosenthal D , Frejo-Navarro L , DeVoti J , Meyers C , Bonagura VR . Microarray analysis of human keratinocytes from different anatomic sites reveals site-specific immune signaling and responses to human papillomavirus type 16 transfection . Mol Med . 2018 ; 24 ( 1 ): 23 . Epub 20180516. doi: 10.1186/s10020-018-0022-9 . PubMed PMID: 30134802 . OpenUrl CrossRef PubMed 6. ↵ Klymenko T , Gu Q , Herbert I , Stevenson A , Iliev V , Watkins G , et al. RNA-Seq Analysis of Differentiated Keratinocytes Reveals a Massive Response to Late Events during Human Papillomavirus 16 Infection, Including Loss of Epithelial Barrier Function . J Virol . 2017 ; 91 ( 24 ). Epub 20171130. doi: 10.1128/JVI.01001-17 . PubMed PMID: 29021401 . OpenUrl Abstract / FREE Full Text 7. ↵ Soto D , Song C , McLaughlin-Drubin ME . Epigenetic Alterations in Human Papillomavirus-Associated Cancers . Viruses . 2017 ; 9 ( 9 ). Epub 20170901. doi: 10.3390/v9090248 . PubMed PMID: 28862667 . OpenUrl CrossRef PubMed 8. ↵ Patel D , Huang SM , Baglia LA , McCance DJ . The E6 protein of human papillomavirus type 16 binds to and inhibits co-activation by CBP and p300 . EMBO J . 1999 ; 18 ( 18 ): 5061 – 72 . doi: 10.1093/emboj/18.18.5061 . PubMed PMID: 10487758 . OpenUrl Abstract / FREE Full Text 9. ↵ Zimmermann H , Degenkolbe R , Bernard HU , O’Connor MJ . The human papillomavirus type 16 E6 oncoprotein can down-regulate p53 activity by targeting the transcriptional coactivator CBP/p300 . J Virol . 1999 ; 73 ( 8 ): 6209 – 19 . doi: 10.1128/JVI.73.8.6209-6219.1999 . PubMed PMID: 10400710 . OpenUrl Abstract / FREE Full Text 10. ↵ McLaughlin-Drubin ME , Crum CP , Munger K . Human papillomavirus E7 oncoprotein induces KDM6A and KDM6B histone demethylase expression and causes epigenetic reprogramming . Proc Natl Acad Sci U S A . 2011 ; 108 ( 5 ): 2130 – 5 . Epub 20110118. doi: 10.1073/pnas.1009933108 . PubMed PMID: 21245294 . OpenUrl Abstract / FREE Full Text 11. ↵ Hyland PL , McDade SS , McCloskey R , Dickson GJ , Arthur K , McCance DJ , et al. Evidence for alteration of EZH2, BM I1, and KDM6A and epigenetic reprogramming in human papillomavirus type 16 E6/E7-expressing keratinocytes . J Virol . 2011 ; 85 ( 21 ): 10999 - 1006 . doi: 10.1128/JVI.00160-11 . PubMed PMID: 21865393 . OpenUrl Abstract / FREE Full Text 12. ↵ Leonard SM , Wei W , Collins SI , Pereira M , Diyaf A , Constandinou-Williams C , et al. Oncogenic human papillomavirus imposes an instructive pattern of DNA methylation changes which parallel the natural history of cervical HPV infection in young women . Carcinogenesis . 2012 ; 33 ( 7 ): 1286 – 93 . doi: 10.1093/carcin/bgs157 . PubMed PMID: 22552403 . OpenUrl CrossRef PubMed 13. ↵ Schutze DM , Kooter JM , Wilting SM , Meijer CJ , Quint W , Snijders PJ , et al. Longitudinal assessment of DNA methylation changes during HPVE6E7-induced immortalization of primary keratinocytes . Epigenetics . 2015 ; 10 ( 1 ): 73 – 81 . Epub 20150123. doi: 10.4161/15592294.2014.990787 . PubMed PMID: 25580631 . OpenUrl CrossRef PubMed 14. ↵ Au Yeung CL , Tsang WP , Tsang TY , Co NN , Yau PL , Kwok TT . HPV-16 E6 upregulation of DNMT1 through repression of tumor suppressor p53 . Oncol Rep . 2010 ; 24 ( 6 ): 1599 – 604 . doi: 10.3892/or_00001023 . PubMed PMID: 21042757 . OpenUrl CrossRef PubMed 15. ↵ Chalertpet K , Pakdeechaidan W , Patel V , Mutirangura A , Yanatatsaneejit P . Human papillomavirus type 16 E7 oncoprotein mediates CCNA1 promoter methylation . Cancer Sci . 2015 ; 106 ( 10 ): 1333 – 40 . Epub 20150925. doi: 10.1111/cas.12761 . PubMed PMID: 26250467 . OpenUrl CrossRef PubMed 16. ↵ Sartor MA , Dolinoy DC , Jones TR , Colacino JA , Prince ME , Carey TE , et al. Genome-wide methylation and expression differences in HPV(+) and HPV(-) squamous cell carcinoma cell lines are consistent with divergent mechanisms of carcinogenesis . Epigenetics . 2011 ; 6 ( 6 ): 777 – 87 . Epub 20110601. doi: 10.4161/epi.6.6.16216 . PubMed PMID: 21613826 . OpenUrl CrossRef PubMed Web of Science 17. ↵ Lechner M , Fenton T , West J , Wilson G , Feber A , Henderson S , et al. Identification and functional validation of HPV-mediated hypermethylation in head and neck squamous cell carcinoma . Genome Med . 2013 ; 5 ( 2 ): 15 . Epub 20130205. doi: 10.1186/gm419 . PubMed PMID: 23419152 . OpenUrl CrossRef PubMed 18. ↵ Pentland L , Campos-Leon K , Cotic M , Davies K-J , Wood CD , Groves IJ , et al. Disruption of CTCF-YY1-dependent looping of the human papillomavirus genome activates differentiation-induced viral oncogene transcription . Plos Biology . 2018 ; 16 ( 10 ). doi: 10.1371/source.pbio.2005752 . PubMed PMID: WOS:000449322300007 . OpenUrl CrossRef PubMed 19. ↵ Paris C , Pentland I , Groves I , Roberts DC , Powis SJ , Coleman N , et al. CCCTC-binding factor recruitment to the early region of the human papillomavirus 18 genome regulates viral oncogene expression . J Virol . 2015 ; 89 ( 9 ): 4770 – 85 . doi: 10.1128/JVI.00097-15 . PubMed PMID: 25694598 . OpenUrl Abstract / FREE Full Text 20. ↵ Kandoth C , McLellan MD , Vandin F , Ye K , Niu B , Lu C , et al. Mutational landscape and significance across 12 major cancer types . Nature . 2013 ; 502 (7471):333-9. doi: 10.1038/nature12634 . PubMed PMID: 24132290 . OpenUrl CrossRef PubMed Web of Science 21. ↵ Filippova GN , Qi CF , Ulmer JE , Moore JM , Ward MD , Hu YJ , et al. Tumor-associated zinc finger mutations in the CTCF transcription factor selectively alter tts DNA-binding specificity . Cancer Res . 2002 ; 62 ( 1 ): 48 – 52 . PubMed PMID: 11782357 . OpenUrl Abstract / FREE Full Text 22. ↵ Stark B , Poon GMK , Wyrick JJ . CTCF puts a new twist on UV damage and repair in skin cancer . Mol Cell Oncol . 2021 ; 8 ( 6 ): 2009424 . Epub 20211206. doi: 10.1080/23723556.2021.2009424 . PubMed PMID: 35419468 . OpenUrl CrossRef PubMed 23. ↵ Lebeau B , Zhao K , Jangal M , Zhao T , Guerra M , Greenwood CMT , et al. Single base-pair resolution analysis of DNA binding motif with MoMotif reveals an oncogenic function of CTCF zinc-finger 1 mutation . Nucleic Acids Res . 2022 . Epub 20220810. doi: 10.1093/nar/gkac658 . PubMed PMID: 35947648 . OpenUrl CrossRef PubMed 24. ↵ Bailey CG , Gupta S , Metierre C , Amarasekera PMS , O’Young P , Kyaw W , et al. Structure-function relationships explain CTCF zinc finger mutation phenotypes in cancer . Cell Mol Life Sci . 2021 ; 78 ( 23 ): 7519 – 36 . Epub 20211016. doi: 10.1007/s00018-021-03946-z . PubMed PMID: 34657170 . OpenUrl CrossRef PubMed 25. ↵ Wilson R , Laimins LA . Differentiation of HPV-containing cells using organotypic “raft” culture or methylcellulose . Methods Mol Med . 2005 ; 119 : 157 – 69 . doi: 10.1385/1-59259-982-6:157 . PubMed PMID: 16350403 . OpenUrl CrossRef PubMed 26. ↵ Knight GL , Pugh AG , Yates E , Bell I , Wilson R , Moody CA , et al. A cyclin-binding motif in human papillomavirus type 18 (HPV18) E1^E4 is necessary for association with CDK-cyclin complexes and G2/M cell cycle arrest of keratinocytes, but is not required for differentiation-dependent viral genome amplification or L1 capsid protein expression . Virology . 2011 ; 412 ( 1 ): 196 – 210 . doi: 10.1016/j.virol.2011.01.007 . PubMed PMID: 21276999 . OpenUrl CrossRef PubMed 27. ↵ Marsh EK , Delury CP , Davies NJ , Weston CJ , Miah MAL , Banks L , et al. Mitotic control of human papillomavirus genome-containing cells is regulated by the function of the PDZ-binding motif of the E6 oncoprotein . Oncotarget . 2017 ; 8 ( 12 ): 19491 – 506 . doi: 10.18632/oncotarget.14469 . PubMed PMID: 28061478 . OpenUrl CrossRef PubMed 28. ↵ Delury CP , Marsh EK , James CD , Boon SS , Banks L , Knight GL , et al. The role of protein kinase A regulation of the E6 PDZ-binding domain during the differentiation-dependent life cycle of human papillomavirus type 18 . J Virol . 2013 ; 87 ( 17 ): 9463 – 72 . doi: 10.1128/JVI.01234-13 . PubMed PMID: 23804647 . OpenUrl Abstract / FREE Full Text 29. ↵ Wu Q , Liu P , Wang L . Many facades of CTCF unified by its coding for three-dimensional genome architecture . J Genet Genomics . 2020 ; 47 ( 8 ): 407 – 24 . Epub 2020/11/15. doi: 10.1016/j.jgg.2020.06.008 . PubMed PMID: 33187878 . OpenUrl CrossRef PubMed 30. ↵ Pentland I , Campos-Leon K , Cotic M , Davies KJ , Wood CD , Groves IJ , et al. Disruption of CTCF-YY1-dependent looping of the human papillomavirus genome activates differentiation-induced viral oncogene transcription . PLoS Biol . 2018 ; 16 ( 10 ): e2005752 . Epub 2018/10/26. doi: 10.1371/source.pbio.2005752 . PubMed PMID: 30359362 . OpenUrl CrossRef PubMed 31. ↵ Mehta K , Gunasekharan V , Satsuka A , Laimins LA . Human papillomaviruses activate and recruit SMC1 cohesin proteins for the differentiation-dependent life cycle through association with CTCF insulators . PLoS Pathog . 2015 ; 11 ( 4 ): e1004763 . doi: 10.1371/source.ppat.1004763 . PubMed PMID: 25875106 . OpenUrl CrossRef PubMed 32. ↵ Chen H , Tian Y , Shu W , Bo X , Wang S . Comprehensive identification and annotation of cell type-specific and ubiquitous CTCF-binding sites in the human genome . PLoS One . 2012 ; 7 ( 7 ): e41374 . doi: 10.1371/source.pone.0041374 . PubMed PMID: 22829947 . OpenUrl CrossRef PubMed 33. ↵ Zhao S , Allis CD , Wang GG . The language of chromatin modification in human cancers . Nat Rev Cancer . 2021 ; 21 ( 7 ): 413 – 30 . Epub 20210517. doi: 10.1038/s41568-021-00357-x . PubMed PMID: 34002060 . OpenUrl CrossRef PubMed 34. ↵ Nakahashi H , Kieffer Kwon KR , Resch W , Vian L , Dose M , Stavreva D , et al. A genome-wide map of CTCF multivalency redefines the CTCF code . Cell Rep . 2013 ; 3 ( 5 ): 1678 – 89 . Epub 20130523. doi: 10.1016/j.celrep.2013.04.024 . PubMed PMID: 23707059 . OpenUrl CrossRef PubMed Web of Science 35. ↵ Marina-Zarate E , Rodriguez-Ronchel A , Gomez MJ , Sanchez-Cabo F , Ramiro AR. Low-affinity CTCF binding drives transcriptional regulation whereas high-affinity binding encompasses architectural functions . iScience . 2023 ; 26 ( 3 ): 106106 . Epub 20230202. doi: 10.1016/j.isci.2023.106106 . PubMed PMID: 36852270 . OpenUrl CrossRef PubMed 36. ↵ Phillips S , Cassells K , Garland SM , Machalek DA , Roberts JM , Templeton DJ , et al. Gene methylation of CADM1 and MAL identified as a biomarker of high grade anal intraepithelial neoplasia . Sci Rep . 2022 ; 12 ( 1 ): 3565 . Epub 20220303. doi: 10.1038/s41598-022-07258-5 . PubMed PMID: 35241698 . OpenUrl CrossRef PubMed 37. ↵ Birknerova N , Kovarikova H , Baranova I , Prikrylova A , Laco J , Vosmikova H , et al. DNA hypermethylation of CADM1, PAX5, WT1, RARbeta, and PAX6 genes in oropharyngeal cancer associated with human papillomavirus . Epigenetics . 2022 : 1 – 10 . Epub 20220103. doi: 10.1080/15592294.2021.2018812 . PubMed PMID: 34974810 . OpenUrl CrossRef PubMed 38. ↵ van Baars R , van der Marel J , Snijders PJ , Rodriquez-Manfredi A , ter Harmsel B , van den Munckhof HA , et al. CADM1 and MAL methylation status in cervical scrapes is representative of the most severe underlying lesion in women with multiple cervical biopsies . Int J Cancer . 2016 ; 138 ( 2 ): 463 – 71 . Epub 20150814. doi: 10.1002/ijc.29706 . PubMed PMID: 26219541 . OpenUrl CrossRef PubMed 39. ↵ Wang H , Maurano MT , Qu H , Varley KE , Gertz J , Pauli F , et al. Widespread plasticity in CTCF occupancy linked to DNA methylation . Genome Res . 2012 ; 22 ( 9 ): 1680 – 8 . doi: 10.1101/gr.136101.111 . PubMed PMID: 22955980 . OpenUrl Abstract / FREE Full Text 40. ↵ Liu Y , Rosikiewicz W , Pan Z , Jillette N , Wang P , Taghbalout A , et al. DNA methylation-calling tools for Oxford Nanopore sequencing: a survey and human epigenome-wide evaluation . Genome Biol . 2021 ; 22 ( 1 ): 295 . Epub 20211018. doi: 10.1186/s13059-021-02510-z . PubMed PMID: 34663425 . OpenUrl CrossRef PubMed 41. ↵ Nees M , Geoghegan JM , Hyman T , Frank S , Miller L , Woodworth CD . Papillomavirus type 16 oncogenes downregulate expression of interferon-responsive genes and upregulate proliferation-associated and NF-kappaB-responsive genes in cervical keratinocytes . J Virol . 2001 ; 75 ( 9 ): 4283 – 96 . doi: 10.1128/JVI.75.9.4283-4296.2001 . PubMed PMID: 11287578 . OpenUrl Abstract / FREE Full Text 42. ↵ Pyeon D , Newton MA , Lambert PF , den Boon JA , Sengupta S , Marsit CJ , et al. Fundamental differences in cell cycle deregulation in human papillomavirus-positive and human papillomavirus-negative head/neck and cervical cancers . Cancer Res . 2007 ; 67 ( 10 ): 4605 – 19 . doi: 10.1158/0008-5472.CAN-06-3619 . PubMed PMID: 17510386 . OpenUrl Abstract / FREE Full Text 43. ↵ Karstensen B , Poppelreuther S , Bonin M , Walter M , Iftner T , Stubenrauch F . Gene expression profiles reveal an upregulation of E2F and downregulation of interferon targets by HPV18 but no changes between keratinocytes with integrated or episomal viral genomes . Virology . 2006 ; 353 ( 1 ): 200 – 9 . doi: 10.1016/j.virol.2006.05.030 . PubMed PMID: 16814354 . OpenUrl CrossRef PubMed 44. ↵ Bienkowska-Haba M , Luszczek W , Zwolinska K , Scott RS , Sapp M . Genome-Wide Transcriptome Analysis of Human Papillomavirus 16-Infected Primary Keratinocytes Reveals Subtle Perturbations Mostly due to E7 Protein Expression . J Virol . 2020 ; 94 ( 3 ). Epub 20200117. doi: 10.1128/JVI.01360-19 . PubMed PMID: 31748387 . OpenUrl Abstract / FREE Full Text 45. ↵ Garner-Hamrick PA , Fostel JM , Chien WM , Banerjee NS , Chow LT , Broker TR , et al. Global effects of human papillomavirus type 18 E6/E7 in an organotypic keratinocyte culture system . J Virol . 2004 ; 78 ( 17 ): 9041 – 50 . doi: 10.1128/JVI.78.17.9041-9050.2004 . PubMed PMID: 15308700 . OpenUrl Abstract / FREE Full Text 46. ↵ Del Moral-Morales A , Salgado-Albarran M , Sanchez-Perez Y , Wenke NK , Baumbach J , Soto-Reyes E . CTCF and Its Multi-Partner Network for Chromatin Regulation . Cells . 2023 ; 12 ( 10 ). Epub 20230510. doi: 10.3390/cells12101357 . PubMed PMID: 37408191 . OpenUrl CrossRef PubMed 47. ↵ Hnisz D , Weintraub AS , Day DS , Valton AL , Bak RO , Li CH , et al. Activation of proto-oncogenes by disruption of chromosome neighborhoods . Science . 2016 ; 351 ( 6280 ): 1454 – 8 . Epub 20160303. doi: 10.1126/science.aad9024 . PubMed PMID: 26940867 . OpenUrl Abstract / FREE Full Text 48. ↵ Monteagudo-Sanchez A , Noordermeer D , Greenberg MVC . The impact of DNA methylation on CTCF-mediated 3D genome organization . Nat Struct Mol Biol . 2024 ; 31 ( 3 ): 404 – 12 . Epub 20240318. doi: 10.1038/s41594-024-01241-6 . PubMed PMID: 38499830 . OpenUrl CrossRef PubMed 49. ↵ Kim MK , Lee IH , Lee KH , Lee YK , So KA , Hong SR , et al. DNA methylation in human papillomavirus-infected cervical cells is elevated in high-grade squamous intraepithelial lesions and cancer . J Gynecol Oncol . 2016 ; 27 ( 2 ): e14 . doi: 10.3802/jgo.2016.27.e14 . PubMed PMID: 26768780 . OpenUrl CrossRef PubMed 50. ↵ Blackledge NP , Zhou JC , Tolstorukov MY , Farcas AM , Park PJ , Klose RJ . CpG islands recruit a histone H3 lysine 36 demethylase . Mol Cell . 2010 ; 38 ( 2 ): 179 – 90 . doi: 10.1016/j.molcel.2010.04.009 . PubMed PMID: 20417597 . OpenUrl CrossRef PubMed Web of Science 51. ↵ Thomson JP , Skene PJ , Selfridge J , Clouaire T , Guy J , Webb S , et al. CpG islands influence chromatin structure via the CpG-binding protein Cfp1 . Nature . 2010 ; 464 ( 7291 ): 1082 – 6 . doi: 10.1038/nature08924 . PubMed PMID: 20393567 . OpenUrl CrossRef PubMed Web of Science 52. ↵ Schlesinger Y , Straussman R , Keshet I , Farkash S , Hecht M , Zimmerman J , et al. Polycomb-mediated methylation on Lys27 of histone H3 pre-marks genes for de novo methylation in cancer . Nat Genet . 2007 ; 39 ( 2 ): 232 – 6 . Epub 20061231. doi: 10.1038/ng1950 . PubMed PMID: 17200670 . OpenUrl CrossRef PubMed Web of Science 53. ↵ Wilson R , Ryan GB , Knight GL , Laimins LA , Roberts S . The full-length E1E4 protein of human papillomavirus type 18 modulates differentiation-dependent viral DNA amplification and late gene expression . Virology . 2007 ; 362 ( 2 ): 453 – 60 . doi: 10.1016/j.virol.2007.01.005 . PubMed PMID: 17303206 . OpenUrl CrossRef PubMed 54. ↵ Dobin A , Davis CA , Schlesinger F , Drenkow J , Zaleski C , Jha S , et al. STAR: ultrafast universal RNA-seq aligner . Bioinformatics . 2012 ; 29 ( 1 ): 15 – 21 . doi: 10.1093/bioinformatics/bts635 . OpenUrl CrossRef PubMed Web of Science 55. ↵ Love MI , Huber W , Anders S . Moderated estimation of fold change and dispersion for RNA-seq data with DESeq2 . Genome Biol . 2014 ; 15 ( 12 ): 550 . Epub 2014/12/18. doi: 10.1186/s13059-014-0550-8 . PubMed PMID: 25516281 . OpenUrl CrossRef PubMed 56. ↵ Luo W , Friedman MS , Shedden K , Hankenson KD , Woolf PJ . GAGE: generally applicable gene set enrichment for pathway analysis . BMC Bioinformatics . 2009 ; 10 : 161 . Epub 2009/05/29. doi: 10.1186/1471-2105-10-161 . PubMed PMID: 19473525 . OpenUrl CrossRef PubMed 57. ↵ Serviss JT , Gadin JR , Eriksson P , Folkersen L , Grander D . ClusterSignificance: a bioconductor package facilitating statistical analysis of class cluster separations in dimensionality reduced data . Bioinformatics . 2017 ; 33 ( 19 ): 3126 – 8 . Epub 2017/09/29. doi: 10.1093/bioinformatics/btx393 . PubMed PMID: 28957498 . OpenUrl CrossRef PubMed 58. ↵ Gunther T , Grundhoff A . The epigenetic landscape of latent Kaposi sarcoma-associated herpesvirus genomes . PLoS Pathog . 2010 ; 6 ( 6 ): e1000935 . Epub 2010/06/10. doi: 10.1371/source.ppat.1000935 . PubMed PMID: 20532208 . OpenUrl CrossRef PubMed 59. ↵ Gunther T , Frohlich J , Herrde C , Ohno S , Burkhardt L , Adler H , et al. A comparative epigenome analysis of gammaherpesviruses suggests cis-acting sequence features as critical mediators of rapid polycomb recruitment . PLoS Pathog . 2019 ; 15 ( 10 ): e1007838 . Epub 2019/11/02. doi: 10.1371/source.ppat.1007838 . PubMed PMID: 31671162 . OpenUrl CrossRef PubMed 60. ↵ Langmead B , Trapnell C , Pop M , Salzberg SL . Ultrafast and memory-efficient alignment of short DNA sequences to the human genome . Genome Biol . 2009 ; 10 ( 3 ): R25 . Epub 2009/03/06. doi: 10.1186/gb-2009-10-3-r25 . PubMed PMID: 19261174 . OpenUrl CrossRef PubMed 61. ↵ Zhang Y , Liu T , Meyer CA , Eeckhoute J , Johnson DS , Bernstein BE , et al. Model-based analysis of ChIP-Seq (MACS) . Genome Biol . 2008 ; 9 ( 9 ): R137 . Epub 20080917. doi: 10.1186/gb-2008-9-9-r137 . PubMed PMID: 18798982 . OpenUrl CrossRef PubMed 62. ↵ Stark R , Brown G . DiffBind differential binding analysis of ChIP-Seq peak data . In R package version . 2011 ; 100 . 63. ↵ Stark RB , G . DiffBind differential binding analysis of ChIP-Seq peak data . In R package version , 2011 . R package version 2011. 64. ↵ Shen L , Shao NY , Liu X , Maze I , Feng J , Nestler EJ . diffReps: detecting differential chromatin modification sites from ChIP-seq data with biological replicates . PLoS One . 2013 ; 8 ( 6 ): e65598 . Epub 20130610. doi: 10.1371/source.pone.0065598 . PubMed PMID: 23762400 . OpenUrl CrossRef PubMed 65. ↵ Lerdrup M , Johansen JV , Agrawal-Singh S , Hansen K . An interactive environment for agile analysis and visualization of ChIP-sequencing data . Nat Struct Mol Biol . 2016 ; 23 ( 4 ): 349 – 57 . Epub 20160229. doi: 10.1038/nsmb.3180 . PubMed PMID: 26926434 . OpenUrl CrossRef PubMed 66. ↵ Quinlan AR , Hall IM . BEDTools: a flexible suite of utilities for comparing genomic features . Bioinformatics . 2010 ; 26 ( 6 ): 841 – 2 . Epub 20100128. doi: 10.1093/bioinformatics/btq033 . PubMed PMID: 20110278 . OpenUrl CrossRef PubMed Web of Science 67. ↵ Krzywinski M , Schein J , Birol I , Connors J , Gascoyne R , Horsman D , et al. Circos: an information aesthetic for comparative genomics . Genome Res . 2009 ; 19 ( 9 ): 1639 – 45 . Epub 20090618. doi: 10.1101/gr.092759.109 . PubMed PMID: 19541911 . OpenUrl Abstract / FREE Full Text 68. ↵ Splinter E , de Wit E , van de Werken HJ , Klous P , de Laat W . Determining long-range chromatin interactions for selected genomic sites using 4C-seq technology: from fixation to computation . Methods . 2012 ; 58 ( 3 ): 221 – 30 . Epub 2012/05/23. doi: 10.1016/j.ymeth.2012.04.009 . PubMed PMID: 22609568 . OpenUrl CrossRef PubMed Web of Science 69. ↵ Wood CD , Veenstra H , Khasnis S , Gunnell A , Webb HM , Shannon-Lowe C , et al. MYC activation and BCL2L11 silencing by a tumour virus through the large-scale reconfiguration of enhancer-promoter hubs . Elife . 2016 ; 5 . Epub 2016/08/05. doi: 10.7554/eLife.18270 . PubMed PMID: 27490482 . OpenUrl CrossRef PubMed 70. ↵ Wingett S , Andrews S . FastQ Screen: A tool for multi-genome mapping and quality control [version 2; peer review: 4 approved] . F1000Research . 2018 ; 7 ( 1338 ). doi: 10.12688/f1000research.15931.2 . OpenUrl CrossRef PubMed 71. ↵ Martin M. Cutadapt removes adapter sequences from high-throughput sequencing reads . 2011 . 2011; 17 ( 1 ): 3 . Epub 2011-08-02. doi: 10.14806/ej.17.1.200 . OpenUrl CrossRef 72. ↵ Wingett S , Ewels P , Furlan-Magaril M , Nagano T , Schoenfelder S , Fraser P , et al. HiCUP: pipeline for mapping and processing Hi-C data [version 1; peer review: 2 approved, 1 approved with reservations] . F1000Research . 2015 ; 4 ( 1310 ). doi: 10.12688/f1000research.7334.1 . OpenUrl CrossRef PubMed 73. ↵ Schmidt D , Schwalie PC , Wilson MD , Ballester B , Goncalves A , Kutter C , et al. Waves of retrotransposon expansion remodel genome organization and CTCF binding in multiple mammalian lineages . Cell . 2012 ; 148 ( 1-2 ): 335 – 48 . doi: 10.1016/j.cell.2011.11.058 . PubMed PMID: 22244452 . OpenUrl CrossRef PubMed Web of Science View the discussion thread. Back to top Previous Next Posted August 16, 2024. Download PDF Email Thank you for your interest in spreading the word about bioRxiv. NOTE: Your email address is requested solely to identify you as the sender of this article. Your Email * Your Name * Send To * Enter multiple addresses on separate lines or separate them with commas. You are going to email the following Repression of CADM1 transcription by HPV type 18 is mediated by three-dimensional rearrangement of promoter-enhancer interactions Message Subject (Your Name) has forwarded a page to you from bioRxiv Message Body (Your Name) thought you would like to see this page from the bioRxiv website. Your Personal Message CAPTCHA This question is for testing whether or not you are a human visitor and to prevent automated spam submissions. Share Repression of CADM1 transcription by HPV type 18 is mediated by three-dimensional rearrangement of promoter-enhancer interactions Karen Campos-León , Jack Ferguson , Thomas Günther , C. David Wood , Steven W. Wingett , Selin Pekel , Christy S Varghese , Csilla Varnai , Michelle West , Andrew Beggs , Adam Grundhoff , Boris Noyvert , Sally Roberts , Joanna L Parish bioRxiv 2024.08.16.608206; doi: https://doi.org/10.1101/2024.08.16.608206 Share This Article: Copy Citation Tools Repression of CADM1 transcription by HPV type 18 is mediated by three-dimensional rearrangement of promoter-enhancer interactions Karen Campos-León , Jack Ferguson , Thomas Günther , C. David Wood , Steven W. Wingett , Selin Pekel , Christy S Varghese , Csilla Varnai , Michelle West , Andrew Beggs , Adam Grundhoff , Boris Noyvert , Sally Roberts , Joanna L Parish bioRxiv 2024.08.16.608206; doi: https://doi.org/10.1101/2024.08.16.608206 Citation Manager Formats BibTeX Bookends EasyBib EndNote (tagged) EndNote 8 (xml) Medlars Mendeley Papers RefWorks Tagged Ref Manager RIS Zotero Tweet Widget Facebook Like Google Plus One Subject Area Microbiology Subject Areas All Articles Animal Behavior and Cognition (7644) Biochemistry (17726) Bioengineering (13916) Bioinformatics (42033) Biophysics (21486) Cancer Biology (18635) Cell Biology (25549) Clinical Trials (138) Developmental Biology (13397) Ecology (19940) Epidemiology (2067) Evolutionary Biology (24361) Genetics (15620) Genomics (22541) Immunology (17763) Microbiology (40468) Molecular Biology (17207) Neuroscience (88739) Paleontology (667) Pathology (2842) Pharmacology and Toxicology (4834) Physiology (7659) Plant Biology (15175) Scientific Communication and Education (2047) Synthetic Biology (4304) Systems Biology (9834) Zoology (2272)

Text is read by the "Ask this paper" AI Q&A widget below. Extraction quality varies by source — PMC NXML preserves structure cleanly, OA-HTML may include some navigation residue, and OA-PDF can have broken hyphenation. The publisher copy (via DOI) is the canonical version.

My notes (saved in your browser only)

Ask this paper AI returns verbatim quotes from the full text · source: preprint-html

Answers must be backed by verbatim quotes from this paper's full text. Hallucinated quotes are dropped automatically; if no verbatim passage answers the question, we say so. How this works

Citation neighborhood (no data yet)

We don't have any in-corpus citations linked to this paper yet. This is a recent paper (2024) — citers typically take a year or two to land, and the OpenAlex reference graph may still be filling in.

Source provenance

europepmc
last seen: 2026-05-20T01:45:00.602351+00:00