Identification of a terpene synthase arsenal using long-read sequencing and genome assembly ofAspergillus wentii

preprint OA: closed
📄 Open PDF Full text JSON View at publisher
Full text 58,800 characters · extracted from preprint-html · click to expand
Identification of a terpene synthase arsenal using long-read sequencing and genome assembly of Aspergillus wentii | bioRxiv /* */ /* */ <!-- <!-- /*! * yepnope1.5.4 * (c) WTFPL, GPLv2 */ (function(a,b,c){function d(a){return"[object Function]"==o.call(a)}function e(a){return"string"==typeof a}function f(){}function g(a){return!a||"loaded"==a||"complete"==a||"uninitialized"==a}function h(){var a=p.shift();q=1,a?a.t?m(function(){("c"==a.t?B.injectCss:B.injectJs)(a.s,0,a.a,a.x,a.e,1)},0):(a(),h()):q=0}function i(a,c,d,e,f,i,j){function k(b){if(!o&&g(l.readyState)&&(u.r=o=1,!q&&h(),l.onload=l.onreadystatechange=null,b)){"img"!=a&&m(function(){t.removeChild(l)},50);for(var d in y[c])y[c].hasOwnProperty(d)&&y[c][d].onload()}}var j=j||B.errorTimeout,l=b.createElement(a),o=0,r=0,u={t:d,s:c,e:f,a:i,x:j};1===y[c]&&(r=1,y[c]=[]),"object"==a?l.data=c:(l.src=c,l.type=a),l.width=l.height="0",l.onerror=l.onload=l.onreadystatechange=function(){k.call(this,r)},p.splice(e,0,u),"img"!=a&&(r||2===y[c]?(t.insertBefore(l,s?null:n),m(k,j)):y[c].push(l))}function j(a,b,c,d,f){return q=0,b=b||"j",e(a)?i("c"==b?v:u,a,b,this.i++,c,d,f):(p.splice(this.i++,0,a),1==p.length&&h()),this}function k(){var a=B;return a.loader={load:j,i:0},a}var l=b.documentElement,m=a.setTimeout,n=b.getElementsByTagName("script")[0],o={}.toString,p=[],q=0,r="MozAppearance"in l.style,s=r&&!!b.createRange().compareNode,t=s?l:n.parentNode,l=a.opera&&"[object Opera]"==o.call(a.opera),l=!!b.attachEvent&&!l,u=r?"object":l?"script":"img",v=l?"script":u,w=Array.isArray||function(a){return"[object Array]"==o.call(a)},x=[],y={},z={timeout:function(a,b){return b.length&&(a.timeout=b[0]),a}},A,B;B=function(a){function b(a){var a=a.split("!"),b=x.length,c=a.pop(),d=a.length,c={url:c,origUrl:c,prefixes:a},e,f,g;for(f=0;f<d;f++)g=a[f].split("="),(e=z[g.shift()])&&(c=e(c,g));for(f=0;f<b;f++)c=x[f](c);return c}function g(a,e,f,g,h){var i=b(a),j=i.autoCallback;i.url.split(".").pop().split("?").shift(),i.bypass||(e&&(e=d(e)?e:e[a]||e[g]||e[a.split("/").pop().split("?")[0]]),i.instead?i.instead(a,e,f,g,h):(y[i.url]?i.noexec=!0:y[i.url]=1,f.load(i.url,i.forceCSS||!i.forceJS&&"css"==i.url.split(".").pop().split("?").shift()?"c":c,i.noexec,i.attrs,i.timeout),(d(e)||d(j))&&f.load(function(){k(),e&&e(i.origUrl,h,g),j&&j(i.origUrl,h,g),y[i.url]=2})))}function h(a,b){function c(a,c){if(a){if(e(a))c||(j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}),g(a,j,b,0,h);else if(Object(a)===a)for(n in m=function(){var b=0,c;for(c in a)a.hasOwnProperty(c)&&b++;return b}(),a)a.hasOwnProperty(n)&&(!c&&!--m&&(d(j)?j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}:j[n]=function(a){return function(){var b=[].slice.call(arguments);a&&a.apply(this,b),l()}}(k[n])),g(a[n],j,b,n,h))}else!c&&l()}var h=!!a.test,i=a.load||a.both,j=a.callback||f,k=j,l=a.complete||f,m,n;c(h?a.yep:a.nope,!!i),i&&c(i)}var i,j,l=this.yepnope.loader;if(e(a))g(a,0,l,0);else if(w(a))for(i=0;i (function(w,d,s,l,i){w[l]=w[l]||[];w[l].push({'gtm.start':new Date().getTime(),event:'gtm.js'});var f=d.getElementsByTagName(s)[0];var j=d.createElement(s);var dl=l!='dataLayer'?'&l='+l:'';j.src='//www.googletagmanager.com/gtm.js?id='+i+dl;j.type='text/javascript';j.async=true;f.parentNode.insertBefore(j,f);})(window,document,'script','dataLayer','GTM-M677548'); Skip to main content Home About Submit ALERTS / RSS Search for this keyword Advanced Search New Results Identification of a terpene synthase arsenal using long-read sequencing and genome assembly of Aspergillus wentii Richard Olumakaiye , View ORCID Profile Christophe Corre , View ORCID Profile Fabrizio Alberti doi: https://doi.org/10.1101/2024.09.23.614465 Richard Olumakaiye 1 School of Life Sciences, University of Warwick , Coventry, CV4 7AL, UK Find this author on Google Scholar Find this author on PubMed Search for this author on this site Christophe Corre 1 School of Life Sciences, University of Warwick , Coventry, CV4 7AL, UK 2 Department of Chemistry, University of Warwick , Coventry, CV4 7AL, UK Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Christophe Corre Fabrizio Alberti 1 School of Life Sciences, University of Warwick , Coventry, CV4 7AL, UK Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Fabrizio Alberti For correspondence: F.Alberti{at}warwick.ac.uk Abstract Full Text Info/History Metrics Supplementary material Preview PDF ABSTRACT Fungi are talented producers of secondary metabolites with applications in the pharmaceutical and agrochemical sectors. Aspergillus wentii CBS 141173 has gathered research interest due to its ability to produce high-value norditerpenoid compounds, including anticancer molecules. In this study, we aimed to expand the genomic information available for A. wentii to facilitate the identification of terpenoid biosynthetic genes that may be involved in the production of bioactive molecules. Long-read genome sequencing of Aspergillus wentii CBS 141173 was conducted using Oxford Nanopore Technologies (ONT) MinION MK1C. In addition, paired-end stranded RNA-seq data from two time points, 7 days and 30 days, was used for functional annotation of the assembled genome. Overall, we assembled a genome of approximately 31.2 Mb and identified 66 biosynthetic gene clusters from the annotated genome. Metabolic extracts of A. wentii were analysed and the production of the bioactive terpenoid asperolide A was confirmed. We further mined the assembled and annotated genome for BGCs involved in terpenoid pathways using a combination of antiSMASH and local BlastP and identified 16 terpene synthases. Phylogenetic analysis was conducted and allowed us to establish relationships with other characterised terpene synthases. We identified two terpene clusters potentially involved in pimarane-like diterpenoid biosynthesis. Finally, the analysis of the 16 terpene synthases in our 7-day and 30-day transcriptomic data suggested that only four of them were constitutively expressed under laboratory conditions. These results provide a scaffold for the future exploration of terpenoid biosynthetic pathways for bioactive molecules in A. wentii . The terpenoid clusters identified in this study are candidates for heterologous gene expression and/or gene disruption experiments. The description and availability of the long-read genome assembly of A. wentii CBS 141173 further provides the basis for downstream genome analysis and biotechnological exploitation of this species. BACKGROUND Aspergillus is one of the best studied genera of filamentous fungi, largely because of the medical and industrial relevance of some of its species. Their ubiquitous nature enables them to perform roles as saprophytes, parasites and endophytic symbionts with other entities in the environment, arguably inspiring the diverse secondary metabolic pathways exhibited by these organisms that range from toxins to antimicrobial molecules [ 1 ]. These secondary metabolites can be classified into various groups such as polyketides, terpenoids, peptides, alkaloids and meroterpenoids, which have raised pharmaceutical and agrochemical interests for human use. A noteworthy example is the cholesterol-lowering agent lovastatin produced by Aspergillus terreus [ 2 ]. For context, in the past 40 years, natural products and their derivatives from living organisms have accounted for 32% of the total small molecule drugs approved by the U.S. Food and Drug Administration with major impact as anticancer and antibacterial preparations [ 3 ]. Within the Aspergillus genus, Aspergillus wentii is known to produce a plethora of bioactive molecules, including 97 reported compounds that include terpenoids, anthraquinones and xanthones [ 4 ]. To understand and exploit the biosynthesis of bioactive molecules, genome sequencing is essential. The genome sequence of Aspergillus wentii CBS 141173 was first reported in 2017, as part of a study conducted by a global consortium of mycologists to provide better genomic coverage for the genus Aspergillus [ 5 ]. However, only short-read sequencing was employed in this case. In the present study, we explored Aspergillus wentii CBS 141173, a commonly found fungus in terrestrial, marine and endophytic environments and a talented producer of small molecules. This strain is a promising reservoir of a specific group of natural products with valuable biological potentials for application in medicine known as norditepenoid dilactones, which include asperolide A, wentilactone A and B ( Figure 1 ) [ 6 , 7 ]. They belong to a family of diterpenoids that includes tetranorlabdane, podolactone, aromatic norditerpenes, and isopimarane. Most importantly, wentilactone A has been reported to exert a significantly selective toxicity by its inhibitory effect on lung carcinoma cell lines [ 8 ]. A recent review by Ainousah et al . extensively discussed A. wentii , highlighting the terpenoids produced by this organism [ 4 ]. This group of compounds displayed various biological properties including in vitro and in vivo antifungal, cytotoxic, herbicidal, and plant-growth-regulating activity. Download figure Open in new tab Figure 1: Examples of natural products reported from Aspergillus wentii . Fungal terpenoid natural products are derived from the common five-carbon isoprene units isopentenyl diphosphate (IPP) and dimethylallyl diphosphate (DMAPP), which are synthesized from the mevalonate (MVA) pathway [ 9 ]. These isoprene units can be joined together to form various terpenoid scaffolds by the catalytic activity of terpene synthases; geranyl pyrophosphate (GPP) synthase, farnesyl pyrophosphate (FFP) synthase and geranyl geranyl pyrophosphate (GGPP) synthase leading to monoterpenes (C10), sesquiterpenes (C15) and diterpenes (C20), respectively [ 10 ]. It has been proposed that the family of norditerpenoids could derive from the removal of four methylene groups from a C20 diterpenoid, therefore producing a C16 molecule [ 11 ]. Clustering of genes that collaborate towards biosynthesis of secondary metabolites is a genomic phenomenon that has been widely recognised [ 12 ]. They are often described as biosynthetic gene clusters (BGCs) and have greatly aided researchers in characterising and even directing biosynthesis of the corresponding metabolite [ 13 ]. BGCs can be searched for within assembled genomes using a range of bioinformatics tools such as antiSMASH [ 14 ], cblaster [ 15 ] and local Blast searches. In the present work, we aimed to complement the existing short-read genome assembly of A. wentii CBS 141173 published by de Vries et al . [ 5 ], with a nanopore long-read assembly and functional annotation framework of paired-end stranded RNA-seq data. The newly annotated genome and transcriptomic data will aid the elucidation of the terpene synthase biosynthetic gene clusters that could putatively be involved in the production of norditerpenoid lactone secondary metabolites and in the characterisation of other cryptic BGCs present within the genome. MATERIALS AND METHODS Fungal strain Aspergillus wentii CBS 141173 was obtained from CBS-KNAW, Fungal Biodiversity Centre, Westerdijk, Netherlands. The strain was grown and maintained on Potato Dextrose Agar (PDA, 20 g/L glucose, 4 g/L potato extract, 20 g/L agar) plates and Potato Dextrose Broth (PDB, 20 g/L glucose, 4 g/L potato extract). Genomic DNA extraction A. wentii CBS 141173 cultures were grown on 25 mL PDB within 250 mL conical flasks, using agar plugs from PDA plates containing the fungus as the inoculum. The flasks were incubated for 72 hours, at 25°C, shaking at 200 rpm. Fungal mycelia were pelleted from the broth via centrifugation at 8,000 g for five minutes, the pellet was subsequently washed twice with distilled water to remove residual media. High Molecular Weight (HMW) genomic DNA extraction was carried out with via cryogenic grinding with liquid nitrogen, and a sterile mortar and pestle. 1 g of fresh mycelia was grinded into a fine powder. 200 mg of the powder were transferred aseptically into a microcentrifuge tube. For genomic DNA extraction, GenElute™ Plant Genomic DNA Miniprep Kit (Sigma-Aldrich) was used, following the manufacturer’s protocol. Extracted genomic DNA was further concentrated by ethanol precipitation. Briefly, 1/10 volume of 3 M sodium acetate, pH 5.2, was added to the eluted gDNA, followed by three volumes of 100% ethanol. The samples were mixed by gentle inversion and stored at −20 °C overnight, then spun at 14,000 g for 30 minutes at 4°C. The supernatant was decanted, the DNA pellet was air dried and resuspended in nuclease free water (ThermoFisher). To ascertain the quality and concentration of extracted genomic DNA, gel electrophoresis (1% w/v agarose gel with 1 x GelRed), Nanodrop ND 1000 (Thermo Fisher, USA), and Qubit (dsDNA Broad range assay, Invitrogen) were used. RNA extraction and sequencing A. wentii CBS 141173 total RNA was extracted using Plant/Fungi total RNA purification kit (Norgen Biotek) following the manufacturer’s instructions, based on column purification technology. An agar plug of growing mycelium was taken from a PDA plate and used to inoculate 50 mL of PDB in a 250 mL flask. Collection of the mycelia at two timepoints was performed, after 7 days and 30 days of growth, respectively, at 25°c with shaking at 200 rpm. The mycelium was harvested by centrifugation at 7,000 x g for 3 minutes, supernatant discarded, and 1 g of mycelium was grinded into a fine powder in liquid nitrogen using sterile mortar and pestle in an RNAse decontaminated environment. Using a sterile inoculation loop, 100 mg of the fine powder were transferred into a sterile 1.5 ml microcentrifuge tube and kept on dry ice. The RNA extraction and DNAse treatment were performed following the manufacturer’s instruction. The purified RNA was visualised on a 1% w/v agarose gel with 1x GelRed to assess integrity. Quantification of the RNA and purity checks were conducted with Nanodrop ND 1000 (Thermo Fisher). The RNA was sequenced with Illumina paired-end (2×150 bp) technology on a HiSeq 2500 platform (Azenta Life Sciences). Genome sequencing The genome of A. wentii was sequenced with Oxford Nanopore Technology (ONT)(16). The manufacturer’s protocol for the Ligation sequencing kit (SQK-LSK109) was followed with minor modifications introduced for DNA repair and end-prep stage by increasing the incubation time and temperature after washing with ethanol to 15 minutes at 37°C. To enrich DNA fragments of 3 kb or longer, the Long Fragment Buffer was used for the DNA clean-up. Noteworthy, 1.2 µg of genomic DNA was used for the library preparation, resulting in a final amount of 345 ng of DNA at the end of the adapter ligation and clean-up step. Nanopore sequencing was performed on a MinION MK1C Platform with a FLO-MIN-106 R9.4 flow-cell and run for 18 hours. Genome assembly De novo strategies were utilised for the fungal genome assembly. Utilizing the default parameters, raw data from the MinION MK1c output .fastq files were transferred and merged into one single .fastq file and inputted into Flye version 2.8.2 using default settings and the nano-raw mode, to create a draft genome assembly. Polishing of this draft assembly was done by aligning the merged .fastq file that was inputted into Flye against the draft genome using Minimap2 version 2.11, errors could then be corrected using Racon version 1.4.20 [ 17 ]. The settings used in Racon were as follows: a value of 8 for matching bases, −6 for mismatches, −8 for gaps, and a window size of 500. Polishing using this procedure was performed three times. The third Racon polished assembly was then inputted into Medaka version 1.2.1 ( https://github.com/nanoporetech/medaka ) using model r941_min_high_g360 and default settings creating a consensus fasta file. Polishing was then performed on the consensus file generated by medaka using Pilon version 1.24 [ 18 ] and its default settings. The output from Pilon was polished again, this was repeated until Pilon had been run four times. For the polished genome evaluation, Benchmarking Universal Single-Copy Orthologs (BUSCO) version 5.6.1 was used with eurotiales_odb10 database with the default genome mode settings [ 19 ]. Genome annotation Functional annotation was done using the Funannotate version 1.8.17 pipeline [ 20 ], utilizing a “gold standard” annotation framework of paired-end stranded RNA-seq data from two time points, 7 days and 30 days coupled with a genome assembly built from a de novo strategy, following the Funannotate user instructions of clean-sort-mask. The following step of Funannotate training involved the introduction of RNA sequencing data, using downstream commands Funannotate predict and Funannotate update. Results generated were then run through antiSMASH v7.1.0 [ 14 ] within the Funannotate pipeline. The final prediction was run on BUSCO [ 19 ] to provide quality check on the predicted proteins generated, once again using the eurotialales_odb10 database. All parameters not mentioned above were left on their default setting, unless stated otherwise. The annotated genome of A. wentii CBS 141173 was further analysed by running EggNOG-mapper v2.1.12 [ 21 ] and programs that are part of the GenomeTools 1.6.1 package [ 22 ]. Fungal metabolite extraction A. wentii CBS 141173 was cultured on PDA plates at 28°C for 10 days and then agar plus were used to inoculate 100 mL of PDB medium in 500 mL flasks, which were grown for 30 days at 25 °C, shaking at 200 rpm. The culture was then homogenised by TissueRuptor (Qiagen) to a fine consistent paste. The blended mix was acidified with concentrated hydrochloric acid to pH= 3. Thereafter, it was twice extracted with ethyl acetate with a ratio of 1:1 v/v. The organic phases resulting from the two extractions were pooled, dried with addition of an excess of MgSO 4 , filtered and evaporated in vacuo . The resulting residues were dissolved in high-performance liquid chromatography (HPLC)-grade methanol, spin-filtered, transferred to amber glass 11 mm vials and analysed by Ultra-high performance Liquid Chromatography-High-Resolution Mass Spectrometry (UHPLC-HRMS). UHPLC-HRMS Analysis UHPLC-HRMS analyses were carried out on 5 μL of prepared extracts injected through a reverse phase column using an UHPLC-HRMS Agilent ZORBAX Eclipse Plus column C18, 4.6 × 150 mm 40 (particle size 5 μm) on a Dionex 3000RS UHPLC coupled to a Bruker Ultra High Resolution (UHR) Q-TOF MS MaXis II mass spectrometer with an electrospray source. Sodium formate (10 mM) was utilised for internal calibrations, with a gradient elution from 95 : 5 solvent A/solvent B to 0 : 100 solvent A/solvent B in 35 minutes, with solvent A being water (0.1% formic acid) and solvent B acetonitrile (0.1% formic acid). Identification of terpene synthases The long-read genome assembly of A. wentii incorporating full length transcriptomic RNA-seq data was used in this study. This allowed the identification of putative terpene synthase (TS) gene family based on antiSMASH predictions and local BlastP analysis using as a query TS genes from NCBI GenBank ( https://www.ncbi.nlm.nih.gov/genbank/ ) and UniProt ( https://www.uniprot.org/ ). Phylogenetic analysis Multiple sequence alignments of protein sequences of mined TSs and their homologues from other organisms were conducted using MUSCLE in MEGA11.0 using default settings. The obtained alignment was used as the input for the Maximum Likelihood tree algorithm in MEGA11.0 software to construct a phylogenetic tree [ 23 ]. Visualisation was conducted using iTOL: Interactive Tree Of Life web viewer https://itol.embl.de/ . RESULTS Genomic DNA and total RNA extraction High molecular weight (HMW) genomic DNA of Aspergillus wentii was sequenced using Oxford nanopore long-read whole-genome sequencing. HMW genomic DNA extraction was performed on A. wentii in duplicate (Supplementary Figure 1). The extracted genomic DNA was further subjected to ethanol precipitation and resuspended in 35 µL of nuclease-free water leading to an improved concentration of both samples (Supplementary Table 1). Fungal total RNA was extracted in duplicate from A. wentii liquid cultures at two time points, 7 days and 30 days, and sequenced using Illumina paired-end (2×150 bp) sequencing. The number of RNA-seq reads obtained for each sample is shown in Supplementary Table 2. Genome assembly and analysis The nanopore sequencing generated a significant quantity of long-read data with a high degree of coverage of over 100x. The large coverage of the long-read nanopore sequencing allowed for a robust first draft genome to be created, with only few fragments. To improve the annotation framework, we included paired-end RNA-seq data from two time points, which is known to lead to a high-quality annotation facilitated by Funannotate 1.8.17 [ 20 ]. The final draft genome size for the organism was 31.2 Mb. This is consistent with the size of other Aspergilli genome assemblies which tend to be 31–40 Mb in size [ 5 , 24 ]. The full genome statistics ( Table 1 ), were generated with genometools [ 22 ]. Briefly, the genome comprised 8 contigs, 7 of which may be putatively assembled at the chromosome level and 1 being putatively mitochondrial View this table: View inline View popup Download powerpoint Table 1: Genome statistics and predicted features of the nanopore assembled genome of Aspergillus wentii CBS 141173. DNA. The genome has a 47.2% GC content, N50 length of 4,417,627 bp, with the longest contig being 7,905,159 bp and the average gene length being 1,365 bp. A total of 12,925 genes and 187 tRNAs were predicted from the genome. While the gene function of the predicted genes in genomes was assigned using Funannotate, the predicted proteome was run again through Eggnog-mapper v2.1.4-2 [ 21 ]. This yielded a prediction of 10,592 proteins. Supplementary Figure 2 shows how through eggnog-mapper we were able to assign gene ontology terms to the genome including matches to multiple KEGG databases, and BRITE hierarchies. Additionally, predicted proteins were matched to the Carbohydrate Active enZymes (CAZymes) CAZy database and a total number of 1,615 genes were predicted to be CAZy. Noteworthy, >85% of genes in the genome were matched to proteins in the pfam database. All data generated using eggnog mapper are available in the Supplementary Dataset 1. From the predicted proteins from eggnog-mapper, 85.7% Clusters of Orthologous Groups (COG) categories were assigned. The distribution of the predicted proteins across the COG categories is shown in Supplementary Figure 3. The most frequently mapped category was “Function Unknown”. Of those that could be placed into a category of known function, the five most common in order of decreasing predicted protein count within the categories were “Intracellular trafficking, secretion, and vesicular transport”, “Amino acid transport and metabolism”, “Secondary metabolite biosynthesis, transport and catabolism”, “Posttranslational modification, protein turnover, chaperones”, and “Carbohydrate transport and metabolism”. The presence of over 575 proteins associated with secondary metabolites in the genome is promising and these deserve further examinations, particularly in the context of the high value terpenoids such as wentilactones, and asperolides known to be produced by Aspergillus wentii . It is also interesting that no mobilome elements associated with transposons and prophages were detected, and less than 100 predicted proteins were identified in the genome that were associated with any of the following categories: “Extracellular structures”, “Cell motility”, “Nuclear structure”, and “Defence mechanisms”. Finally, BUSCO was used to assess the completeness of the genome assembly and annotation using the Eurotiales odb10, and suggested a complete annotation set with a 94.8% genome BUSCO score and a 95.3% protein BUSCO score, respectively (Supplementary Table 3). Biosynthetic gene clusters analysis The whole genome sequence of Aspergillus wentii produced in this study, as well as the one produced previously through short-read sequencing [ 5 ] were mined for putative biosynthetic gene clusters (BGCs) using antiSMASH [ 14 ]. A total number of 66 BGCs were identified from the sequenced genome (Supplementary Dataset 2). This is an improvement compared to 50 BGCs identified from the genome previously deposited to NCBI and JGI ( Table 2 ). From the present study, 19 non-ribosomal peptide synthetases (NRPS) BGCs were found to be the most abundant in the genome, followed by polyketide synthases (PKS) and terpene BGCs. View this table: View inline View popup Download powerpoint Table 2: Comparative antiSMASH analysis of predicted BGCs from the two Aspergillus wentii CBS 141173 genome assemblies. Comparative genomics To further analyse the biosynthetic capabilities of Aspergillus genomes, a BGC comparative analysis was conducted using the BGC identification defined by antiSMASH ( Figure 2 ). Across the set genomes used for this analysis, it is noteworthy that Aspergillus parasiticus contained the highest number of BGCs - 77. Interestingly, the highest number of putative terpene BGCs - 13 - was found in the long-read assembly of A. wentii , followed by A. felis and A. nidulans with 11 and 10, respectively. NRPS and PKS BGCs were altogether the most dominant class across the Aspergilli genomes. For instance, 26 NRPS clusters were identified from both A. flavus and A. parasiticus . Our long-read assembly of A. wentii recorded a high number of polyketide BGCs - 16 - while the highest was 17 from the A. parasiticus genome. There is a vast resource of fungal genomes to always inspire BGCs comparative studies, notwithstanding, our BGC analysis shows that the long-read assembly of A. wentii CBS41173 is consistent with other Aspergillus genomes in its capacity to produce diverse natural products. Download figure Open in new tab Figure 2: Comparison of the BGCs found in selected Aspergillus genomes. The number of BGCs from the sequenced A. wentii fungal strain was compared to the number of BGCs from other members of the Aspergillus genus as predicted by antiSMASH. This revealed that the fungal strain characterised in this study has the potential to produce terpenoids, polyketides and NRPs in line with other members of the genus. Production of asperolide A UHPLC-HRMS was used to analyse metabolite extracts from A. wentii CBS 141173. Asperolide A was detected from the metabolic extracts on the basis of the calculated m/z 289.1076 [M+H] + for asperolide A. Extracted ion chromatogram of the HRMS data showed a dominant ion peak at m/z 289.1072 ( Figure 3 ) and the molecular formula was predicted as C 16 H 16 O 5 , confirming the production of the norditerpenoid compound. Speculatively, asperolide A might be the main norditerpenoid produced by A. wentii CBS 141173 at the 30-day time point analysed under laboratory conditions. Download figure Open in new tab Figure 3: UHPLC-HRMS detection of asperolide A. A ) Extracted ion chromatogram in positive mode for m/z = 289.1076 is shown, highlighting accumulation of asperolide A in A. wentii (trace in blue) and not in the culture medium control (trace in grey). B ) Mass spectrum of asperolide A (M= C 16 H 16 O 5 ); m/z expected for [M + H] + = 289.1076, for [M + Na] + = 311.0895. Terpene synthases from Aspergillus wentii CBS 141173 To identify putative terpene synthases that could be involved in the production of terpenoids in A. wentii, we utilised two strategies, antiSMASH and local BlastP analysis. Noteworthy, from the 13 putative terpenoid clusters identified by antiSMASH, we shortlisted 10 (AwTS1 – AwTS10), based on their protein blast (BlastP) homology with other known TSs from the UniProt database ( Table 3 ). Using a manual BlastP analysis of the Aspergillus wentii BGCs on antiSMASH, we also recruited additional terpene synthases (AwTS11 – AwTS14) found within other BGCs such as polyketide and NRPS clusters. Finally, a local BlastP search using geranylgeranyl pyrophosphate synthase as a query allowed us to identify pimarane/pimaradiene-like synthases (AwTS15, AwTS16) from the genome assembly. View this table: View inline View popup Download powerpoint Table 3: BlastP analysis of terpene synthases from Aspergillus wentii CBS 141173 genome. Terpene biosynthetic gene clusters To understand the genetic context of the terpene synthases identified, we analysed the flanking regions of each of the terpene synthase genes. Full descriptions of the gene clusters can be found in Supplementary Dataset 3. Worth highlighting is that the AwTS15 and AwTS16 terpene clusters are predicted to encode a pimarane/pimaradiene diterpenoid scaffold. For the AwTS15 BGC ( Figure 4A ), BlastP analysis shows the presence of primary metabolic enzymes such as the HMG-CoA involved in the mevalonate pathway that may be involved in the biosynthesis of geranylgeranyl pyrophosphate to make a diterpenoid compound. The additional presence of multifunctional biosynthetic enzymes such as oxidoreductase and a cytochrome P450 in the cluster could potentially be involved in the maturation of the diterpenoid scaffold. Also, for the AwTS16 BGC ( Figure 4B ), the presence of three cytochrome P450s and other tailoring enzymes makes it a candidate cluster for the production of pimarane-like diterpenoids biosynthesis in A. wentii . Other notable terpenoid clusters found in the genome include the AwTS1 triterpenoid cluster ( Figure 4C ) and AwTS13 hybrid terpene cluster with an NRPS biosynthetic origin ( Figure 4D ). Experimental characterisation will be vital to elucidate the resulting biosynthetic products. Download figure Open in new tab Figure 4: Diversity of the terpenoid biosynthetic gene clusters from A. wentii CBS 141173. A ) AwTS15 diterpenoid gene cluster. B ) AwTS16 diterpenoid gene cluster. C ) AwTS1 triterpenoid gene cluster, D ) AwTS13 hybrid terpene-NRPS biosynthetic gene cluster. Terpene Phylogeny To further investigate the role of the terpenoid genes from Aspergillus wentii in making terpenoid compounds, a phylogenetic assessment was also conducted using 55 TS proteins, comprising the 16 identified AwTSs from Aspergillus wentii ( Table 3 ), and 39 characterised TSs from other fungal species (Supplementary Dataset 4). These terpene synthases were grouped into subfamilies (TFa-TFj) based on their putative role in terpenoids biosynthesis such as diterpenoid pyrones, tricyclic diterpenoids, and mixed terpenoids ( Figure 5 ). Download figure Open in new tab Figure 5: Phylogenetic analysis of Aspergillus wentii CBS 141173 terpene synthases (AwTS), based on their predicted protein sequences. The Maximum Likelihood algorithm tree was generated from an alignment of 55 TS proteins, comprising 16 AwTS and another 39 characterised TSs from different fungal species. Sections are identified by colours. The names of the sections are indicated as TF-a : Tricyclic diterpenoids, TF-b : Mixed diterpenoids, TF-c : Diterpenoid pyrones, TF-d : Mixed sesquiterpenoids, TF-e : Sesterterpenoids, TF-f : α-humulene based terpenoids, TF-g : Indole diterpenoids, TF-h : Squalenes, TF-i: Diterpenoids, TF-j: Lanosterol transferases. From the phylogeny analysis, the A. wentii terpene synthases appeared to be very diverse and share similarities with some bifunctional cyclases (TF-a, and TF-f) such as those that could encode for terpenoid scaffolds such as monocyclic humulene-like compounds and tricyclic diterpenoids, respectively. Additionally, we observed relationships between AwTS6, -11, -12 and -13 and terpene synthases involved in mixed biosynthetic pathways (TF-b and TF-d) ( Figure 5 ). AwTS2 and AwTS9 fell into the TF-i subfamily, revealing their relationship with other diterpenoid synthases. The AwTSs in the TF-h section are putative triterpenoid synthases and distinctly AwTS10 belong to the lanosterol transferase category. Interestingly none of the AwTS belonged to the subfamilies of diterpenoid pyrone, sesterterpenoid and indole diterpenoids. Expression of AwTSs under laboratory conditions We further analysed the count of the RNA transcripts of each of the terpene genes by comparing them with the beta-tubulin and GAPDH (housekeeping) genes of A. wentii to gain insights into the level of their gene expression ( Table 5 ). Interestingly, from the 16 TSs recruited for our analysis across the two different timepoints of 7 days and 30 days, only four genes (AwTS3, -5, -9, and -10) were expressed at considerable levels, while others were suppressed or not expressed under laboratory conditions ( Table 5 ). AwTS3 and AwTS5 are predicted to be lanosterol synthases, whereas AwTS9 and AwTS10 are predicted to be a geranylgeranyl pyrophosphate synthase and a farnesyl-diphosphate farnesyltransferase, respectively ( Table 3 ). Moreover, AwTS9 was differentially expressed across the two timepoints, with a substantial increase in expression at 30 days. Generally, most terpenoid genes exhibited the same suppression characteristic across the two timepoints suggesting that some genes responded in similar ways to standard laboratory conditions. View this table: View inline View popup Download powerpoint Table 5: Transcriptomic hitcounts of terpenoid genes in Aspergillus wentii CBS 141173 at two timepoints (7 and 30 days) performed in duplicate (A and B). Genes highlighted in red (AwTS3, -5, -9, and -10) show the highest expression across the samples analysed. DISCUSSION In this study, we provided the long-read genome assembly of A. wentii CBS 141173 with RNA-seq functional annotation, which has improved the quality of genomic resources available to carry out biosynthetic studies on this fungal strain. We successfully sequenced the whole genome of A. wentii to about 31.2 Mb, which is consistent with the genome sequence and assembly that was initially published [ 5 ]. The improved annotated genome assembly allowed for a significant improvement in the identification of 66 BGCs, including 16 terpene synthases, from the genome that could direct the biosynthesis of novel and known bioactive compounds. Our study shows how Nanopore sequencing can continue to spur long-read assembly of fungal genomes for targeted biosynthetic studies and is becoming increasingly useful even for both genomics and metagenomic research [ 26 , 27 ]. Various high-quality fungal genomes have already been sequenced on a MinION [ 28 – 30 ] thereby contributing to the availability of fungal genomes across curated databases such as NCBI and JGI. Nanopore sequencing presents challenges with accuracy when compared to established short-read platforms such as Illumina [ 31 ]. The proposed standard for most whole-genome sequencing projects to achieve high quality assemblies would be a hybrid assembly by incorporating both nanopore long-read and short-read sequencing [ 32 ] as seen in Tamizi et al . [ 32 ], as it combines the advantages provided by the two sequencing platforms. Equally, we believe that a cost-effective stand-alone long read sequencing strategy can become a viable alternative. Providing necessary software upgrades for genome polishing tools and base calling algorithms would improve assembly confidence for downstream genomic studies [ 33 ]. Additionally, incorporating paired-end RNA-seq data to guide functional annotation of long-reads assembly can boost the integrity of the whole-genome assembly [ 34 ]. From the metabolite analysis conducted in our study, the bioactive norditerpenoid asperolide A made by A. wentii CBS 141173 was detected. The compound has been reported to show cytotoxicity against several human tumour cell lines in preliminary screening experiments and has been reported to inhibit lung carcinoma cell proliferation [ 35 ], bone metastatic breast cancer [ 36 ], and hepatocellular carcinoma cell proliferation by targeting MAPK and TP53 [ 6 , 7 , 35 , 37 ]. The structural similarities between asperolide A and other high-value anticancer norditerpenoids such as wentilactones A and B [ 38 , 39 ] confirms its potential as a scaffold for drug development. To uncover the biosynthesis of such high-value molecules, the biosynthetic genes need to be identified. AntiSMASH is a powerful tool that has enabled the identification of BGCs encoding high value compounds. A classic example is strobilurin – the natural product that inspired the development of the β-methoxyacrylate class of agricultural fungicides that are widely used in crop protection [ 40 , 41 ]. AntiSMASH enabled the identification of the strobilurin polyketide BGC from the Strobilurus tenacellus genome and facilitated the characterisation of its biosynthetic pathway [ 40 ]. Other traditional approaches can also be used to identify novel BGCs. For instance, in the identification of the pleuromutilin terpenoid BGC from Clitopilus passeckerianus , degenerate PCR was used to identify putative GGPPS and then followed by analysis of the flanking regions to reveal additional biosynthetic genes included in the pleuromutilin BGC [ 42 , 43 ]. With advances in sequencing technology and continuous improvements with the bioinformatic tools, such as antiSMASH [ 14 ], and cblaster [ 15 ] finding novel terpenoid BGCs has become easier. From our study, a complementary gene mining approach using antiSMASH and local BlastP searches enabled the identification of BGCs that might not be picked up by antiSMASH alone due to the lack of canonical synthase genes in some BGCs [ 44 ]. With this approach we were able to recruit 16 terpene synthases for downstream analysis. We further analysed the flanking regions of the terpene synthases to reveal their potential to encode diterpenoid compounds. From our analysis, we highlighted two diterpenoid clusters from AwTS15 and AwTS16 that could be involved in the biosynthesis of pimarane diterpenoids such as pimaradiene [ 45 ], and acanthoic acid (46). Noteworthy, the pimarane carbon skeleton is a signature scaffold for notable diterpenoids isolated from A. wentii such as aspewentins and wentinoids [ 4 ]. The presence of tailoring enzymes such as cytochrome P450 and oxidoreductase enzymes in the highlighted cluster adds credibility to the potential of the cluster to direct the biosynthesis of a bioactive diterpenoid compound. From the phylogeny analysis, A. wentii terpene synthases appeared to be very diverse and could be involved in directing monocyclic and tricyclic terpenoid based scaffolds. For instance, humulene based scaffolds are monocyclic sesquiterpenoids recognised for their cytotoxic and anti-inflammatory effects [ 47 – 49 ]. Although a common feature of some plant terpenoids [ 49 ], humulene synthases have been characterised from fungi such as EupE , which is involved in the biosynthesis of Eupenifeldin [ 50 ]. Our phylogenetic study further reiterates the possibility of some AwTS to encode tricyclic diterpenoids due to their relationship with pimaradiene synthases [ 51 , 52 ] and its resulting compounds are often known for their cytotoxic bioactivity [ 46 , 52 ]. Terpene synthases are very versatile, as they can be involved in making either stand-alone terpenoids or hybrid biosynthetic products, such as alkaloidal terpenoids from a mixed terpene and nonribosomal peptide biosynthetic pathway [ 53 ]. Since none of the terpene synthases from A. wentii have been experimentally characterised, it will be informative to understand the function of these genes via either heterologous expression or gene deletions. Transcriptomic analysis showed that most terpenoid synthases of A. wentii are not expressed under standard laboratory conditions. The use of beta-tubulin and GAPDH as reference genes to analyse the transcript level of the terpenoid synthase genes shows low levels of expression across the 7- and 30-days timepoints. This is not unusual, as various strategies have been used to improve expression of BGCs in fungi. For instance, the manipulation of transcription regulators such as mcrA impacts fungal secondary metabolism especially in A. wentii to upregulate and trigger the expression of cryptic BGCs [ 54 , 55 ]. Additionally, the culture medium condition has a role in determining fungal metabolism and growth [ 56 ]. The availability and concentration of certain nutrients such as carbon source, minerals and pH can influence gene expressions and ultimately impact the production of secondary metabolites [ 56 ]. For example, the production of ascofuranone and ascochlorin, meroterpenoid compounds from Acremonium egyptiacum , was shown to be dependent on the culture medium [ 57 ]. Since Aspergillus wentii is associated with marine habitats [ 6 ], extracting RNA and metabolites from mycelia grown in culture medium supplemented with seawater could provide more insight into the production of some of its cryptic metabolites and other norditerpenoid dilactones which have been detected in A. wentii . CONCLUSIONS Our study provides a platform for elucidating the biosynthesis of norditerpenoids and other specialised metabolites made by Aspergillus wentii CBS 141173. Under standard laboratory conditions, RNA-seq data from two time points of 7 days and 30 days enabled us to provide a robust annotation for our nanopore long-read assembly. Based on the secondary metabolite analysis of Aspergillus wentii CBS 141173, we were able to confirm the production of asperolide A. We further analysed 16 terpene synthases identified from our genome assembly that could be involved in the biosynthesis of various terpenoid scaffolds in Aspergillus wentii , and highlighted two clusters that could make diterpenoids such as pimarane-like compounds. Genetic engineering strategies such as heterologous expression and gene disruption experiments, including through CRISPR/Cas9, can be used to link the compounds to their respective biosynthetic genes and enable us to elucidate the terpenoid biosynthetic pathways for bioactive molecules such as asperolide A made by A. wentii . Ethics approval and consent to participate Not applicable. Consent for publication Not applicable. Availability of data and materials The assembled annotated genome was deposited at the NCBI database under the BioProject: PRJNA1133277, accession number: CP165651 - CP165658 (Supplementary Table 4). RNA-seq raw data is available upon request. Competing interests None. Funding F.A. was supported by a UKRI Future Leaders Fellowship [MR/V022334/1]. Authors’ contributions F.A., C.C. and R.O. were responsible for project conceptualisation. R.O. and F.A. were responsible for experimental design and analysis. R.O. analysed and interpreted the data. R.O. wrote the initial manuscript. F.A. reviewed and edited the manuscript with contributions from C.C. All authors read and approved the final manuscript. Acknowledgements We would like to thank Richard Stark (University of Warwick Bioinformatics & Digital Health RTP), Jack Weaver, and Tosin Orababa for their help with the installation and the operation of the statistical and genome assembly software packages. Lijiang Song is also acknowledged for help with UHPLC-HRMS analysis. References 1. ↵ Hagag A , Abdelwahab MF , Abd El-kader AM , Fouad MA . The endophytic Aspergillus strains: A bountiful source of natural products . Vol. 132 , Journal of Applied Microbiology . John Wiley and Sons Inc ; 2022 . p. 4150 – 69 . OpenUrl 2. ↵ Hajjaj H , Niederberger P , Duboc P. Lovastatin Biosynthesis by Aspergillus terreus in a Chemically Defined Medium . Appl Environ Microbiol . 2001 Jun ; 67 ( 6 ): 2596 – 602 . OpenUrl Abstract / FREE Full Text 3. ↵ Newman DJ , Cragg GM . Natural Products as Sources of New Drugs over the Nearly Four Decades from 01/1981 to 09/2019 . Vol. 83 , Journal of Natural Products . American Chemical Society ; 2020 . p. 770 – 803 . OpenUrl CrossRef PubMed 4. ↵ Ainousah BE , Ibrahim SRM , Alzain AA , Mohamed SGA , Hussein HGA , Ashour A , et al. Exploring the potential of Aspergillus wentii: secondary metabolites and biological properties . Vol. 206 , Archives of Microbiology . Springer Science and Business Media Deutschland GmbH ; 2024 . 5. ↵ de Vries RP , Riley R , Wiebenga A , Aguilar-Osorio G , Amillis S , Uchima CA , et al. Comparative genomics reveals high biological diversity and specific adaptations in the industrially and medically important fungal genus Aspergillus . Genome Biol . 2017 Feb 14; 18 ( 1 ). 6. ↵ Sun HF , Li XM , Meng L , Cui CM , Gao SS , Li CS , et al. Asperolides A-C, tetranorlabdane diterpenoids from the marine alga-derived endophytic fungus aspergillus wentii EN-48 . J Nat Prod . 2012 Feb 24; 75 ( 2 ): 148 – 52 . OpenUrl PubMed 7. ↵ Xu R , Li X , Xu G , Wang B. Optimizing production of asperolide A, a potential anti-tumor tetranorditerpenoid originally produced by the algal-derived endophytic fungus Aspergillus wentii EN-48 . Chinese Journal of Oceanology and Limnology . 2017 May 1; 35 ( 3 ): 658 – 63 . OpenUrl 8. ↵ Lv C , Hong Y , Miao L , Li C , Xu G , Wei S , et al. Wentilactone A as a novel potential antitumor agent induces apoptosis and G2/M arrest of human lung carcinoma cells, and is mediated by HRas-GTP accumulation to excessively activate the Ras/Raf/ERK/p53-p21 pathway . Cell Death Dis . 2013 Dec ; 4 ( 12 ). 9. ↵ Quin MB , Flynn CM , Schmidt-Dannert C. Traversing the fungal terpenome . Vol. 31 , Natural Product Reports. Royal Society of Chemistry ; 2014 . p. 1449 – 73 . OpenUrl 10. ↵ Luo P , Huang JH , Lv JM , Wang GQ , Hu D , Gao H. Biosynthesis of fungal terpenoids . Vol. 41 , Natural Product Reports . Royal Society of Chemistry ; 2024 . p. 748 – 83 . OpenUrl 11. ↵ Zeng N , Zhang Q , Yao Q , Fu G , Su W , Wang W , et al. A Comprehensive Review of the Classification, Sources, Phytochemistry, and Pharmacology of Norditerpenes . Vol. 29 , Molecules . Multidisciplinary Digital Publishing Institute (MDPI ); 2024 . 12. ↵ Yuan Y , Cheng S , Bian G , Yan P , Ma Z , Dai W , et al. Efficient exploration of terpenoid biosynthetic gene clusters in filamentous fungi . Nat Catal . 2022 Apr 1; 5 ( 4 ): 277 – 87 . OpenUrl 13. ↵ Alberti F , Foster GD , Bailey AM . Natural products from filamentous fungi and production by heterologous expression . Vol. 101 , Applied Microbiology and Biotechnology . Springer Verlag ; 2017 . p. 493 – 500 . OpenUrl CrossRef 14. ↵ Blin K , Shaw S , Augustijn HE , Reitz ZL , Biermann F , Alanjary M , et al. AntiSMASH 7.0: New and improved predictions for detection, regulation, chemical structures and visualisation . Nucleic Acids Res . 2023 Jul 5; 51 ( W1 ): W46 – 50 . OpenUrl CrossRef 15. ↵ Gilchrist CLM , Booth TJ , Van Wersch B , Van Grieken L , Medema MH , Chooi YH . cblaster: a remote search tool for rapid identification and visualization of homologous gene clusters . Bioinformatics Advances . 2021 ; 1 ( 1 ). 16. Sereika M , Kirkegaard RH , Karst SM , Michaelsen TY , Sørensen EA , Wollenberg RD , et al. Oxford Nanopore R10.4 long-read sequencing enables the generation of near-finished bacterial genomes from pure cultures and metagenomes without short-read or reference polishing . Nat Methods . 2022 Jul 1; 19 ( 7 ): 823 – 6 . OpenUrl CrossRef 17. ↵ Li H. Minimap2: Pairwise alignment for nucleotide sequences . Bioinformatics . 2018 Sep 15; 34 ( 18 ): 3094 – 100 . OpenUrl CrossRef PubMed 18. ↵ Walker BJ , Abeel T , Shea T , Priest M , Abouelliel A , Sakthikumar S , et al. Pilon: An integrated tool for comprehensive microbial variant detection and genome assembly improvement . PLoS One . 2014 Nov 19; 9 ( 11 ). 19. ↵ Simão FA , Waterhouse RM , Ioannidis P , Kriventseva E V. , Zdobnov EM . BUSCO: Assessing genome assembly and annotation completeness with single-copy orthologs . Bioinformatics . 2015 Oct 1; 31 ( 19 ): 3210 – 2 . OpenUrl CrossRef PubMed 20. ↵ Jonathan M. Palmer & JS . Funannotate v1.8.1: Eukaryotic genome annotation (v1.8.1) . Zenodo . 2020 ; 21. ↵ Cantalapiedra CP , Hernlandez-Plaza A , Letunic I , Bork P , Huerta-Cepas J. eggNOG-mapper v2: Functional Annotation, Orthology Assignments, and Domain Prediction at the Metagenomic Scale . Mol Biol Evol . 2021 ; 38 ( 12 ): 5825 – 9 . OpenUrl CrossRef 22. ↵ Gremme G , Steinbiss S , Kurtz S. Genome tools: A comprehensive software library for efficient processing of structured genome annotations . IEEE/ACM Trans Comput Biol Bioinform . 2013 ; 10 ( 3 ): 645 – 56 . OpenUrl CrossRef 23. ↵ Tamura K , Stecher G , Kumar S. MEGA11: Molecular Evolutionary Genetics Analysis Version 11 . Mol Biol Evol . 2021 Jul 1; 38 ( 7 ): 3022 – 7 . OpenUrl CrossRef 24. ↵ Han X , Chakrabortti A , Zhu J , Liang ZX , Li J. Sequencing and functional annotation of the whole genome of the filamentous fungus Aspergillus westerdijkiae . BMC Genomics . 2016 Aug 15; 17 ( 1 ). 25. Archer M , Xu J. Current practices for reference gene selection in rt-qpcr of aspergillus: Outlook and recommendations for the future . Genes (Basel) . 2021 Jun 1; 12 ( 7 ). 26. ↵ Kerkhof LJ . Is Oxford Nanopore sequencing ready for analyzing complex microbiomes? Vol. 97 , FEMS Microbiology Ecology . Oxford University Press ; 2021 . 27. ↵ Morrison GA , Fu J , Lee GC , Wiederhold NP , Cañete-Gibas CF , Bunnik EM , et al. Nanopore Sequencing of the Fungal Intergenic Spacer Sequence as a Potential Rapid Diagnostic Assay [Internet] . 2020 . Available from: https://journals.asm.org/journal/jcm 28. ↵ McKenzie SK , Walston RF , Allen JL . Complete, high-quality genomes from long-read metagenomic sequencing of two wolf lichen thalli reveals enigmatic genome architecture . Genomics . 2020 Sep 1; 112 ( 5 ): 3150 – 6 . OpenUrl CrossRef 29. Petersen C , Sørensen T , Westphal KR , Fechete LI , Sondergaard TE , Sørensen JL , et al. High molecular weight DNA extraction methods lead to high quality filamentous ascomycete fungal genome assemblies using Oxford Nanopore sequencing . Microb Genom . 2022 ; 8 ( 4 ). 30. ↵ Dutreux F , Da Silva C , D’agata L , Couloux A , Gay EJ , Istace B , et al. Data descriptor: De novo assembly and annotation of three leptosphaeria genomes using oxford nanopore minion sequencing . Sci Data . 2018 ; 5 . 31. ↵ Amarasinghe SL , Su S , Dong X , Zappia L , Ritchie ME , Gouil Q. Opportunities and challenges in long-read sequencing data analysis . Vol. 21 , Genome Biology . BioMed Central Ltd .; 2020 . 32. ↵ Tamizi AA , Mat-Amin N , Weaver JA , Olumakaiye RT , Akbar MA , Jin S , et al. Genome Sequencing and Analysis of Trichoderma (Hypocreaceae) Isolates Exhibiting Antagonistic Activity against the Papaya Dieback Pathogen, Erwinia mallotivora . Journal of Fungi . 2022 Mar 1; 8 ( 3 ). 33. ↵ Lee JY , Kong M , Oh J , Lim JS , Chung SH , Kim JM , et al. Comparative evaluation of Nanopore polishing tools for microbial genome assembly and polishing strategies for downstream analysis . Sci Rep . 2021 Dec 1; 11 ( 1 ). 34. ↵ Cortés-Maldonado L , Marcial-Quino J , Gómez-Manzo S , Fierro F , Tomasini A. A method for the extraction of high quality fungal RNA suitable for RNA-seq . J Microbiol Methods . 2020 Mar 1; 170 . 35. ↵ Lv C , Sun W , Sun H , Wei S , Chen R , Wang B , et al. Asperolide A, a marine-derived tetranorditerpenoid, induces G2/M arrest in human NCI-H460 lung carcinoma cells, is mediated by p53-p21 stabilization and modulated by Ras/Raf/MEK/ERK signaling pathway . Mar Drugs . 2013 ; 11 ( 2 ): 316 – 31 . OpenUrl CrossRef PubMed 36. ↵ Jiang W , Rixiati Y , Huang H , Shi YJ , Huang C , Jiao B. Asperolide A prevents bone metastatic breast cancer via the PI3K/AKT/mTOR/c-Fos/NFATc1 signaling pathway . Cancer Med . 2020 Nov 1; 9 ( 21 ): 8173 – 85 . OpenUrl 37. ↵ Lv C , Lan A , Fan X , Huang C , Yang G. Asperolide A induces apoptosis and cell cycle arrest of human hepatoma cells with p53-Y220C mutant through p38 mediating phosphorylation of p53 (S33) . Heliyon . 2023 Mar 1; 9 ( 3 ). 38. ↵ Jiang W , Meng L , Xu G , Lv C , Wang H , Tian HE , et al. Wentilactone a induces cell apoptosis by targeting AKR1C1 gene via the IGF-1R/IRS1/PI3K/AKT/NRF2/FLIP/Caspase-3 signaling pathway in small cell lung cancer . Oncol Lett . 2018 Nov 1; 16 ( 5 ): 6445 – 57 . OpenUrl 39. ↵ Zhang Z , Miao L , Lv C , Sun H , Wei S , Wang B , et al. Wentilactone B induces G2/M phase arrest and apoptosis via the Ras/Raf/MAPK signaling pathway in human hepatoma SMMC-7721 cells . Cell Death Dis . 2013 Jun ; 4 ( 6 ). 40. ↵ Nofiani R , de Mattos-Shipley K , Lebe KE , Han LC , Iqbal Z , Bailey AM , et al. Strobilurin biosynthesis in Basidiomycete fungi . Nat Commun . 2018 Dec 1; 9 ( 1 ). 41. ↵ Song H , Song HX , Shi DQ . Synthesis and fungicidal activity of strobilurin analogues containing 1,2,4-triazole oxime ether moiety . J Heterocycl Chem . 2014 ; 51 ( 6 ): 1603 – 6 . OpenUrl 42. ↵ Bailey AM , Alberti F , Kilaru S , Collins CM , De Mattos-Shipley K , Hartley AJ , et al. Identification and manipulation of the pleuromutilin gene cluster from Clitopilus passeckerianus for increased rapid antibiotic production . Sci Rep . 2016 May 4; 6 . 43. ↵ Alberti F , Khairudin K , Venegas ER , Davies JA , Hayes PM , Willis CL , et al. Heterologous expression reveals the biosynthesis of the antibiotic pleuromutilin and generates bioactive semi-synthetic derivatives . Nat Commun . 2017 Dec 1; 8 ( 1 ). 44. ↵ Rokas A , Mead ME , Steenwyk JL , Raja HA , Oberlies NH . Biosynthetic gene clusters and the evolution of fungal chemodiversity . Vol. 37 , Natural Product Reports . Royal Society of Chemistry ; 2020 . p. 868 – 78 . OpenUrl 45. ↵ Bromann K , Viljanen K , Moreira VM , Yli-Kauhaluoma J , Ruohonen L , Nakari-Setälä T. Isolation and purification of ent-pimara-8(14), 15-diene from engineered Aspergillus nidulans by accelerated solvent extraction combined with HPLC . Analytical Methods . 2014 Feb 21; 6 ( 4 ): 1227 – 34 . OpenUrl 46. ↵ Dou JY , Jiang YC , Cui ZY , Lian LH , Nan JX , Wu YL . Acanthoic acid, unique potential pimaradiene diterpene isolated from Acanthopanax koreanum Nakai (Araliaceae): A review on its pharmacology, molecular mechanism, and structural modification . Vol. 200 , Phytochemistry . Elsevier Ltd ; 2022 . 47. ↵ Becker L , Holtmann D. Anti-inflammatory effects of α-humulene on the release of pro-inflammatory cytokines in lipopolysaccharide-induced THP-1 cells . Cell Biochem Biophys . 2024 ; 48. Zhao WY , Yi J , Chang YB , Sun CP , Ma XC . Recent studies on terpenoids in Aspergillus fungi: Chemical diversity, biosynthesis, and bioactivity . Vol. 193 , Phytochemistry . Elsevier Ltd ; 2022 . 49. ↵ Mendes de Lacerda Leite G , de Oliveira Barbosa M , Pereira Lopes MJ , de Araújo Delmondes G , Bezerra DS , Araújo IM , et al. Pharmacological and toxicological activities of α-humulene and its isomers: A systematic review . Vol. 115 , Trends in Food Science and Technology . Elsevier Ltd ; 2021 . p. 255 – 74 . OpenUrl 50. ↵ Zhai Y , Li Y , Zhang J , Zhang Y , Ren F , Zhang X , et al. Identification of the gene cluster for bistropolone-humulene meroterpenoid biosynthesis in Phoma sp . Fungal Genetics and Biology . 2019 Aug 1; 129 : 7 – 15 . OpenUrl 51. ↵ Bromann K , Toivari M , Viljanen K , Vuoristo A , Ruohonen L , Nakari-Setälä T. Identification and characterization of a novel diterpene gene cluster in aspergillus nidulans . PLoS One . 2012 Apr 10; 7 ( 4 ). 52. ↵ Ye K , Ai HL . Pimarane Diterpenes from Fungi . Vol. 15 , Pharmaceuticals . MDPI ; 2022 . 53. ↵ Yee DA , Kakule TB , Cheng W , Chen M , Chong CTY , Hai Y , et al. Genome Mining of Alkaloidal Terpenoids from a Hybrid Terpene and Nonribosomal Peptide Biosynthetic Pathway . J Am Chem Soc . 2020 Jan 15; 142 ( 2 ): 710 – 4 . OpenUrl 54. ↵ Yuan B , Keller NP , Oakley BR , Stajich JE , Wang CCC . Manipulation of the Global Regulator mcrA Upregulates Secondary Metabolite Production in Aspergillus wentii Using CRISPR-Cas9 with In Vitro Assembled Ribonucleoproteins . ACS Chem Biol . 2022 Oct 21; 17 ( 10 ): 2828 – 35 . OpenUrl 55. ↵ Oakley CE , Ahuja M , Sun WW , Entwistle R , Akashi T , Yaegashi J , et al. Discovery of McrA, a master regulator of Aspergillus secondary metabolism . Mol Microbiol . 2017 Jan 1; 103 ( 2 ): 347 – 65 . OpenUrl CrossRef 56. ↵ Hur JY , Jeong E , Kim YC , Lee SR . Strategies for Natural Product Discovery by Unlocking Cryptic Biosynthetic Gene Clusters in Fungi . Vol. 10 , Separations . MDPI ; 2023 . 57. ↵ Araki Y , Awakawa T , Matsuzaki M , Cho R , Matsuda Y , Hoshino S , et al. Complete biosynthetic pathways of ascofuranone and ascochlorin in Acremonium egyptiacum . Proc Natl Acad Sci U S A . 2019 ; 116 ( 17 ): 8269 – 74 . OpenUrl Abstract / FREE Full Text View the discussion thread. Back to top Previous Next Posted September 24, 2024. Download PDF Supplementary Material Email Thank you for your interest in spreading the word about bioRxiv. NOTE: Your email address is requested solely to identify you as the sender of this article. Your Email * Your Name * Send To * Enter multiple addresses on separate lines or separate them with commas. You are going to email the following Identification of a terpene synthase arsenal using long-read sequencing and genome assembly of Aspergillus wentii Message Subject (Your Name) has forwarded a page to you from bioRxiv Message Body (Your Name) thought you would like to see this page from the bioRxiv website. Your Personal Message CAPTCHA This question is for testing whether or not you are a human visitor and to prevent automated spam submissions. Share Identification of a terpene synthase arsenal using long-read sequencing and genome assembly of Aspergillus wentii Richard Olumakaiye , Christophe Corre , Fabrizio Alberti bioRxiv 2024.09.23.614465; doi: https://doi.org/10.1101/2024.09.23.614465 Share This Article: Copy Citation Tools Identification of a terpene synthase arsenal using long-read sequencing and genome assembly of Aspergillus wentii Richard Olumakaiye , Christophe Corre , Fabrizio Alberti bioRxiv 2024.09.23.614465; doi: https://doi.org/10.1101/2024.09.23.614465 Citation Manager Formats BibTeX Bookends EasyBib EndNote (tagged) EndNote 8 (xml) Medlars Mendeley Papers RefWorks Tagged Ref Manager RIS Zotero Tweet Widget Facebook Like Google Plus One Subject Area Genomics Subject Areas All Articles Animal Behavior and Cognition (7651) Biochemistry (17746) Bioengineering (13928) Bioinformatics (42066) Biophysics (21499) Cancer Biology (18650) Cell Biology (25579) Clinical Trials (138) Developmental Biology (13409) Ecology (19947) Epidemiology (2067) Evolutionary Biology (24374) Genetics (15633) Genomics (22557) Immunology (17775) Microbiology (40505) Molecular Biology (17217) Neuroscience (88796) Paleontology (667) Pathology (2845) Pharmacology and Toxicology (4836) Physiology (7664) Plant Biology (15179) Scientific Communication and Education (2047) Synthetic Biology (4304) Systems Biology (9839) Zoology (2272)

Text is read by the "Ask this paper" AI Q&A widget below. Extraction quality varies by source — PMC NXML preserves structure cleanly, OA-HTML may include some navigation residue, and OA-PDF can have broken hyphenation. The publisher copy (via DOI) is the canonical version.

My notes (saved in your browser only)

Ask this paper AI returns verbatim quotes from the full text · source: preprint-html

Answers must be backed by verbatim quotes from this paper's full text. Hallucinated quotes are dropped automatically; if no verbatim passage answers the question, we say so. How this works

Citation neighborhood (no data yet)

We don't have any in-corpus citations linked to this paper yet. This is a recent paper (2024) — citers typically take a year or two to land, and the OpenAlex reference graph may still be filling in.

Source provenance

europepmc
last seen: 2026-05-20T01:45:00.602351+00:00