Deconvolving mutation and selection reveals stage-specific drivers of thyroid cancer

preprint OA: closed
📄 Open PDF Full text JSON View at publisher
Full text 22,952 characters · extracted from preprint-html · click to expand
Deconvolving mutation and selection reveals stage-specific drivers of thyroid cancer | bioRxiv /* */ /* */ <!-- <!-- /*! * yepnope1.5.4 * (c) WTFPL, GPLv2 */ (function(a,b,c){function d(a){return"[object Function]"==o.call(a)}function e(a){return"string"==typeof a}function f(){}function g(a){return!a||"loaded"==a||"complete"==a||"uninitialized"==a}function h(){var a=p.shift();q=1,a?a.t?m(function(){("c"==a.t?B.injectCss:B.injectJs)(a.s,0,a.a,a.x,a.e,1)},0):(a(),h()):q=0}function i(a,c,d,e,f,i,j){function k(b){if(!o&&g(l.readyState)&&(u.r=o=1,!q&&h(),l.onload=l.onreadystatechange=null,b)){"img"!=a&&m(function(){t.removeChild(l)},50);for(var d in y[c])y[c].hasOwnProperty(d)&&y[c][d].onload()}}var j=j||B.errorTimeout,l=b.createElement(a),o=0,r=0,u={t:d,s:c,e:f,a:i,x:j};1===y[c]&&(r=1,y[c]=[]),"object"==a?l.data=c:(l.src=c,l.type=a),l.width=l.height="0",l.onerror=l.onload=l.onreadystatechange=function(){k.call(this,r)},p.splice(e,0,u),"img"!=a&&(r||2===y[c]?(t.insertBefore(l,s?null:n),m(k,j)):y[c].push(l))}function j(a,b,c,d,f){return q=0,b=b||"j",e(a)?i("c"==b?v:u,a,b,this.i++,c,d,f):(p.splice(this.i++,0,a),1==p.length&&h()),this}function k(){var a=B;return a.loader={load:j,i:0},a}var l=b.documentElement,m=a.setTimeout,n=b.getElementsByTagName("script")[0],o={}.toString,p=[],q=0,r="MozAppearance"in l.style,s=r&&!!b.createRange().compareNode,t=s?l:n.parentNode,l=a.opera&&"[object Opera]"==o.call(a.opera),l=!!b.attachEvent&&!l,u=r?"object":l?"script":"img",v=l?"script":u,w=Array.isArray||function(a){return"[object Array]"==o.call(a)},x=[],y={},z={timeout:function(a,b){return b.length&&(a.timeout=b[0]),a}},A,B;B=function(a){function b(a){var a=a.split("!"),b=x.length,c=a.pop(),d=a.length,c={url:c,origUrl:c,prefixes:a},e,f,g;for(f=0;f<d;f++)g=a[f].split("="),(e=z[g.shift()])&&(c=e(c,g));for(f=0;f<b;f++)c=x[f](c);return c}function g(a,e,f,g,h){var i=b(a),j=i.autoCallback;i.url.split(".").pop().split("?").shift(),i.bypass||(e&&(e=d(e)?e:e[a]||e[g]||e[a.split("/").pop().split("?")[0]]),i.instead?i.instead(a,e,f,g,h):(y[i.url]?i.noexec=!0:y[i.url]=1,f.load(i.url,i.forceCSS||!i.forceJS&&"css"==i.url.split(".").pop().split("?").shift()?"c":c,i.noexec,i.attrs,i.timeout),(d(e)||d(j))&&f.load(function(){k(),e&&e(i.origUrl,h,g),j&&j(i.origUrl,h,g),y[i.url]=2})))}function h(a,b){function c(a,c){if(a){if(e(a))c||(j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}),g(a,j,b,0,h);else if(Object(a)===a)for(n in m=function(){var b=0,c;for(c in a)a.hasOwnProperty(c)&&b++;return b}(),a)a.hasOwnProperty(n)&&(!c&&!--m&&(d(j)?j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}:j[n]=function(a){return function(){var b=[].slice.call(arguments);a&&a.apply(this,b),l()}}(k[n])),g(a[n],j,b,n,h))}else!c&&l()}var h=!!a.test,i=a.load||a.both,j=a.callback||f,k=j,l=a.complete||f,m,n;c(h?a.yep:a.nope,!!i),i&&c(i)}var i,j,l=this.yepnope.loader;if(e(a))g(a,0,l,0);else if(w(a))for(i=0;i (function(w,d,s,l,i){w[l]=w[l]||[];w[l].push({'gtm.start':new Date().getTime(),event:'gtm.js'});var f=d.getElementsByTagName(s)[0];var j=d.createElement(s);var dl=l!='dataLayer'?'&l='+l:'';j.src='//www.googletagmanager.com/gtm.js?id='+i+dl;j.type='text/javascript';j.async=true;f.parentNode.insertBefore(j,f);})(window,document,'script','dataLayer','GTM-M677548'); Skip to main content Home About Submit ALERTS / RSS Search for this keyword Advanced Search New Results Deconvolving mutation and selection reveals stage-specific drivers of thyroid cancer View ORCID Profile Moein Rajaei , View ORCID Profile Andrew Ju , View ORCID Profile Adebowale J. Adeniran , View ORCID Profile Jeffrey P. Townsend doi: https://doi.org/10.1101/2025.10.08.681166 Moein Rajaei 1 Department of Biostatistics, Yale School of Public Health , New Haven, CT Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Moein Rajaei Andrew Ju 1 Department of Biostatistics, Yale School of Public Health , New Haven, CT Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Andrew Ju Adebowale J. Adeniran 2 Department of Pathology, Yale School of Medicine , New Haven, CT 3 Yale Cancer Center, Yale University , New Haven, CT Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Adebowale J. Adeniran Jeffrey P. Townsend 1 Department of Biostatistics, Yale School of Public Health , New Haven, CT 3 Yale Cancer Center, Yale University , New Haven, CT 4 Department of Ecology and Evolutionary Biology, Yale University , New Haven, CT, 5 Program in Computational Biology and Biomedical Informatics, Yale University , New Haven, CT Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Jeffrey P. Townsend For correspondence: jeffrey.townsend{at}yale.edu Abstract Full Text Info/History Metrics Preview PDF Abstract Objective Mutational profiles of primary and metastatic thyroid cancer (THCA) have been examined by comparison of somatic mutation prevalences in the two stages, using P values to identify significant differences. However, prevalences and P values for mutations do not directly quantify the cancer effects of somatic variants. Methods We calculated cancer effect sizes accounting for substantial gene- and site-specific mutation rates, to quantify somatic selection across stages. This approach provides a direct measure of cancer-driving impact of new mutations and reveals the genes that drive tumorigenesis and progression, and whether mutations have greater effects in primary or metastatic THCA. Results Trinucleotide mutation profiles were similar between primary and metastatic THCA. Most canonical driver genes ( BRAF, NRAS, TP53, ATM, EIF1AX, KMT2C, NF1, RBM10, ARID1A, PIK3CA , and NKX2-1 ) exhibited stronger selection during initial tumorigenesis (from organogenesis to primary THCA) than during progression (from primary to metastatic THCA). Notably, TERT mutations have been shown to be at higher prevalence in metastatic tumors, yet their strongest selection occurred earlier, during tumor initiation. In contrast, RET mutations exhibited the opposite trajectory, experiencing weaker selection during tumorigenesis but stronger selection during metastatic progression. Conclusion Cancer effect size analysis revealed dynamic shifts in selective pressures across THCA evolution, distinguishing genes that drive initiation from those that promote metastatic progression. This evolutionary framework provides a quantitative basis for understanding THCA pathogenesis and provides guidance for stage-specific precision-medicine therapeutic strategies. Background Thyroid cancer (THCA) has one of the highest contemporary 5-year survival rates among cancers (98%) 1 . Nevertheless,it accounted for an estimated 821,000 new cases and 44,000 deaths worldwide in 2022 2 , ranking as the seventh-most commonly diagnosed malignancy. Prognosis declines sharply with stage, from 99.8% survival for localized tumors to 97% with regional metastases, and 57.3% with distant metastases 3 , demonstrating the importance of early diagnosis and treatment to prevent metastatic spread and improve outcomes. Given the crucial value of understanding the differences between primary and metastatic THCA, prior studies have characterized variant profiles of tumors by reporting differences in prevalence between stages, accompanied by their statistical significance 4 , However, prevalence conveys only the proportion of patients carrying a variant, and P values convey only the probability of observed differences given the data. They are related to, but are not measures of oncogenic effect 5 . A more comprehensive understanding therefore requires quantification of mutational patterns, background mutation rates, and selective pressures on driver genes across disease stages. To guide basic and translational research, we analyzed 2,145 primary and 1,374 metastatic THCA sequences from Maximo et al 4 , Masoodi et al 6 , TCGA, and GENIE. Quantifying gene- and site-specific mutation rates, we established neutral expectations, separating mutational processes from selective pressures. We then quantified somatic selection on driver genes, distinguishing those most crucial to tumor initiation from those driving metastatic progression. Methods Of 475 target-sequenced primary and metastatic TCs reported by Maximo et al . 4 , we analyzed the 458 non-follicular tumors for which non-synonymous single-nucleotide variants (SNVs) were provided. We also included whole-exome sequences from TCGA, targeted panel data from GENIE Release 15.1 7 , and 14 matched primary-metastasis pairs from Masoodi et al . 6 . In total, our dataset comprised 2,145 primary and 1,374 metastatic tumors, aligned to the human reference genome Hg19. TCGA data originally aligned to Hg38 was converted to Hg19 using Liftover. We analyzed the trinucleotide mutational profiles of primary and metastatic THCA using MutationalPatterns v3.8.1 8 and cancereffectsizeR v2.9.0 9 . Following Cannataro et al. 10 , we excluded mutational signatures previously determined to be absent in THCA 11 . Trinucleotide mutation rates were convolved with gene-specific background rates 12 to estimate neutral expectations for each site, and the sequential model 9 was applied to quantify somatic selection during both primary tumorigenesis and metastatic progression. Analyses focused on the sixteen most prevalent thyroid cancer genes reported by Maximo et al. 4 . Variants within genes were modeled with site-specific mutation rates but as sharing a single invariant cancer effect size. This approach enabled quantification of stage-specific differences in somatic selection intensity, providing insight into the mutations driving thyroid cancer initiation and progression and informing the basis for stage-targeted precision therapies. Results The overall trinucleotide mutational landscape was largely similar between primary and metastatic THCA. However, GTG → GAG, TTG → TCG, and ATG → ACG substitutions were at substantially higher proportions in metastases. These differences in trinucleotide mutation profile were insufficient to cause the differences in variant prevalence between primary and metastatic THCA. Neutral mutation accumulation was significantly higher in metastatic tumors than in primary tumors (rank-biserial correlation = 0.63; P < 2.2 × 10 −16 ; Mann–Whitney U test), and across all 16 genes analyzed, neutral mutation rates were elevated in metastatic disease ( Table 1 ). Mutations of RET were more prevalent in metastatic tumors than in primary tumors ( Fig. 1A ). Consistent with this pattern of prevalence, our analysis showed that RET mutations were subject to weaker selection during primary tumorigenesis, and stronger selection during metastatic progression ( Fig. 1B ). In contrast, NRAS and KMT2C mutations exhibited the opposite trajectory: they were much more strongly selected during primary tumorigenesis than during progression to metastasis, even though their prevalence was similar across stages. View this table: View inline View popup Table 1. Gene-level mutation rates in primary and metastatic thyroid tumors. Download figure Open in new tab Figure 1. ( A ) Prevalence of mutations in 16 selected genes across primary and metastatic thyroid cancers. ( B ) Cancer effect sizes of somatic variants in oncogenic sites / regions / domains of 16 genes that are known to act as drivers in thyroid cancer tumorigenesis and metastasis. Metastases carried BRAF mutations at a frequency comparable to primary tumors, and BRAF mutation rates were increasing but fairly consistent between stages (2.5 × 10 −7 vs . 8.4 × 10 −8 ). In contrast new BRAF mutations were subject to much stronger selection during the transition from organogenesis to primary THCA than during progression to metastasis ( Fig. 1B ) . Just as a similar mutation frequency across stages does not reliably scale with selective pressure, a higher frequency of gene mutation in a later stage does not necessarily equate to higher selection. The prevalence of TP53 mutations was higher in metastatic tumors than in primary tumors. However, the selection intensity for TP53 mutations occurring during progression to metastasis was lower than it was for mutations occurring during primary tumorigenesis ( Fig. 1B ) . In this case, variant prevalence increase and strength of selection on the variant were decoupled, with prevalence increasing even as selection intensity decreased. Mutations in TERT, ATM, NF1, NKX2-1, EIF1AX, RBM10, PIK3CA , and ARID1A were subject to stronger somatic selection from organogenesis through primary tumorigenesis than during progression to metastasis ( Fig. 1B ). Mutations in TBX3, CDKN2B , and BCOR genes did not exhibit statistically significant differences in the intensity of selection between primary tumorigenesis and progression to metastasis. Overall, most driver genes demonstrated higher selective pressure earlier in disease progression, with only a subset maintaining similar intensities across stages. Discussion Our analysis demonstrated that TP53 and RET mutations both exhibited higher prevalence in metastatic than in primary tumors. However, their selective dynamics were divergent: novel TP53 mutations were under weaker selection during progression to metastasis than during primary tumorigenesis, whereas RET mutations were under significantly stronger selection during metastatic progression—consistent with a prior study demonstrating a functional role of RET in metastatic THCA 16 . These findings indicate that therapeutic inhibition of RET might be beneficial even in tumors that have not yet acquired RET mutations, as such intervention could potentially forestall metastatic progression. By accounting for underlying neutral mutation rates and quantifying cancer effect, these analyses demonstrate the enhanced power and accuracy obtained when deconvolving mutation and selection differences across stages of cancer. Our analysis classified tumors as “primary” or “metastatic”, a relevant but coarse binary discretization of the continuum of thyroid cancer progression. Such discretization obscures intermediate states such as locally advanced or regionally metastatic disease, which may exert specific selective dynamics on novel gene variants. Nonetheless, the contrast between localized primaries and established distant metastases maximizes power with a limited sample size and provides a clear and biologically meaningful comparison. This dichotomy enables robust detection of shifts in selective pressure, while also motivating future work that dissects finer-grained transitions. Our analysis relied on bulk sequencing, which integrates signals from genetically heterogeneous tumor cell populations and does not distinguish clonal from subclonal mutations or model frequency-dependent selection among competing variants. Higher-resolution approaches such as single-cell sequencing or spatial genomics will be needed to capture these dynamics of clonal competition and dissemination. Nevertheless, this limitation does not compromise the accuracy of our estimates of population-level selective pressures, which reflect longer-term molecular evolutionary outcomes determining frequencies of variants across tumors. Incorporation of gene- and site-specific mutation rates to calculate cancer effect enables quantification of somatic selection and the contributions of individual variants and genes to thyroid tumorigenesis and progression. However, this approach does not elucidate the underlying biological mechanisms that drive that selection. It identifies which mutations are favored across disease stages, but cannot reveal whether selection arises from altered signaling pathways, changes in the tumor microenvironment, or other molecular and cellular processes. Accordingly, these findings should motivate functional studies, pathway analyses, and integrative genomic approaches that determine why specific variants confer selective advantages. Such complementary research will not only validate the drivers identified here but also provide mechanistic insights that can guide the development of effective, stage-specific therapeutic strategies. Finally, our analysis was limited to coding single-nucleotide variants, whereas other processes—copy number alterations, gene fusions, epigenetic modifications, transcriptional reprogramming, and interactions with the tumor microenvironment—also play critical roles in metastatic progression. Thus, our framework captures only part of the complex landscape of thyroid cancer evolution. Extending cancer effect size analyses to encompass these additional molecular layers will be an important next step, enabling a more comprehensive view of the selective forces driving thyroid cancer initiation and metastatic spread. Declaration of interest The authors declare that there is no conflict of interest that could be perceived as prejudicing the impartiality of the research reported. Funding The authors would like to acknowledge the Elihu endowment at Yale for support. Acknowledgements The authors would like to acknowledge the American Association for Cancer Research for the development of the AACR Project GENIE registry, as well as members of the consortium for their commitment to data sharing. Interpretations are the responsibility of study authors. Funder Information Declared Yale University, https://ror.org/03v76x132 , Elihu endowment Footnotes Analysis Code: https://github.com/Townsend-Lab-Yale/primary_metastatic_tc_effect_size_analysis References 1. ↵ Siegel RL , Kratzer TB , Giaquinto AN , et al. Cancer statistics, 2025 . CA: A Cancer Journal for Clinicians 2025 ; 75 ( 1 ): 10 – 45 . OpenUrl CrossRef PubMed 2. ↵ Bray F , Laversanne M , Sung H , et al. Global cancer statistics 2022: GLOBOCAN estimates of incidence and mortality worldwide for 36 cancers in 185 countries . CA Cancer J Clin 2024 ; 74 ( 3 ): 229 – 263 . OpenUrl CrossRef PubMed 3. ↵ Simard EP , Ward EM , Siegel R , et al. Cancers with increasing incidence trends in the United States: 1999 through 2008 . CA Cancer J Clin 2012 ; 62 ( 2 ): 118 – 128 . OpenUrl CrossRef PubMed Web of Science 4. ↵ Máximo V , Melo M , Zhu Y , et al. Genomic profiling of primary and metastatic thyroid cancers . Endocr Relat Cancer 2024 ; 31 ( 2 ); doi: 10.1530/ERC-23-0144 . OpenUrl CrossRef 5. ↵ Cannataro VL , Gaffney SG , Townsend JP . Effect Sizes of Somatic Mutations in Cancer . J Natl Cancer Inst 2018 ; 110 ( 11 ): 1171 – 1177 . OpenUrl CrossRef PubMed 6. ↵ Masoodi T , Siraj AK , Siraj S , et al. Whole-Exome Sequencing of Matched Primary and Metastatic Papillary Thyroid Cancer . Thyroid 2020 ; 30 ( 1 ): 42 – 56 . OpenUrl CrossRef PubMed 7. ↵ AACR Project GENIE Consortium . AACR Project GENIE: Powering Precision Medicine through an International Consortium . Cancer Discov 2017 ; 7 ( 8 ): 818 – 831 . OpenUrl Abstract / FREE Full Text 8. ↵ Blokzijl F , Janssen R , van Boxtel R , et al. MutationalPatterns: comprehensive genome-wide analysis of mutational processes . Genome Med 2018 ; 10 ( 1 ): 33 . OpenUrl CrossRef PubMed 9. ↵ Mandell JD , Cannataro VL , Townsend JP . Estimation of Neutral Mutation Rates and Quantification of Somatic Variant Selection Using cancereffectsizeR . Cancer Res 2023 ; 83 ( 4 ): 500 – 505 . OpenUrl CrossRef PubMed 10. ↵ Cannataro VL , Mandell JD , Townsend JP . Attribution of Cancer Origins to Endogenous, Exogenous, and Preventable Mutational Processes . Mol Biol Evol 2022 ; 39 ( 5 ); doi: 10.1093/molbev/msac084 . OpenUrl CrossRef 11. ↵ Alexandrov LB , Kim J , Haradhvala NJ , et al. The repertoire of mutational signatures in human cancer . Nature 2020 ; 578 ( 7793 ): 94 – 101 . OpenUrl CrossRef PubMed 12. ↵ Martincorena I , Raine KM , Gerstung M , et al. Universal Patterns of Selection in Cancer and Somatic Tissues . Cell 2018 ; 173 ( 7 ): 1823 . OpenUrl CrossRef PubMed 13. Cabanillas ME , Patel A , Danysh BP , et al. BRAF inhibitors: experience in thyroid cancer and general review of toxicity . Horm Cancer 2015 ; 6 ( 1 ): 21 – 36 . OpenUrl PubMed 14. Fakhruddin N , Jabbour M , Novy M , et al. BRAF and NRAS Mutations in Papillary Thyroid Carcinoma and Concordance in BRAF Mutations Between Primary and Corresponding Lymph Node Metastases . Sci Rep 2017 ; 7 ( 1 ): 4666 . OpenUrl PubMed 15. Ahmadi S , Landa I. The prognostic power of gene mutations in thyroid cancer . Endocr Connect 2024 ; 13 ( 2 ); doi: 10.1530/EC-23-0297 . OpenUrl CrossRef 16. ↵ Heilmann AM , Subbiah V , Wang K , et al. Comprehensive Genomic Profiling of Clinically Advanced Medullary Thyroid Carcinoma . Oncology 2016 ; 90 ( 6 ): 339 – 346 . OpenUrl CrossRef PubMed View the discussion thread. Back to top Previous Next Posted October 08, 2025. Download PDF Email Thank you for your interest in spreading the word about bioRxiv. NOTE: Your email address is requested solely to identify you as the sender of this article. Your Email * Your Name * Send To * Enter multiple addresses on separate lines or separate them with commas. You are going to email the following Deconvolving mutation and selection reveals stage-specific drivers of thyroid cancer Message Subject (Your Name) has forwarded a page to you from bioRxiv Message Body (Your Name) thought you would like to see this page from the bioRxiv website. Your Personal Message CAPTCHA This question is for testing whether or not you are a human visitor and to prevent automated spam submissions. Share Deconvolving mutation and selection reveals stage-specific drivers of thyroid cancer Moein Rajaei , Andrew Ju , Adebowale J. Adeniran , Jeffrey P. Townsend bioRxiv 2025.10.08.681166; doi: https://doi.org/10.1101/2025.10.08.681166 Share This Article: Copy Citation Tools Deconvolving mutation and selection reveals stage-specific drivers of thyroid cancer Moein Rajaei , Andrew Ju , Adebowale J. Adeniran , Jeffrey P. Townsend bioRxiv 2025.10.08.681166; doi: https://doi.org/10.1101/2025.10.08.681166 Citation Manager Formats BibTeX Bookends EasyBib EndNote (tagged) EndNote 8 (xml) Medlars Mendeley Papers RefWorks Tagged Ref Manager RIS Zotero Tweet Widget Facebook Like Google Plus One Subject Area Cancer Biology Subject Areas All Articles Animal Behavior and Cognition (7634) Biochemistry (17690) Bioengineering (13892) Bioinformatics (41935) Biophysics (21451) Cancer Biology (18587) Cell Biology (25499) Clinical Trials (138) Developmental Biology (13375) Ecology (19899) Epidemiology (2067) Evolutionary Biology (24316) Genetics (15609) Genomics (22505) Immunology (17736) Microbiology (40393) Molecular Biology (17180) Neuroscience (88598) Paleontology (666) Pathology (2832) Pharmacology and Toxicology (4824) Physiology (7641) Plant Biology (15151) Scientific Communication and Education (2045) Synthetic Biology (4294) Systems Biology (9824) Zoology (2271)

Text is read by the "Ask this paper" AI Q&A widget below. Extraction quality varies by source — PMC NXML preserves structure cleanly, OA-HTML may include some navigation residue, and OA-PDF can have broken hyphenation. The publisher copy (via DOI) is the canonical version.

My notes (saved in your browser only)

Ask this paper AI returns verbatim quotes from the full text · source: preprint-html

Answers must be backed by verbatim quotes from this paper's full text. Hallucinated quotes are dropped automatically; if no verbatim passage answers the question, we say so. How this works

Citation neighborhood (no data yet)

We don't have any in-corpus citations linked to this paper yet. This is a recent paper (2025) — citers typically take a year or two to land, and the OpenAlex reference graph may still be filling in.

Source provenance

europepmc
last seen: 2026-05-20T01:45:00.602351+00:00
unpaywall
last seen: 2026-06-19T06:35:33.578913+00:00