Full text
66,156 characters
· extracted from
preprint-html
· click to expand
GASPS: A Multi-Omics Framework for Defining Genomic Aberration-Driven Signatures and Predicting Patient Outcomes in Lung Cancer | bioRxiv /* */ /* */ <!-- <!-- /*! * yepnope1.5.4 * (c) WTFPL, GPLv2 */ (function(a,b,c){function d(a){return"[object Function]"==o.call(a)}function e(a){return"string"==typeof a}function f(){}function g(a){return!a||"loaded"==a||"complete"==a||"uninitialized"==a}function h(){var a=p.shift();q=1,a?a.t?m(function(){("c"==a.t?B.injectCss:B.injectJs)(a.s,0,a.a,a.x,a.e,1)},0):(a(),h()):q=0}function i(a,c,d,e,f,i,j){function k(b){if(!o&&g(l.readyState)&&(u.r=o=1,!q&&h(),l.onload=l.onreadystatechange=null,b)){"img"!=a&&m(function(){t.removeChild(l)},50);for(var d in y[c])y[c].hasOwnProperty(d)&&y[c][d].onload()}}var j=j||B.errorTimeout,l=b.createElement(a),o=0,r=0,u={t:d,s:c,e:f,a:i,x:j};1===y[c]&&(r=1,y[c]=[]),"object"==a?l.data=c:(l.src=c,l.type=a),l.width=l.height="0",l.onerror=l.onload=l.onreadystatechange=function(){k.call(this,r)},p.splice(e,0,u),"img"!=a&&(r||2===y[c]?(t.insertBefore(l,s?null:n),m(k,j)):y[c].push(l))}function j(a,b,c,d,f){return q=0,b=b||"j",e(a)?i("c"==b?v:u,a,b,this.i++,c,d,f):(p.splice(this.i++,0,a),1==p.length&&h()),this}function k(){var a=B;return a.loader={load:j,i:0},a}var l=b.documentElement,m=a.setTimeout,n=b.getElementsByTagName("script")[0],o={}.toString,p=[],q=0,r="MozAppearance"in l.style,s=r&&!!b.createRange().compareNode,t=s?l:n.parentNode,l=a.opera&&"[object Opera]"==o.call(a.opera),l=!!b.attachEvent&&!l,u=r?"object":l?"script":"img",v=l?"script":u,w=Array.isArray||function(a){return"[object Array]"==o.call(a)},x=[],y={},z={timeout:function(a,b){return b.length&&(a.timeout=b[0]),a}},A,B;B=function(a){function b(a){var a=a.split("!"),b=x.length,c=a.pop(),d=a.length,c={url:c,origUrl:c,prefixes:a},e,f,g;for(f=0;f<d;f++)g=a[f].split("="),(e=z[g.shift()])&&(c=e(c,g));for(f=0;f<b;f++)c=x[f](c);return c}function g(a,e,f,g,h){var i=b(a),j=i.autoCallback;i.url.split(".").pop().split("?").shift(),i.bypass||(e&&(e=d(e)?e:e[a]||e[g]||e[a.split("/").pop().split("?")[0]]),i.instead?i.instead(a,e,f,g,h):(y[i.url]?i.noexec=!0:y[i.url]=1,f.load(i.url,i.forceCSS||!i.forceJS&&"css"==i.url.split(".").pop().split("?").shift()?"c":c,i.noexec,i.attrs,i.timeout),(d(e)||d(j))&&f.load(function(){k(),e&&e(i.origUrl,h,g),j&&j(i.origUrl,h,g),y[i.url]=2})))}function h(a,b){function c(a,c){if(a){if(e(a))c||(j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}),g(a,j,b,0,h);else if(Object(a)===a)for(n in m=function(){var b=0,c;for(c in a)a.hasOwnProperty(c)&&b++;return b}(),a)a.hasOwnProperty(n)&&(!c&&!--m&&(d(j)?j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}:j[n]=function(a){return function(){var b=[].slice.call(arguments);a&&a.apply(this,b),l()}}(k[n])),g(a[n],j,b,n,h))}else!c&&l()}var h=!!a.test,i=a.load||a.both,j=a.callback||f,k=j,l=a.complete||f,m,n;c(h?a.yep:a.nope,!!i),i&&c(i)}var i,j,l=this.yepnope.loader;if(e(a))g(a,0,l,0);else if(w(a))for(i=0;i (function(w,d,s,l,i){w[l]=w[l]||[];w[l].push({'gtm.start':new Date().getTime(),event:'gtm.js'});var f=d.getElementsByTagName(s)[0];var j=d.createElement(s);var dl=l!='dataLayer'?'&l='+l:'';j.src='//www.googletagmanager.com/gtm.js?id='+i+dl;j.type='text/javascript';j.async=true;f.parentNode.insertBefore(j,f);})(window,document,'script','dataLayer','GTM-M677548'); Skip to main content Home About Submit ALERTS / RSS Search for this keyword Advanced Search New Results GASPS: A Multi-Omics Framework for Defining Genomic Aberration-Driven Signatures and Predicting Patient Outcomes in Lung Cancer Zijian Zhang , Xiang Wang , View ORCID Profile Chenyang Li , Robert Taylor Ripley , Jia Wu , Jianjun Zhang , Christopher I Amos , View ORCID Profile Chao Cheng doi: https://doi.org/10.1101/2025.08.21.671519 Zijian Zhang 1 Institute for Clinical and Translational Research, Baylor College of Medicine , Houston, Texas 2 Section of Epidemiology and Population Sciences, Department of Medicine, Baylor College of Medicine , Houston, Texas 3 Dan L Duncan Comprehensive Cancer Center, Baylor College of Medicine , Houston, Texas Find this author on Google Scholar Find this author on PubMed Search for this author on this site Xiang Wang 1 Institute for Clinical and Translational Research, Baylor College of Medicine , Houston, Texas 4 Graduate Program in Quantitative and Computational Biosciences, Baylor College of Medicine , Houston, Texas Find this author on Google Scholar Find this author on PubMed Search for this author on this site Chenyang Li 5 Department of Genomic Medicine, The University of Texas MD Anderson Cancer Center , Houston, Texas Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Chenyang Li Robert Taylor Ripley 6 David J. Sugarbaker Division of Thoracic Surgery, Michael E. DeBakey Department of Surgery, Baylor College of Medicine , Houston, Texas Find this author on Google Scholar Find this author on PubMed Search for this author on this site Jia Wu 7 Department of Imaging Physics, The University of Texas MD Anderson Cancer Center , Houston, Texas Find this author on Google Scholar Find this author on PubMed Search for this author on this site Jianjun Zhang 8 Department of Thoracic/Head and Neck Medical Oncology, The University of Texas MD Anderson Cancer Center , Houston, Texas 5 Department of Genomic Medicine, The University of Texas MD Anderson Cancer Center , Houston, Texas Find this author on Google Scholar Find this author on PubMed Search for this author on this site Christopher I Amos 9 University of New Mexico Comprehensive Cancer Center , Albuquerque, New Mexico 10 University of New Mexico Health Sciences Center , Albuquerque, New Mexico Find this author on Google Scholar Find this author on PubMed Search for this author on this site Chao Cheng 1 Institute for Clinical and Translational Research, Baylor College of Medicine , Houston, Texas 2 Section of Epidemiology and Population Sciences, Department of Medicine, Baylor College of Medicine , Houston, Texas 3 Dan L Duncan Comprehensive Cancer Center, Baylor College of Medicine , Houston, Texas Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Chao Cheng For correspondence: chao.cheng{at}bcm.edu Abstract Full Text Info/History Metrics Supplementary material Preview PDF Summary Lung cancer is the most common cause of cancer-related death worldwide. Recent advancements in targeted therapies and immunotherapies have achieved remarkable success. However, patient responses to treatments with lung cancer vary substantially. The mutation status of driver genes can direct personalized treatment, but their prognostic value and treatment efficacy are limited. In this study, we developed a statistical framework named Genomic Aberration-Derived Signature for Patient Stratification (GASPS) to characterize the transcriptomic deregulation of driver genomic aberrations and stratify patients. By applying GASPS to The Cancer Genome Atlas Lung Adenocarcinoma (TCGA-LUAD) data, we developed gene signatures for 38 driver genomic aberrations, including gene mutations, amplifications, and deletions. These signatures were applied to independent lung cancer transcriptomic datasets containing a total of 2,226 patient samples. Our results indicated that these driver gene signatures are much more prognostic than their corresponding genomic mutations. Interestingly, the two EGFR-related signatures characterizing EGFR mutation and amplification, respectively, exhibited contrasting associations with prognosis, treatment response, and immune infiltration in the tumor microenvironment. Moreover, the STK11 mutation signature, rather than the mutation status, was found to be predictive of the response and long-term benefit of patients treated with immune checkpoint blockade therapy in lung cancer. This framework is readily applicable to most cancer types using existing data to improve prognostic risk assessment and treatment efficacy by guiding personalized therapies. Introduction Lung cancer is the leading cause of cancer-related deaths in the U.S. and worldwide 1 . In 2024, the American Cancer Society estimated 234,580 new cases and 125,070 deaths from lung cancer in the United States 2 . Due to the majority of patients being diagnosed at an advanced stage, lung cancer is recognized as an aggressive disease with a poor prognosis 3 . In recent years, numerous new treatment options have been developed and many more are undergoing clinical trials for lung cancer, particularly targeted therapies and immune checkpoint blockade therapies (ICBT) 4 , 5 . Three generations of tyrosine kinase inhibitors targeting EGFR have been developed to treat non-small cell lung cancer (NSCLC) patients harboring mutations that lead to over-activation of the EGFR gene 6 . Additionally, ICBTs, such as anti-PD-1/PD-L1 treatments, have been widely implemented and have significantly improved the survival outcomes of patients with NSCLC 7 . These therapies are utilized as monotherapy or in combination with other treatments (e.g., chemotherapy), in neoadjuvant or adjuvant settings, based on the stage and clinicopathological characteristics of the patients 8 . Known as a heterogeneous disease, lung cancer patients exhibit substantial variation in prognosis and response to treatment 9 . Therefore, effective biomarkers are essential for identifying patients at high prognostic risk and enhancing treatment outcomes through precision cancer therapy. The intertumoral heterogeneity observed among lung cancer patients can largely be attributed to genomic variations, including somatic mutations and copy number alterations in their genomes 10 . The initiation and progression of lung cancer in each patient is driven by a distinct set of driver genomic aberrations, which, in turn, influence patient prognosis and treatment response. By identifying driver mutations in actionable genes, personalized treatment using targeted therapies can be implemented. This approach has led to the accelerated FDA approval of Vitrakvi (larotrectinib) for treating solid tumors harboring NTRK gene fusions 11 and Keytruda (pembrolizumab) for treating any solid tumors with microsatellite instability (MSI), regardless of the tissue of origin 12 . Despite some successful examples, the reliability of gene mutations in guiding the selection of targeted treatments remains uncertain 13 , 14 . For instance, in breast cancer, approximately 30-40% of patients harbor mutations in the PIK3CA gene. Although preclinical studies have shown that PIK3CA-mutated breast cancer cells are more responsive to PI3K inhibitors 15 , the reported predictive value of PIK3CA mutations in clinical settings remains contradictory. While some studies have demonstrated their predictive value for pan-PI3K inhibitors 16 , others have found no significant predictive benefit 17 – 19 . Essentially, tumor development is driven by the aberrant regulation of specific oncogenic or tumor-suppressive pathways, which can be deregulated by various mechanisms at both genomic and epigenomic levels. Although driver genomic aberrations, such as gene mutations, amplifications, deletions, and translocations, are the most likely mechanisms behind pathway deregulation during tumor initiation and progression, they are not the only ones. For example, somatic mutations in the TP53 gene have been observed in more than 50% of tumors. However, inactivation of the downstream p53 pathway can also occur through alternative mechanisms, including loss of TP53, hypermethylation of the TP53 promoter, and genomic alterations in other pathway-associated genes 20 . Therefore, relying exclusively on driver genomic aberrations to predict patient treatment outcomes may not provide sufficient accuracy for guiding personalized cancer treatment. In this study, we developed a novel statistical framework called Genomic Aberration-Derived Signature for Patient Stratification (GASPS) to integrate cancer genomic and transcriptomic data for improved patient stratification. GASPS defines gene signatures by simultaneously modeling the effects of genomic aberrations on gene expression changes in tumor samples. For a specific cancer type, it identifies gene signatures for each commonly observed driver genomic aberration, including gene mutations, amplifications, and deletions. These signatures can then be applied to independent cancer gene expression profiles to calculate patient-specific signature scores, collectively providing an overview of oncogenic and tumor-suppressive pathways in each tumor sample. In this study, we applied GASPS to lung adenocarcinoma (LUAD) data, defining a total of 38 signatures based on The Cancer Genome Atlas (TCGA) data. We demonstrated that these signatures served as reliable biomarkers for predicting patient prognosis and response to targeted or immunotherapy when validated on multiple independent lung cancer datasets. Methods Datasets Used in This Study TCGA-LUAD Data The TCGA LUAD dataset was obtained from the FireBrowse database ( http://firebrowse.org ), including RNA-seq, somatic mutation, copy number variation (CNV), DNA methylation data, and clinical information. RNA-seq data, normalized by the RSEM method 35 , were available for 515 LUAD patients. Somatic mutation data were provided in Mutation Annotation Format (MAF), detailing functionally relevant mutations such as Frame_Shift, Missense, Nonsense, and Splice_Site variants, while synonymous mutations were excluded. CNV data in Segment (SEG) files contained chromosomal segments with copy number alterations. Amplified and deleted genes were identified based on log 2 -transformed copy numbers. Driver genomic aberrations were determined for cancer-related genes present in at least 10% of LUAD samples, referencing the COSMIC database 36 . DNA methylation data, generated using the Illumina Human Methylation 450K BeadChip platform, provided CpG methylation levels. The median value across CpG sites was used to estimate global methylation per sample. TRACERx Data The TRACERx project investigates the evolutionary dynamics of NSCLC 37 . Processed RNA-seq, somatic mutation, and clinical data for 421 NSCLC patients were obtained from Zenodo (accession ID 7603386) 22 . The dataset includes primary, metastatic, and lymph node samples; however, only primary tumor samples were used in this study. Gentles Meta-data The Gentles dataset is a meta-cohort comprising seven NSCLC gene expression datasets with patient survival information 38 . The dataset, containing 1,106 NSCLC samples, was downloaded from the Gene Expression Omnibus (GEO) under accession ID GSE63679 39 . Patil-OAK Data The Phase 3 OAK trial ( NCT02008227 ) evaluated atezolizumab (anti-PD-L1) versus docetaxel in NSCLC patients 40 . RNA-seq profiles from 699 pretreatment tumor samples were obtained from the European Genome-phenome Archive (EGA) (EGAS00001005013) 23 . A summary of these datasets was included in the Suppl. Table S1. A more detailed description is provided in the Suppl. Methods and Materials. The GASPS framework GASPS is a statistical framework designed to define gene signatures for driver genomic aberrations in cancer. By analyzing the transcriptomic effects of these aberrations in tumor samples, GASPS enables the calculation of patient-specific signature scores, providing insights into tumor-specific biological pathways. The framework consists of three key components: GASPS-C1: Defining gene signatures for driver genomic aberrations GASPS constructs gene signatures by modeling the effects of genomic aberrations (e.g., mutations, amplifications, deletions) on gene expression. Using a multivariate linear regression model, informative genes are identified based on significant associations between genomic events and gene expression levels. Genes with significant coefficients are assigned weighted profiles (w⁺ and w⁻), which are trimmed to prevent extreme values and rescaled to a [0,1] range. In this study, we identified a total of 38 driver genomic aberrations based on the TCGA-LUAD somatic mutation and copy number variation data (Suppl. Table S2). These aberrations included 7 mutations, 28 amplifications, and 3 deletions of cancer-related genes that are present in at least 10% of tumor samples from the TCGA-LUAD data. GASPS-C2: Calculating signature scores Once gene signatures are established, they are applied to independent gene expression datasets to compute sample-specific scores. GASPS employs a modified binding association with sorted expression (BASE) algorithm to quantify pathway activity within tumor samples 41 , 42 . The method ranks genes by expression level and uses cumulative functions to assess the enrichment of informative genes. The deviation between these distributions is normalized against a null model, generating a final signature score (S = S⁺ - S⁻) that reflects pathway activation. In this study, we applied GASPS to three independent lung cancer transcriptomic data or meta-data including a total of 2226 tumor samples. For each sample, we calculated patient-specific scores for each of the 38 gene signatures to characterize its deregulated pathway. GASPS-C3: Predicting clinical outcomes Computed signature scores serve as candidate biomarkers for predicting clinical outcomes, including patient prognosis and response to therapy. These signatures can be integrated with clinical variables to improve predictive models, facilitating precision oncology approaches. In this study, we performed systematic analyses to examine the prognostic and predictive values of the 38 gene signatures in lung cancer. By leveraging genomic and transcriptomic data, GASPS provides a robust framework for patient stratification, advancing personalized cancer treatment strategies. More detailed description of this statistical framework is provided in the Suppl. Methods and Materials Clustering analysis of gene signature score We performed a hierarchical clustering analysis using the signature scores for the 1,106 lung cancer samples included in the Gentles dataset 38 . For each of the 38 driver gene signatures, we calculated the patient-specific scores in all samples. The resultant signature score matrix was used as the input data for clustering analysis to identify patient subgroups. The R function heatmap.2 was used to implement this analysis using the default parameter setting. Deconvolution analysis to infer immune infiltration The ESTIMATE algorithm was used to estimate the purity of tumor samples based on their gene expression profiles 43 . The TIMER algorithm was applied to deconvolute tumor gene expression data to infer infiltration levels of six major immune cell types, including B cells, CD4 T cells, CD8 T cells, neutrophils, macrophages, and dendritic cells 44 . Application of previous gene signatures We applied several previously published gene signatures to characterize tumor samples based on their gene expression data, including cell proliferation 45 , IFN-γ response 45 , and TGF-β response signatures 46 . These signatures have been applied to all TCGA-LUAD tumor samples by Thorsson et al. 47 , and the results from this article were used in our analysis. In addition, the data provided leukocyte and lymphocyte infiltration levels in each TCGA-LUAD sample, which were also included in our analysis. Survival analysis Cox proportional hazard models were applied to analyze the association between signature scores and patient survival outcomes, including overall survival (OS) and progression-free survival (PFS), based on the availability of survival data in each dataset. Univariable Cox regression models were applied to evaluate the prognostic effect of individual gene signatures using their scores as continuous variables. The multivariable Cox regression models were constructed to further evaluate their prognostic association after adjusting for established clinical variables such as age, gender, and tumor stage. The Kaplan-Meier plots and survival analyses were implemented using the “survival” and “survminer” packages developed for the R platform. Specifically, the “coxph” function was used to construct Cox proportional hazard models. The “survfit” and “ggsurvplot” functions were used to generate Kaplan-Meier survival curves. The “survdiff” function was used to compare the survival differences of two patient subgroups. Other statistical analyses Pearson and Spearman correlation coefficients were used to quantify and estimate the statistical significance of the associations between continuous variables. The Student t-test and the Wilcoxon rank sum test were applied to evaluate the differences in continuous variables (e.g., signature scores) between two patient groups (e.g., responders versus non-responders). When paired data were provided, paired tests were adopted. One-way ANOVA was conducted to compare continuous variables among multiple groups (e.g., tumor stages). All statistical analyses were performed using the R platform (version 4.3.1). Data and code availability All the data sets used in this study are publicly available. The TCGA-LUAD dataset analyzed in this study was obtained from FireBrowse database at http://firebrowse.org . The TRACERx data analyzed in this study were obtained from Zenodo at accession ID 7603386. The Gentles dataset analyzed in this study was downloaded from the Gene Expression Omnibus (GEO) at GSE63679. The Patil-OAK data analyzed in this study were obtained from the European Genome-phenome Archive (EGA) at EGAS00001005013. The original code for the analysis is publicly available for non-profit academic use as of the publication date. The example codes are deposited in Github: https://github.com/zijianzhang3/GASPS Results Define gene signatures to systematically model driver genomic aberration The development of cancer is driven by genomic alterations in oncogenes or tumor suppressors, including gene mutations, amplifications, and deletions. These driver genomic aberrations often occur in tumor samples in a co-occurring or mutually exclusive manner 21 . Within a single tumor, multiple genomic aberrations may coexist, deregulating downstream oncogenic or tumor-suppressive pathways. These deregulated pathways interact and collectively shape the transcriptomic output. The GASPS framework integrates somatic mutation, copy number variation, and transcriptomic data to define driver gene signatures simultaneously. By modeling the transcriptomic effects of all driver genomic aberrations together, GASPS takes into consideration their co-occurrence or mutual exclusivity while adjusting for established clinical factors such as age and tumor stage. These driver gene signatures can be applied to new cancer expression profiles to characterize the deregulated pathways underlying a sample. ( Figure 1a ) Compared to the original genomic aberrations, the resultant signature scores show stronger correlations with patient clinical outcomes. In this study, we utilized TCGA-LUAD data to define a total of 38 driver gene signatures, including 7 gene mutations, 28 amplifications, and 3 deletions. We then applied these signatures to multiple high-quality NSCLC datasets to evaluate their ability to predict patient prognosis and response to chemotherapy or immunotherapy ( Figure 1b ). Download figure Open in new tab Figure 1: The GASPS framework and its application to lung adenocarcinoma. (a) Overview of the GASPS framework. (b) Application of 38 gene signatures for genomic aberrations to predict patient outcomes in lung adenocarcinoma. Validate driver gene signatures using the TRACERx dataset To validate these signatures, we applied them to an independent RNA-seq dataset generated by the TRAcking Cancer Evolution through Therapy Rx (TRACERx) project. This dataset contains 1,011 multi-regional transcriptomic profiles and whole exome sequencing profiles from a total of 421 patients with NSCLC 22 . Out of the seven genes with defined mutation signatures, six genes—TP53, KRAS, EGFR, STK11, NF1, and SETBP1—are mutated in at least 50 patients (>10%). We expect that the signature scores for a driver mutation would be significantly higher in tumor regions harboring mutations of the corresponding gene compared to those without. Indeed, we validated the effectiveness of all mutation signatures, except for NF1 (Supp. Figure S1). For example, among the 1,011 TRACERx samples, 406 samples have a wild-type TP53 gene, while 605 have at least one TP53 mutation. Based on the predicted functional impact, the mutated samples were further categorized into 583 with at least one driver mutation in TP53 (Driver-mutation, D) and 22 with only non-driver mutations (Non-Driver mutation, ND). The TP53-Mut signature scores were significantly higher in both the Driver-mutation ( P = 6e-69) and non-driver mutation ( P = 6e-07) groups compared to the TP53 wild-type group. Although TP53-Mut signature scores were higher in the Driver-mutation group than in the non-driver mutation group, this difference was not statistically significant ( P > 0.1). For EGFR, KRAS, and STK11, the corresponding signature scores were significantly higher in the Driver-mutation group compared to both the non-driver mutation and wild-type groups, but no significant difference was observed between the latter two groups. For SETBP 1 , no driver mutations were identified, but 102 samples had non-driver mutations, which showed significantly higher SETBP1-Mut scores than their wild-type counterparts ( P = 0.002). These results indicate that the mutation signatures defined based on TCGA-LUAD data can be effectively applied to other datasets to infer gene mutation status and the underlying pathway activities. Association of driver gene signatures with patient prognosis We applied these signatures to the Gentles dataset, a LUAD meta-dataset comprising transcriptomic profiles of 1,086 lung adenocarcinoma samples from seven independent cohorts. For each sample, we calculated a vector of signature scores using the 38 driver gene signatures, transforming the gene expression matrix into a signature score matrix. Hierarchical clustering based on this matrix stratified patients into two distinct groups ( Figure 2a ), which exhibited significant differences in patient OS ( Figure 2b ). Next, we assessed the prognostic relevance of individual signatures, identifying 24 signatures that were significantly associated with patient OS, including 13 protective signatures (Hazard Ratio, HR < 1 and P 1 and P < 0.01) ( Figure 2c ). For example, the CDKN2A-Del signature score was strongly linked to poor prognosis ( P = 8e-11), with the high-score group showing significantly shorter OS when dichotomized by the median score ( Figure 2d , Suppl. Table S3). Conversely, the EXT1-Amp signature score was associated with favorable prognosis ( P = 6e-12), where the high-score group displayed significantly longer OS ( Figure 2e , Suppl. Table S3). Download figure Open in new tab Figure 2: Prognostic value of genomic aberration-derived gene signatures in lung adenocarcinoma. (a) Hierarchical clustering of LUAD samples based on gene signature scores stratified patients into two distinct groups. (b) Kaplan-Meier survival curves exhibiting significant overall survival between the two patient groups. (c) Volcano plot displaying the prognostic association of individual gene signatures. (d-e) Kaplan-Meier survival curves for representative hazardous (CDKN2A-Del) and protective (EXT1-Amp) signatures. Patients with high CDKN2A-Del scores had significantly shorter OS, while high EXT1-Amp scores were associated with improved survival. (f) The CDKN2A-Del signature provides additional prognostic values after adjusting for clinical factors. (g) Boxplot illustrating CDKN2A-Del signature scores across different lung cancer stages, showing increasing scores from early to late stages. (h-i) Kaplan-Meier survival curves for CDKN2A-Del in Stage I and Stage III patients, showing significant prognostic stratification. (j-m) Validation of the CDKN2A-Del and EXT1-Amp signatures in independent LUAD datasets (TCGA and TRACERx), confirming their prognostic significance. We further evaluated whether these gene signatures provided additional prognostic value after adjusting for established clinical factors through multivariable Cox regression analysis. Most signatures remained significant after adjusting for age, sex, and tumor stage (Suppl. Figure S2), exemplified by the CDKN2A-Del signature ( Figure 2f ). Stratified analyses within specific tumor stages revealed that CDKN2A-Del signature scores progressively increased from early to late stages, with significant differences observed between stages ( Figure 2g ). Moreover, this signature could further stratify prognosis within Stage I and Stage III patient subgroups ( Figure 2h-i ). The prognostic utility of our signatures was validated in independent LUAD datasets, including TCGA-LUAD and TRACERx, where CDKN2A-Del and EXT1-Amp signatures demonstrated consistent prognostic significance ( Figure 2j-m ). Predictive value of driver gene signatures to chemotherapy and immunotherapy After demonstrating the prognostic value of all signatures, we further evaluated their ability to predict patient responses to chemotherapy and immunotherapy using data from clinical trials. Specifically, we applied our gene signatures to the RNA-seq dataset from the Patil-OAK clinical trial, which includes a docetaxel arm (chemotherapy) and an atezolizumab (anti-PD-L1) arm (immune checkpoint blockade therapy, ICBT) for patients with advanced NSCLC 23 . By comparing signature scores between responders and non-responders in the chemotherapy arm, we identified 10 significant signatures ( P < 0.01) predictive of patient sensitivity to docetaxel ( Figure 3a , Suppl. Table S4). Among these, 5 signatures showed elevated scores in responders. For instance, patients with higher MYC-Amp signature scores were more likely to respond to chemotherapy ( Figure 3b ). Conversely, 5 signatures exhibited significantly lower scores in responders, such as the RAC1-Amp signature ( Figure 3c ). Notably, our analysis revealed that the EGFR-Mut signature, but not the EGFR-Amp signature, was associated with chemotherapy sensitivity, which will be discussed in a later section. Download figure Open in new tab Figure 3: Gene signature scores predict patient response to chemotherapy and immunotherapy. (a) Volcano plot showing gene signatures associated with response to chemotherapy (docetaxel) in the Patil-OAK trial cohort. The X-axis represents the difference in signature scores between responders (R) and non-responders (NR), while the Y-axis indicates the statistical significance (-log10 P -value). Red and blue dots denote signatures with significantly higher scores in responders and non-responders, respectively. (b-c) Boxplots showing the distribution of MYC-Amp (b) and RAC1-Amp (c) signature scores between responders and non-responders to chemotherapy. (d) Volcano plot showing gene signatures associated with response to anti-PD-L1 immunotherapy in the same cohort. (e-f) Boxplots depicting the distribution of TP53-Mut (e) and ELK4-Amp (f) signature scores between responders and non-responders to immunotherapy. Statistical significance is indicated above the plots. R: Responders; NR: Non-responders . Similarly, we identified a total of 5 signatures predictive of patient response to anti-PD-L1 therapy, including 2 signatures with elevated scores and 3 signatures with reduced scores in responders compared to non-responders ( Figure 3d ). For example, patients with a defective p53 pathway, as indicated by higher TP53-Mut signature scores, were more likely to respond to immunotherapy ( Figure 3e ), while those with higher ELK4-Amp signature scores were more likely to be non-responders ( Figure 3f ). Notably, the STK11-Mut signature emerged as the most predictive of response, which will also be discussed in detail in a later section. The predictive ability of gene signatures for chemotherapy and immunotherapy was not correlated ( R = 0.07, Suppl. Figure S3), indicating that distinct sets of signatures are required for response prediction in different treatment modalities. Differential prognostic values between EGFR-Mut and EGFR-Amp signatures Among all gene signatures, the EGFR-Mut and EGFR-Amp signatures were respectively defined based on the mutation and amplification status of the EGFR gene. Our analyses revealed substantial differences in their associations with clinical outcomes and molecular features. First, the EGFR-Mut signature was linked to favorable prognosis, whereas the EGFR-Amp signature was associated with unfavorable prognosis. Specifically, patients with higher EGFR-Mut signature scores demonstrated significantly longer survival times compared to those with lower scores across three independent datasets: Gentles, TRACERx, and TCGA-LUAD ( Figure 4a-c ). In contrast, the opposite pattern was observed for the EGFR-Amp signature ( Figure 4d-f ). Download figure Open in new tab Figure 4: Differential prognostic and predictive value of EGFR-Mut and EGFR-Amp gene signatures in lung cancer. (a-c) Higher EGFR-Mut signature scores were associated with a better prognosis in three independent datasets. (d-f) Higher EGFR-Amp signature scores were associated with a poorer prognosis in the same datasets. (g) EGFR-Mut but not EGFR-Amp signature scores showing significant difference between responders and non-responders to chemotherapy. (h-i) Progression-free survival (PFS) curves for patients treated with chemotherapy, showing that higher EGFR-Mut signature scores are associated with longer PFS, while EGFR-Amp scores show no significant correlation. (j-k) Correlation between EGFR-related signatures and tumor proliferation rates. (l) Heatmap illustrating the correlations of EGFR-Mut and EGFR-Amp signatures with the infiltration level of various immune cell types as well as the overall infiltration level (ImmuneScore). (m) Summary table highlighting differences in tumor proliferation, immune infiltration, prognosis, and treatment response between the two EGFR-related signatures. R: Responders; NR: Non-responders . Second, the EGFR-Mut signature, but not the EGFR-Amp signature, predicted patient sensitivity to chemotherapy in the Patil-OAK dataset. EGFR-Mut signature scores were significantly higher in responders compared to non-responders, a trend not seen for the EGFR-Amp signature ( Figure 4g ). Notably, patients with higher EGFR-Mut signature scores exhibited longer PFS under chemotherapy, suggesting a sustained benefit from treatment while the EGFR-Amp signature not ( Figure 4h-i ). However, in the immune checkpoint blockade therapy arm of the same cohort, neither the EGFR-Mut nor the EGFR-Amp signature was correlated with patient response to anti-PD-L1 treatment (Suppl. Figure S4). To explore the differential associations of these two EGFR-related signatures, we examined their correlations with tumor cell proliferation and immune infiltration in the tumor microenvironment (TME). Interestingly, the EGFR-Mut signature showed a strong negative correlation with tumor proliferation scores ( R = −0.71, P < 0.001), whereas the EGFR-Amp signature exhibited a positive correlation ( R = 0.35, P < 0.001) ( Figure 4j-k ). Additionally, the EGFR-Mut signature was associated with higher levels of overall immune infiltration (ImmuneScore) and key immune cell populations within the TME ( Figure 4l ). In contrast, the EGFR-Amp signature showed no significant association with immune infiltration. Taken together, our findings suggest that the EGFR-Mut and EGFR-Amp signatures have distinct effects on tumor proliferation and immune infiltration, which likely underlie their differing associations with patient prognosis and chemotherapy response ( Figure 4m ). STK11-Mut signature is a predictive biomarker for patient response to ICBT As described above, the STK11-Mut signature was strongly associated with patient response to ICBT in the Patil-OAK trial. Responders exhibited significantly lower STK11-Mut signature scores than non-responders in the ICBT arm; this difference was absent in the chemotherapy arm ( Figure 5a , Supplementary Figure 5). However, response rates did not significantly differ based on STK11 mutation status alone within the ICBT arm ( Figure 5b ; Fisher’s exact test, P > 0.1). Furthermore, when patients were divided at the median STK11-Mut signature score, the low-score group demonstrated significantly longer PFS than the high-score group, indicating sustained treatment benefits from ICBT ( Figure 5c ). In contrast, the STK11 mutation itself showed no correlation with PFS in the same cohort ( Figure 5d , P > 0.1). Download figure Open in new tab Figure 5 The STK11-Mut signature is predictive of patient response to immune checkpoint blockade therapy (ICBT). (a) STK11-Mut signature scores were significantly lower in responders (R) than in non-responders (NR) to ICBT. (b) STK11 mutation status was not associated with patient response to ICBT. (c-d) Patients with higher STK11-Mut signature scores showed significantly shorter progression-free survival (PFS) when treated by ICBT (c), which was not observed when stratified by the STK11 mutation status (d). (e) Scatter plot showing the lack of correlation between STK11-Mut signature scores and tumor proliferation rate. (f-h) Scatter plots demonstrating significant negative correlations between STK11-Mut signature scores and overall immune score (f), leukocyte infiltration (g), and lymphocyte infiltration (h), suggesting immunosuppressive properties. (i) Heatmap depicting the correlation of STK11-Mut signature scores with different immune cell populations in the tumor microenvironment. (j-k) Boxplots showing significantly higher IFN-gamma (j) and TGF-beta (k) scores in patients with low STK11-Mut signature scores. (l) Scatter plot illustrating a negative correlation between STK11-Mut signature scores and global DNA methylation levels. (m) Boxplot comparing global DNA methylation levels between STK11-mutant and wild-type (WT) samples, showing significantly increased methylation in STK11-mutant cases. (n) Scatter plot showing a positive correlation between global DNA methylation and immune score. To further investigate the underlying mechanism, we conducted additional analyses. Interestingly, the STK11-Mut signature score was not associated with tumor proliferation ( R = 0.006) ( Figure 5e ). However, it exhibited a strong negative correlation with the ImmuneScore ( R = −0.55), which reflects the overall level of immune infiltration in the TME ( Figure 5f ). Specifically, the STK11-Mut signature was inversely correlated with the infiltration of both leukocytes ( R = −0.36) and lymphocytes ( R = −0.28) ( Figure 5g-h ). Deconvolution analysis further revealed a negative correlation between this signature and the infiltration of all major immune cell types ( Figure 5i ). Moreover, patients with higher STK11-Mut scores tended to exhibit lower IFN-γ ( Figure 5j ) and TGF-β ( Figure 5k ) responses, suggesting a relatively "cold" immune TME in these samples. A previous study reported that STK11 loss in LUAD is associated with global DNA hypomethylation 24 . Using the TCGA-LUAD dataset, we calculated the correlation between all gene signatures and global methylation levels (measured as the median methylation fraction of all CpG sites). The STK11-Mut signature emerged as the most strongly correlated signature ( Figure 5l , R = −0.45). Indeed, patients with STK11 mutations exhibited significantly lower median methylation levels compared to their wild-type counterparts ( Figure 5m ). Interestingly, global methylation levels were also positively correlated with ImmuneScore ( Figure 5n , R = 0.36). However, the correlation between STK11-Mut scores and ImmuneScore ( R = −0.55) was much stronger and remained significant even after adjusting for global methylation levels (Partial Correlation Coefficient = −0.47). Although the global reduction in DNA methylation observed in STK11 -mutated samples is noteworthy, it does not account for the cold immune environment present in these tumors. Discussion In this study, we developed an integrative framework to model the downstream effects of driver genomic aberrations while accounting for their co-occurrence, mutual exclusivity, and clinical variables. Using TCGA-LUAD data, we defined gene signatures for 38 driver genomic aberrations. These signatures were applied to several lung cancer datasets to transform gene expression profiles into signature score profiles, providing a comprehensive landscape of deregulated pathways in each sample. Compared to the genomic aberrations themselves, these signatures proved more informative in predicting clinical outcomes. Many signatures demonstrated reproducible prognostic value, even when adjusted for established clinical factors. Additionally, some signatures were predictive of patient response to chemotherapy or immunotherapy. Interestingly, despite representing the same gene, we found that the EGFR-Mut and EGFR-Amp signatures differed significantly in their ability to predict clinical outcomes. Finally, we showed that the STK11-Mut signature could serve as a candidate biomarker for predicting patient sensitivity to immunotherapy in NSCLC. An interesting finding of this study is the differential clinical outcome association between the two EGFR signatures. While the EGFR-Mut signature was associated with favorable prognosis under standard care and predictive of patient response to chemotherapy, the EGFR-Amp signature was linked to unfavorable prognosis. These results highlight the distinct downstream effects of these two driver genomic aberrations. Most somatic mutations in the EGFR gene occur at specific hotspots, such as short deletions in exon 19 and the L858R point mutation, which lead to over-activation of the EGFR protein. In contrast, EGFR amplification typically involves broad amplification of chromosomal segments rather than focal amplification of the EGFR gene. Consequently, the EGFR-Amp signature reflects the combined downstream effects of many genes co-amplified with EGFR, rather than EGFR alone. Indeed, the EGFR-Mut and EGFR-Amp signature scores exhibited a negative correlation across all datasets (e.g., R = −0.39 in the Gentles dataset). These differences might also account for the inverse correlations between the two signatures and tumor proliferation scores, as well as the association of the EGFR-Mut signature-but not the EGFR-Amp signature-with a cold immune environment in the TME. A critical discovery from this study is the identification of the STK11-Mut signature as a potential biomarker for predicting patient sensitivity to immune checkpoint blockade therapy (ICBT). Previous studies have reported a link between STK11 mutations and resistance to immunotherapy 25 – 27 . STK11 is a tumor suppressor gene, with mutations observed in approximately 17-23% of patients with NSCLC 28 – 30 . Our results indicated that inactivation of the STK11 gene is associated with patient resistance to anti-PD-L1 treatment, potentially mediated by a cold immune environment in these patients. The association between STK11 mutations and immunotherapy resistance has been noted in prior research 31 – 33 . An interesting characteristic of STK11 mutations is global DNA hypomethylation, which has been reported in several studies 24 , 34 . In this study, we demonstrated that global methylation levels of LUAD samples are positively correlated with overall immune infiltration levels in the TME ( R = 0.36). However, further investigation suggested that global DNA hypomethylation may not be the primary driver of reduced immune infiltration in STK11-mutated samples. In summary, we developed a robust statistical framework to integrate somatic mutation and copy number variation data with transcriptomic profiles of cancer samples. The resulting gene signatures offer a synergistic representation of deregulated cancer-related pathways associated with a comprehensive list of driver genomic aberrations in a given cancer type. Although demonstrated in LUAD, this framework provides a powerful tool that can be readily applied to other cancer types. Author contributions Z.Z. performed formal analysis, investigation, validation, visualization, and contributed to original drafting and manuscript revision. X.W. conducted formal analysis, investigation, visualization, and contributed to manuscript revision. C.L. contributed to investigation, data curation, and manuscript revision. R.T.R., J.W., J.Z., and C.I.A. contributed to the investigation and critical review of the manuscript. C.C. conceived and supervised the study, developed the methodology, performed formal analysis, contributed to writing the original draft, manuscript revision, and obtained funding. All authors reviewed the manuscript. Declaration of interest R.T.R. reported grant funding from the National Institutes of Health (R37, R01, U01, U24) and the DeGregorio Family Foundation; clinical trial support from AstraZeneca and Genentech; Vice President of the Board of Directors for the Meso Foundation; and speakers’ bureau for Merck. J.Z. reports research funding from Helius, Johnson and Johnson, Merck, Novartis, Summit, and personal fees from AstraZeneca, Catalyst, GenePlus, Hengrui, Innovent, Johnson and Johnson, Novartis, Oncohost, Takeda and Varian outside the submitted work. The remaining authors declare no conflict of interest. Supplemental information titles and legends Document Supplementary Methods and Materials Supplementary Figure S1-S3 Supplementary Table S1-S4 Supplementary Figure S1: Driver gene mutation status reflected by genomic aberration signature scores. (a-f) Boxplots showing signature scores derived from TP53-Mut, EGFR-Mut, KRAS-Mut, STK11-Mut, SETBP1-Mut, and NF1-Mut (from left to right) in the TRACERx dataset, categorized by driver mutations (D), non-driver mutations (ND), and wild-type (WT). Driver mutation scores are significantly higher than wild type except for SETBP1 and NF1. However, non-driver mutation samples show significantly elevated scores compared to wild type in SETBP1. Sample sizes for each group are shown below the boxplots. Statistical significance is denoted by the p-values above each comparison. Supplementary Figure S2: The prognosis of genomic aberrations-derived signatures in lung cancer. (a) Volcano plot showing the association of each gene signatures with prognosis after adjusting for age, gender, and tumor stage using multivariable Cox regression model. Supplementary Figure S3: The treatment response prediction performance. (a) ROC curve showing the predictive performance of MYC-Amp and RAC1-Amp signatures as predictor factors for chemotherapy response. (b) ROC curve exhibiting TP53-Mut and ELK4-Amp signatures in predicting immunotherapy response. (c) Scatter plot displaying no significant correlation of AUC values between chemotherapy response and immune therapy response predictions for each signature. Supplementary Figure S4: The predictive value of EGFR-Mut and EGFR-Amp signatures for immune checkpoint blockade therapy. (a-b) Boxplots showing that no significant differences in EGFR-Amp (a) and EGFR-Mut (b) scores between responders and non-responders in the Patil-OAK immunotherapy arm, respectively. R: Responders; NR: Non-responders . Supplementary Figure S5: The predictive value of STK11-Mut signatures for chemotherapy. (a) Boxplots showing that the STK11-Mut signature was not associated with patient response to chemotherapy. (b) Patients with high STK11-Mut signature scores did not show a difference in progression-free survival compared to those with low scores. R: Responders; NR: Non-responders. Supplementary Table S1: Datasets used in this study. Supplementary Table S2: Genomic aberrations selected in TCGA-LUAD. Supplementary Table S3: The Cox regression model for signatures in the Gentles dataset. Supplementary Table S4: The difference in signature scores between responders (R) and non-responders (NR) in the Patil-OAK dataset. Acknowledgments This study is supported by the Cancer Prevention Research Institute of Texas (CPRIT) (RR180061) to C.C. and the National Cancer Institute of the National Institutes of Health (1R01CA269764) to C.C. C.C. is a CPRIT Scholar in Cancer Research. Funder Information Declared Cancer Prevention Research Institute of Texas , RR180061 National Cancer Institute of the National Institutes of Health , 1R01CA269764 References 1. ↵ Bray , F. , Laversanne , M. , Sung , H. , Ferlay , J. , Siegel , R.L. , Soerjomataram , I. , and Jemal , A . ( 2024 ). Global cancer statistics 2022: GLOBOCAN estimates of incidence and mortality worldwide for 36 cancers in 185 countries . CA Cancer J Clin 74 , 229 – 263 . doi: 10.3322/caac.21834 . OpenUrl CrossRef 2. ↵ Siegel , R.L. , Giaquinto , A.N. , and Jemal , A . ( 2024 ). Cancer statistics, 2024 . CA Cancer J Clin 74 , 12 – 49 . doi: 10.3322/caac.21820 . OpenUrl CrossRef PubMed 3. ↵ Herbst , R.S. , Morgensztern , D. , and Boshoff , C . ( 2018 ). The biology and management of non-small cell lung cancer . Nature 553 , 446 – 454 . doi: 10.1038/nature25183 . OpenUrl CrossRef PubMed 4. ↵ Tan , A.C. , and Tan , D.S.W . ( 2022 ). Targeted Therapies for Lung Cancer Patients With Oncogenic Driver Molecular Alterations . J Clin Oncol 40 , 611 – 625 . doi: 10.1200/JCO.21.01626 . OpenUrl CrossRef PubMed 5. ↵ Meyer , M.-L. , Fitzgerald , B.G. , Paz-Ares , L. , Cappuzzo , F. , Jänne , P.A. , Peters , S. , and Hirsch , F.R . ( 2024 ). New promises and challenges in the treatment of advanced non-small-cell lung cancer . Lancet 404 , 803 – 822 . doi: 10.1016/S0140-6736(24)01029-8 . OpenUrl CrossRef PubMed 6. ↵ Zhou , F. , Guo , H. , Xia , Y. , Le , X. , Tan , D.S.W. , Ramalingam , S.S. , and Zhou , C . ( 2025 ). The changing treatment landscape of EGFR-mutant non-small-cell lung cancer . Nat Rev Clin Oncol 22 , 95 – 116 . doi: 10.1038/s41571-024-00971-2 . OpenUrl CrossRef PubMed 7. ↵ Lahiri , A. , Maji , A. , Potdar , P.D. , Singh , N. , Parikh , P. , Bisht , B. , Mukherjee , A. , and Paul , M.K . ( 2023 ). Lung cancer immunotherapy: progress, pitfalls, and promises . Mol Cancer 22 , 40 . doi: 10.1186/s12943-023-01740-y . OpenUrl CrossRef PubMed 8. ↵ Mountzios , G. , Remon , J. , Hendriks , L.E.L. , García-Campelo , R. , Rolfo , C. , Van Schil , P. , Forde , P.M. , Besse , B. , Subbiah , V. , Reck , M. , et al. ( 2023 ). Immune-checkpoint inhibition for resectable non-small-cell lung cancer - opportunities and challenges . Nat Rev Clin Oncol 20 , 664 – 677 . doi: 10.1038/s41571-023-00794-7 . OpenUrl CrossRef PubMed 9. ↵ Chen , Z. , Fillmore , C.M. , Hammerman , P.S. , Kim , C.F. , and Wong , K.-K . ( 2014 ). Non-small-cell lung cancers: a heterogeneous set of diseases . Nat Rev Cancer 14 , 535 – 546 . doi: 10.1038/nrc3775 . OpenUrl CrossRef PubMed 10. ↵ Jamal-Hanjani , M. , Quezada , S.A. , Larkin , J. , and Swanton , C . ( 2015 ). Translational implications of tumor heterogeneity . Clin Cancer Res 21 , 1258 – 1266 . doi: 10.1158/1078-0432.CCR-14-1429 . OpenUrl Abstract / FREE Full Text 11. ↵ Scott , L.J . ( 2019 ). Larotrectinib: First Global Approval . Drugs 79 , 201 – 206 . doi: 10.1007/s40265-018-1044-x . OpenUrl CrossRef PubMed 12. ↵ Marcus , L. , Lemery , S.J. , Keegan , P. , and Pazdur , R . ( 2019 ). FDA Approval Summary: Pembrolizumab for the Treatment of Microsatellite Instability-High Solid Tumors . Clin Cancer Res 25 , 3753 – 3758 . doi: 10.1158/1078-0432.CCR-18-4070 . OpenUrl Abstract / FREE Full Text 13. ↵ Joyner , M.J. , and Paneth , N . ( 2019 ). Promises, promises, and precision medicine . J Clin Invest 129 , 946 – 948 . doi: 10.1172/JCI126119 . OpenUrl CrossRef PubMed 14. ↵ Marquart , J. , Chen , E.Y. , and Prasad , V . ( 2018 ). Estimation of the Percentage of US Patients With Cancer Who Benefit From Genome-Driven Oncology . JAMA Oncol 4 , 1093 – 1098 . doi: 10.1001/jamaoncol.2018.1660 . OpenUrl CrossRef PubMed 15. ↵ Beaver , J.A. , Gustin , J.P. , Yi , K.H. , Rajpurohit , A. , Thomas , M. , Gilbert , S.F. , Rosen , D.M. , Ho Park , B. , and Lauring , J . ( 2013 ). PIK3CA and AKT1 mutations have distinct effects on sensitivity to targeted pathway inhibitors in an isogenic luminal breast cancer model system . Clin Cancer Res 19 , 5413 – 5422 . doi: 10.1158/1078-0432.CCR-13-0884 . OpenUrl Abstract / FREE Full Text 16. ↵ Baselga , J. , Im , S.-A. , Iwata , H. , Cortés , J. , De Laurentiis , M. , Jiang , Z. , Arteaga , C.L. , Jonat , W. , Clemons , M. , Ito , Y. , et al. ( 2017 ). Buparlisib plus fulvestrant versus placebo plus fulvestrant in postmenopausal, hormone receptor-positive, HER2-negative, advanced breast cancer (BELLE-2): a randomised, double-blind, placebo-controlled, phase 3 trial . Lancet Oncol 18 , 904 – 916 . doi: 10.1016/S1470-2045(17)30376-5 . OpenUrl CrossRef PubMed 17. ↵ Martín , M. , Chan , A. , Dirix , L. , O’Shaughnessy , J. , Hegg , R. , Manikhas , A. , Shtivelband , M. , Krivorotko , P. , Batista López , N. , Campone , M. , et al. ( 2017 ). A randomized adaptive phase II/III study of buparlisib, a pan-class I PI3K inhibitor, combined with paclitaxel for the treatment of HER2-advanced breast cancer (BELLE-4) . Ann Oncol 28 , 313 – 320 . doi: 10.1093/annonc/mdw562 . OpenUrl CrossRef PubMed 18. Vuylsteke , P. , Huizing , M. , Petrakova , K. , Roylance , R. , Laing , R. , Chan , S. , Abell , F. , Gendreau , S. , Rooney , I. , Apt , D. , et al. ( 2016 ). Pictilisib PI3Kinase inhibitor (a phosphatidylinositol 3-kinase [PI3K] inhibitor) plus paclitaxel for the treatment of hormone receptor-positive, HER2-negative, locally recurrent, or metastatic breast cancer: interim analysis of the multicentre, placebo-controlled, phase II randomised PEGGY study . Ann Oncol 27 , 2059 – 2066 . doi: 10.1093/annonc/mdw320 . OpenUrl CrossRef PubMed 19. ↵ Krop , I.E. , Mayer , I.A. , Ganju , V. , Dickler , M. , Johnston , S. , Morales , S. , Yardley , D.A. , Melichar , B. , Forero-Torres , A. , Lee , S.C. , et al. ( 2016 ). Pictilisib for oestrogen receptor-positive, aromatase inhibitor-resistant, advanced or metastatic breast cancer (FERGI): a randomised, double-blind, placebo-controlled, phase 2 trial . Lancet Oncol 17 , 811 – 821 . doi: 10.1016/S1470-2045(16)00106-6 . OpenUrl CrossRef PubMed 20. ↵ Joerger , A.C. , and Fersht , A.R . ( 2016 ). The p53 Pathway: Origins, Inactivation in Cancer, and Emerging Therapeutic Approaches . Annu Rev Biochem 85 , 375 – 404 . doi: 10.1146/annurev-biochem-060815-014710 . OpenUrl CrossRef PubMed 21. ↵ El Tekle , G. , Bernasocchi , T. , Unni , A.M. , Bertoni , F. , Rossi , D. , Rubin , M.A. , and Theurillat , J.-P. ( 2021 ). Co-occurrence and mutual exclusivity: what cross-cancer mutation patterns can tell us . Trends Cancer 7 , 823 – 836 . doi: 10.1016/j.trecan.2021.04.009 . OpenUrl CrossRef PubMed 22. ↵ Martínez-Ruiz , C. , Black , J.R.M. , Puttick , C. , Hill , M.S. , Demeulemeester , J. , Larose Cadieux , E. , Thol , K. , Jones , T.P. , Veeriah , S. , Naceur-Lombardelli , C. , et al. ( 2023 ). Genomic-transcriptomic evolution in lung cancer and metastasis . Nature 616 , 543 – 552 . doi: 10.1038/s41586-023-05706-4 . OpenUrl CrossRef PubMed 23. ↵ Patil , N.S. , Nabet , B.Y. , Müller , S. , Koeppen , H. , Zou , W. , Giltnane , J. , Au-Yeung , A. , Srivats , S. , Cheng , J.H. , Takahashi , C. , et al. ( 2022 ). Intratumoral plasma cells predict outcomes to PD-L1 blockade in non-small cell lung cancer . Cancer Cell 40 , 289 – 300 .e4. doi: 10.1016/j.ccell.2022.02.002 . OpenUrl CrossRef PubMed 24. ↵ Koenig , M.J. , Agana , B.A. , Kaufman , J.M. , Sharpnack , M.F. , Wang , W.Z. , Weigel , C. , Navarro , F.C.P. , Amann , J.M. , Cacciato , N. , Arasada , R.R. , et al. ( 2021 ). STK11/LKB1 Loss of Function Is Associated with Global DNA Hypomethylation and S-Adenosyl-Methionine Depletion in Human Lung Adenocarcinoma . Cancer Res 81 , 4194 – 4204 . doi: 10.1158/0008-5472.CAN-20-3199 . OpenUrl Abstract / FREE Full Text 25. ↵ Skoulidis , F. , Goldberg , M.E. , Greenawalt , D.M. , Hellmann , M.D. , Awad , M.M. , Gainor , J.F. , Schrock , A.B. , Hartmaier , R.J. , Trabucco , S.E. , Gay , L. , et al. ( 2018 ). STK11/LKB1 Mutations and PD-1 Inhibitor Resistance in KRAS-Mutant Lung Adenocarcinoma . Cancer Discov 8 , 822 – 835 . doi: 10.1158/2159-8290.CD-18-0099 . OpenUrl Abstract / FREE Full Text 26. Ricciuti , B. , Arbour , K.C. , Lin , J.J. , Vajdi , A. , Vokes , N. , Hong , L. , Zhang , J. , Tolstorukov , M.Y. , Li , Y.Y. , Spurr , L.F. , et al. ( 2022 ). Diminished Efficacy of Programmed Death-(Ligand)1 Inhibition in STK11- and KEAP1-Mutant Lung Adenocarcinoma Is Affected by KRAS Mutation Status . J Thorac Oncol 17 , 399 – 410 . doi: 10.1016/j.jtho.2021.10.013 . OpenUrl CrossRef PubMed 27. ↵ Arbour , K.C. , Jordan , E. , Kim , H.R. , Dienstag , J. , Yu , H.A. , Sanchez-Vega , F. , Lito , P. , Berger , M. , Solit , D.B. , Hellmann , M. , et al. ( 2018 ). Effects of Co-occurring Genomic Alterations on Outcomes in Patients with KRAS-Mutant Non-Small Cell Lung Cancer . Clin Cancer Res 24 , 334 – 340 . doi: 10.1158/1078-0432.CCR-17-1841 . OpenUrl Abstract / FREE Full Text 28. ↵ Jordan , E.J. , Kim , H.R. , Arcila , M.E. , Barron , D. , Chakravarty , D. , Gao , J. , Chang , M.T. , Ni , A. , Kundra , R. , Jonsson , P. , et al. ( 2017 ). Prospective Comprehensive Molecular Characterization of Lung Adenocarcinomas for Efficient Patient Matching to Approved and Emerging Therapies . Cancer Discov 7 , 596 – 609 . doi: 10.1158/2159-8290.CD-16-1337 . OpenUrl Abstract / FREE Full Text 29. Sanchez-Cespedes , M. , Parrella , P. , Esteller , M. , Nomoto , S. , Trink , B. , Engles , J.M. , Westra , W.H. , Herman , J.G. , and Sidransky , D . ( 2002 ). Inactivation of LKB1/STK11 is a common event in adenocarcinomas of the lung . Cancer Res 62 , 3659 – 3662 . OpenUrl Abstract / FREE Full Text 30. ↵ Cancer Genome Atlas Research Network ( 2014 ). Comprehensive molecular profiling of lung adenocarcinoma . Nature 511 , 543 – 550 . doi: 10.1038/nature13385 . OpenUrl CrossRef PubMed Web of Science 31. ↵ Skoulidis , F. , Araujo , H.A. , Do , M.T. , Qian , Y. , Sun , X. , Cobo , A.G. , Le , J.T. , Montesion , M. , Palmer , R. , Jahchan , N. , et al. ( 2024 ). CTLA4 blockade abrogates KEAP1/STK11-related resistance to PD-(L)1 inhibitors . Nature 635 , 462 – 471 . doi: 10.1038/s41586-024-07943-7 . OpenUrl CrossRef PubMed 32. West , H.J. , McCleland , M. , Cappuzzo , F. , Reck , M. , Mok , T.S. , Jotte , R.M. , Nishio , M. , Kim , E. , Morris , S. , Zou , W. , et al. ( 2022 ). Clinical efficacy of atezolizumab plus bevacizumab and chemotherapy in KRAS-mutated non-small cell lung cancer with STK11, KEAP1, or TP53 comutations: subgroup results from the phase III IMpower150 trial . J Immunother Cancer 10 , e003027 . doi: 10.1136/jitc-2021-003027 . OpenUrl Abstract / FREE Full Text 33. ↵ Singh , A. , Daemen , A. , Nickles , D. , Jeon , S.-M. , Foreman , O. , Sudini , K. , Gnad , F. , Lajoie , S. , Gour , N. , Mitzner , W. , et al. ( 2021 ). NRF2 Activation Promotes Aggressive Lung Cancer and Associates with Poor Clinical Outcomes . Clin Cancer Res 27 , 877 – 888 . doi: 10.1158/1078-0432.CCR-20-1985 . OpenUrl Abstract / FREE Full Text 34. ↵ Kottakis , F. , Nicolay , B.N. , Roumane , A. , Karnik , R. , Gu , H. , Nagle , J.M. , Boukhali , M. , Hayward , M.C. , Li , Y.Y. , Chen , T. , et al. ( 2016 ). LKB1 loss links serine metabolism to DNA methylation and tumorigenesis . Nature 539 , 390 – 395 . doi: 10.1038/nature20132 . OpenUrl CrossRef PubMed 35. ↵ Li , B. , and Dewey , C.N . ( 2011 ). RSEM: accurate transcript quantification from RNA-Seq data with or without a reference genome . BMC Bioinformatics 12 , 323 . doi: 10.1186/1471-2105-12-323 . OpenUrl CrossRef PubMed 36. ↵ Sondka , Z. , Dhir , N.B. , Carvalho-Silva , D. , Jupe , S. , Madhumita , null, McLaren , K. , Starkey , M. , Ward , S. , Wilding , J. , Ahmed , M. , et al. ( 2024 ). COSMIC: a curated database of somatic variants and clinical data for cancer . Nucleic Acids Res 52 , D1210 – D1217 . doi: 10.1093/nar/gkad986 . OpenUrl CrossRef PubMed 37. ↵ Frankell , A.M. , Dietzen , M. , Al Bakir , M. , Lim , E.L. , Karasaki , T. , Ward , S. , Veeriah , S. , Colliver , E. , Huebner , A. , Bunkum , A. , et al. ( 2023 ). The evolution of lung cancer and impact of subclonal selection in TRACERx . Nature 616 , 525 – 533 . doi: 10.1038/s41586-023-05783-5 . OpenUrl CrossRef PubMed 38. ↵ Gentles , A.J. , Bratman , S.V. , Lee , L.J. , Harris , J.P. , Feng , W. , Nair , R.V. , Shultz , D.B. , Nair , V.S. , Hoang , C.D. , West , R.B. , et al. ( 2015 ). Integrating Tumor and Stromal Gene Expression Signatures With Clinical Indices for Survival Stratification of Early-Stage Non-Small Cell Lung Cancer . J Natl Cancer Inst 107 , djv211 . doi: 10.1093/jnci/djv211 . OpenUrl CrossRef PubMed 39. ↵ Clough , E. , and Barrett , T . ( 2016 ). The Gene Expression Omnibus Database . Methods Mol Biol 1418 , 93 – 110 . doi: 10.1007/978-1-4939-3578-9_5 . OpenUrl CrossRef PubMed 40. ↵ Rittmeyer , A. , Barlesi , F. , Waterkamp , D. , Park , K. , Ciardiello , F. , von Pawel , J. , Gadgeel , S.M. , Hida , T. , Kowalski , D.M. , Dols , M.C. , et al. ( 2017 ). Atezolizumab versus docetaxel in patients with previously treated non-small-cell lung cancer (OAK): a phase 3, open-label, multicentre randomised controlled trial . Lancet 389 , 255 – 265 . doi: 10.1016/S0140-6736(16)32517-X . OpenUrl CrossRef PubMed 41. ↵ Cheng , C. , Yan , X. , Sun , F. , and Li , L.M . ( 2007 ). Inferring activity changes of transcription factors by binding association with sorted expression profiles . BMC Bioinformatics 8 , 452 . doi: 10.1186/1471-2105-8-452 . OpenUrl CrossRef PubMed 42. ↵ Khaleel , S.S. , Andrews , E.H. , Ung , M. , DiRenzo , J. , and Cheng , C . ( 2014 ). E2F4 regulatory program predicts patient survival prognosis in breast cancer . Breast Cancer Res 16 , 486 . doi: 10.1186/s13058-014-0486-7 . OpenUrl CrossRef PubMed 43. ↵ Yoshihara , K. , Shahmoradgoli , M. , Martínez , E. , Vegesna , R. , Kim , H. , Torres-Garcia , W. , Treviño , V. , Shen , H. , Laird , P.W. , Levine , D.A. , et al. ( 2013 ). Inferring tumour purity and stromal and immune cell admixture from expression data . Nat Commun 4 , 2612 . doi: 10.1038/ncomms3612 . OpenUrl CrossRef PubMed 44. ↵ Li , T. , Fu , J. , Zeng , Z. , Cohen , D. , Li , J. , Chen , Q. , Li , B. , and Liu , X.S . ( 2020 ). TIMER2.0 for analysis of tumor-infiltrating immune cells . Nucleic Acids Res 48 , W509 – W514 . doi: 10.1093/nar/gkaa407 . OpenUrl CrossRef PubMed 45. ↵ Wolf , D.M. , Lenburg , M.E. , Yau , C. , Boudreau , A. , and van’t Veer , L.J. ( 2014 ). Gene co-expression modules as clinically relevant hallmarks of breast cancer diversity . PLoS One 9 , e88309 . doi: 10.1371/journal.pone.0088309 . OpenUrl CrossRef PubMed 46. ↵ Teschendorff , A.E. , Gomez , S. , Arenas , A. , El-Ashry , D. , Schmidt , M. , Gehrmann , M. , and Caldas , C . ( 2010 ). Improved prognostic classification of breast cancer defined by antagonistic activation patterns of immune response pathway modules . BMC Cancer 10 , 604 . doi: 10.1186/1471-2407-10-604 . OpenUrl CrossRef PubMed 47. ↵ Thorsson , V. , Gibbs , D.L. , Brown , S.D. , Wolf , D. , Bortone , D.S. , Ou Yang , T.-H. , Porta-Pardo , E. , Gao , G.F. , Plaisier , C.L. , Eddy , J.A. , et al. ( 2018 ). The Immune Landscape of Cancer . Immunity 48 , 812 – 830.e14 . doi: 10.1016/j.immuni.2018.03.023 . OpenUrl CrossRef PubMed View the discussion thread. Back to top Previous Next Posted August 25, 2025. Download PDF Supplementary Material Email Thank you for your interest in spreading the word about bioRxiv. NOTE: Your email address is requested solely to identify you as the sender of this article. Your Email * Your Name * Send To * Enter multiple addresses on separate lines or separate them with commas. You are going to email the following GASPS: A Multi-Omics Framework for Defining Genomic Aberration-Driven Signatures and Predicting Patient Outcomes in Lung Cancer Message Subject (Your Name) has forwarded a page to you from bioRxiv Message Body (Your Name) thought you would like to see this page from the bioRxiv website. Your Personal Message CAPTCHA This question is for testing whether or not you are a human visitor and to prevent automated spam submissions. Share GASPS: A Multi-Omics Framework for Defining Genomic Aberration-Driven Signatures and Predicting Patient Outcomes in Lung Cancer Zijian Zhang , Xiang Wang , Chenyang Li , Robert Taylor Ripley , Jia Wu , Jianjun Zhang , Christopher I Amos , Chao Cheng bioRxiv 2025.08.21.671519; doi: https://doi.org/10.1101/2025.08.21.671519 Share This Article: Copy Citation Tools GASPS: A Multi-Omics Framework for Defining Genomic Aberration-Driven Signatures and Predicting Patient Outcomes in Lung Cancer Zijian Zhang , Xiang Wang , Chenyang Li , Robert Taylor Ripley , Jia Wu , Jianjun Zhang , Christopher I Amos , Chao Cheng bioRxiv 2025.08.21.671519; doi: https://doi.org/10.1101/2025.08.21.671519 Citation Manager Formats BibTeX Bookends EasyBib EndNote (tagged) EndNote 8 (xml) Medlars Mendeley Papers RefWorks Tagged Ref Manager RIS Zotero Tweet Widget Facebook Like Google Plus One Subject Area Bioinformatics Subject Areas All Articles Animal Behavior and Cognition (7640) Biochemistry (17707) Bioengineering (13903) Bioinformatics (41980) Biophysics (21465) Cancer Biology (18613) Cell Biology (25528) Clinical Trials (138) Developmental Biology (13387) Ecology (19920) Epidemiology (2067) Evolutionary Biology (24332) Genetics (15615) Genomics (22519) Immunology (17747) Microbiology (40424) Molecular Biology (17194) Neuroscience (88664) Paleontology (667) Pathology (2839) Pharmacology and Toxicology (4827) Physiology (7650) Plant Biology (15160) Scientific Communication and Education (2046) Synthetic Biology (4302) Systems Biology (9826) Zoology (2271)
Text is read by the "Ask this paper" AI Q&A widget below.
Extraction quality varies by source — PMC NXML preserves structure
cleanly, OA-HTML may include some navigation residue, and OA-PDF can
have broken hyphenation. The publisher copy
(via DOI)
is the canonical version.