Full text
29,878 characters
· extracted from
preprint-html
· click to expand
Radiomics-Based Lung Nodule Classification with Stochastic Search Variable Selection and Bayesian Logistic Regression | medRxiv /* */ /* */ <!-- <!-- /*! * yepnope1.5.4 * (c) WTFPL, GPLv2 */ (function(a,b,c){function d(a){return"[object Function]"==o.call(a)}function e(a){return"string"==typeof a}function f(){}function g(a){return!a||"loaded"==a||"complete"==a||"uninitialized"==a}function h(){var a=p.shift();q=1,a?a.t?m(function(){("c"==a.t?B.injectCss:B.injectJs)(a.s,0,a.a,a.x,a.e,1)},0):(a(),h()):q=0}function i(a,c,d,e,f,i,j){function k(b){if(!o&&g(l.readyState)&&(u.r=o=1,!q&&h(),l.onload=l.onreadystatechange=null,b)){"img"!=a&&m(function(){t.removeChild(l)},50);for(var d in y[c])y[c].hasOwnProperty(d)&&y[c][d].onload()}}var j=j||B.errorTimeout,l=b.createElement(a),o=0,r=0,u={t:d,s:c,e:f,a:i,x:j};1===y[c]&&(r=1,y[c]=[]),"object"==a?l.data=c:(l.src=c,l.type=a),l.width=l.height="0",l.onerror=l.onload=l.onreadystatechange=function(){k.call(this,r)},p.splice(e,0,u),"img"!=a&&(r||2===y[c]?(t.insertBefore(l,s?null:n),m(k,j)):y[c].push(l))}function j(a,b,c,d,f){return q=0,b=b||"j",e(a)?i("c"==b?v:u,a,b,this.i++,c,d,f):(p.splice(this.i++,0,a),1==p.length&&h()),this}function k(){var a=B;return a.loader={load:j,i:0},a}var l=b.documentElement,m=a.setTimeout,n=b.getElementsByTagName("script")[0],o={}.toString,p=[],q=0,r="MozAppearance"in l.style,s=r&&!!b.createRange().compareNode,t=s?l:n.parentNode,l=a.opera&&"[object Opera]"==o.call(a.opera),l=!!b.attachEvent&&!l,u=r?"object":l?"script":"img",v=l?"script":u,w=Array.isArray||function(a){return"[object Array]"==o.call(a)},x=[],y={},z={timeout:function(a,b){return b.length&&(a.timeout=b[0]),a}},A,B;B=function(a){function b(a){var a=a.split("!"),b=x.length,c=a.pop(),d=a.length,c={url:c,origUrl:c,prefixes:a},e,f,g;for(f=0;f<d;f++)g=a[f].split("="),(e=z[g.shift()])&&(c=e(c,g));for(f=0;f<b;f++)c=x[f](c);return c}function g(a,e,f,g,h){var i=b(a),j=i.autoCallback;i.url.split(".").pop().split("?").shift(),i.bypass||(e&&(e=d(e)?e:e[a]||e[g]||e[a.split("/").pop().split("?")[0]]),i.instead?i.instead(a,e,f,g,h):(y[i.url]?i.noexec=!0:y[i.url]=1,f.load(i.url,i.forceCSS||!i.forceJS&&"css"==i.url.split(".").pop().split("?").shift()?"c":c,i.noexec,i.attrs,i.timeout),(d(e)||d(j))&&f.load(function(){k(),e&&e(i.origUrl,h,g),j&&j(i.origUrl,h,g),y[i.url]=2})))}function h(a,b){function c(a,c){if(a){if(e(a))c||(j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}),g(a,j,b,0,h);else if(Object(a)===a)for(n in m=function(){var b=0,c;for(c in a)a.hasOwnProperty(c)&&b++;return b}(),a)a.hasOwnProperty(n)&&(!c&&!--m&&(d(j)?j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}:j[n]=function(a){return function(){var b=[].slice.call(arguments);a&&a.apply(this,b),l()}}(k[n])),g(a[n],j,b,n,h))}else!c&&l()}var h=!!a.test,i=a.load||a.both,j=a.callback||f,k=j,l=a.complete||f,m,n;c(h?a.yep:a.nope,!!i),i&&c(i)}var i,j,l=this.yepnope.loader;if(e(a))g(a,0,l,0);else if(w(a))for(i=0;i (function(w,d,s,l,i){w[l]=w[l]||[];w[l].push({'gtm.start':new Date().getTime(),event:'gtm.js'});var f=d.getElementsByTagName(s)[0];var j=d.createElement(s);var dl=l!='dataLayer'?'&l='+l:'';j.src='//www.googletagmanager.com/gtm.js?id='+i+dl;j.type='text/javascript';j.async=true;f.parentNode.insertBefore(j,f);})(window,document,'script','dataLayer','GTM-P4HH5NV'); Skip to main content Home About Submit ALERTS / RSS Search for this keyword Advanced Search Radiomics-Based Lung Nodule Classification with Stochastic Search Variable Selection and Bayesian Logistic Regression View ORCID Profile Isaac Lam doi: https://doi.org/10.1101/2025.04.29.25326704 Isaac Lam 1 ISyE, Georgia Institute of Technology Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Isaac Lam For correspondence: ilam7{at}gatech.edu Abstract Full Text Info/History Metrics Data/Code Preview PDF Abstract Background Radiomics is an emerging field in medical science that involves extracting quantitative features from medical images using data characterization algorithms. These features, known as radiomic features, provide a quantitative approach to medical image analysis. In the context of lung cancer, radiomics-based approaches are transforming disease management by improving early detection, diagnosis, prognosis, and treatment decision-making. Objective This study aimed to explore the utility of Bayesian methods, specifically Stochastic Variable Selection and Shrinkage (SVSS) and Bayesian logistic regression, in the radiomics-based classification of small lung nodules with limited training data. Methods The Bayesian approach was compared to frequentist Lasso logistic regression on the test set. The performance of both methods was evaluated to determine their viability in the classification of small lung nodules. Results The Bayesian approach matched the performance of frequentist Lasso logistic regression on the test set, demonstrating its viability as an alternative approach. Annulus GLCM Entrop LLL was consistently identified as a feature positively influencing small lung nodule malignancy prediction across multiple models. This finding enhances confidence in the effect of this feature, suggesting that future Bayesian analyses can incorporate this information for greater reliability in feature selection and coefficient estimates. Conclusion This study highlights the potential of Bayesian methods to address the challenges of limited data in medical image analysis, offering a robust alternative to traditional statistical approaches and contributing to improved clinical decision-making. Introduction Radiomics is an emerging field in medical science that involves extracting a large number of quantitative features from medical images using data characterization algorithms. These features, known as radiomic features, contain textural information such as spatial distribution of signal intensities and pixel interre-lationships that can provide a quantitative approach to medical image analysis [ 8 ]. In lung cancer research, radiomics-based methods are revolutionizing disease management by enhancing early detection, diagnosis, prognosis, and treatment decision-making. A critical clinical metric for evaluating cancer risk is the presence of lung nodules, with the size of these nodules being a significant factor [ 4 ]. The diameter of a nodule is measured to categorize it as either small or large. The radiomics-based approach has emerged as a cutting-edge method for enhancing lung cancer risk prediction. Extracting radiomic features from medical images and analyzing them with machine learning (ML) models offers a non-invasive non-invasive complement to CT scans for classifying of lung nodules. This approach has important implications for clinical decision making, as it can enhance diagnostic and predictive accuracy, particularly for indeterminate nodules [ 6 ]. Given that radiomic features can be represented in high-dimensional datasets containing hundreds or thousands of features, previous research have employed feature selection methods such as Lasso regression [ 2 ], random forest feature ranking [ 6 ], and principal component analysis for dimensionality reduction [ 3 ]. Others have selected specific features based on the morphological characteristics they represent [ 5 ]. However, to my best knowledge, stochastic search variable selection (SSVS) has yet to be implemented in this context. Medical image analysis often faces the challenge of limited data availability. This scarcity can be attributed to the rarity of certain medical conditions and the high cost of imaging procedures. Traditional statistical methods struggle with small sample sizes, leading to unstable and unreliable estimates. In contrast, Bayesian methods, such as Bayesian logistic regression and Stochastic Variable Selection and Shrinkage (SVSS), offer a robust solution by incorporating prior information into the model. This integration stabilizes estimates and enhances model performance, making Bayesian approaches particularly valuable in medical image classification tasks [ 7 ]. Additionally, these Bayesian methods improve interpretability by providing a range of probability estimates for each parameter, which offer a more nuanced understanding of the model’s predictions. The objective of this study is to integrate SSVS and bayesian logistic regression into radiomics-based classification of small lung nodules. By leveraging the strengths of Bayesian methods, this study aims to enhance the accuracy and reliability of lung nodule classification, ultimately contributing to improved clinical decision-making and patient outcomes. Data Source The dataset utilized in this study is publicly accessible and was initially collected and annotated by Hunter et al. [ 2 ]. The original dataset consists of CT images of lung nodules, which were processed to extract radiomic features using TexLab2.0. The final dataset comprises 736 images, each containing 1998 radiomic features that quantitatively describe the shape, texture, and intensity of the nodules. More details regarding the data collection, annotation procedures, and radiomic feature extraction can be found in the paper by Hunter et al. [ 2 ]. Methodology The methodology employed in this study is adapted from Hunter et al. [ 2 ]. To evaluate the effectiveness of SVSS and bayesian logistic regression on limited data, 50 images were utilized for training while the remaining 686 were set aside for testing. All 1998 radiomic features underwent Z-score normalization, defined as . To mitigate computational demands, an initial layer of feature selection was performed using univariate frequentist logistic regression to identify significant features. Features were deemed significant if they did not exceed the adjusted critical value after false discovery rate (FDR) correction, utilizing the Benjamini-Hochberg procedure with an FDR set to 0.1. This process identified 316 significant features. Subsequently, Stochastic Variational Subset Selection (SVSS) was applied to the remaining dataset to select the final model features. The top three features with the greatest posterior probabilities from SVSS were selected. Bayesian logistic regression models were developed to predict malignancy using radiomic features selected by SVSS. Four distinct Bayesian logistic regression models were constructed, each differing by the precision parameter τ for the normal priors applied to the coefficients and intercept. The specific τ values used were 0.01, 0.1, 1, and 10. Pareto-smoothed importance sampling leave-one-out cross-validation (PSIS-LOO-CV) was employed to determine the most suitable model. The performance of the optimal bayseian logistic regression model was compared against a baseline frequentist Lasso logistic regression model, which was constructed using the significant features identified from the univariate logistic regressions. The regularization hyperparameter C for the Lasso model was tuned in a five fold cross-validation loop, optimizing for the area under receiver operating characteristic curve (AUROC). Model Evaluation Receiver Operating Characteristic (ROC) curves were employed to evaluate the performance of both models. AUROC was utilized as the primary metric for assessment. To estimate the 95% confidence intervals for the AUROC, resampling was conducted using 1000 bootstrap iterations. Threshold-based performance metrics, including accuracy, precision, recall, and F1-Scores, were calculated based on the ROC cutoff that maximized the Youden index on the training set. The Youden index, which provides equal weight to both sensitivity and specificity, was selected as a balanced metric for this purpose. Stochastic Search Variable Selection (SSVS) SSVS aims to identify which predictors should be included in the model. It does this by introducing binary indicators for each predictor, which determine whether a predictor is included or excluded from the model at each sampling iteration in a Markov Chain Monte Carlo (MCMC) simulation. To perform variable selection, a binary indicator δ k was introduced for each radiomic feature x k . The indicator δ k follows a Bernoulli distribution with a probability of 0.0015: The prior distribution for the coefficients α k was defined as: The actual coefficient β k was then determined by the product of δ k and α k : The intercept β 0 was assigned a normal prior distribution: The linear predictor η i was defined as: where p is the number of predictors, and i represents the i th data point. The probability of the binary outcome y i = 1 was modeled using the sigmoid function: The likelihood of the observed data y was specified as a Bernoulli distribution: τ α and τ 0 were set to 1 because smaller values of the precision parameter resulted in divergences during sampling. MCMC methods from the pymc python module were used to sample from the posterior distribution of the parameters. The python scripts for model development are available at: https://github.com/isaaclhk/Projects/tree/main/lungnoduleSVSS . Results Nodule Classification Statistics Among the 736 samples in the dataset, 377 nodules (51.2%) were classified as malignant, while 356 nodules (48.8%) were identified as benign. In the training set, 26 nodules (52%) were malignant and 24 nodules (48%) were benign. The test set comprised 686 samples, with a similar distribution of 351 malignant nodules (51.2%) and 335 benign nodules (48.8%). For more detailed information on patient and nodule characteristics, refer to the study by Hunter et al. [ 2 ]. Convergence Statistics A total of 4 chains of 11000 draws were simulated for SVSS, discarding the first 1000 as burn-in. values were 1.0 for all binary indicators δ k . The bulk and tail effective sample size (ESS) for all δ exceeded 3000, indicating adequate sampling (Table S1). For each Bayesian logistic regression model, I simulated 4 chains with 6,000 draws each, also discarding the first 1,000 as burn-in. The best performing model had bulk and tail ESS values exceeding 10,000 for all coefficients, with values of 1.0 (see Table S2). Trace plots are provided in Figure S1 in the supplementary materials. SVSS The top three features selected by SVSS and the posterior means of their corresponding indicator parameters δ k are reported in Table 1 . View this table: View inline View popup Download powerpoint Table 1: Corresponding posterior mean of the indicator parameter δ k for each selected feature Bayesian Logistic Regression Model The model with prior precision parameter τ = 1 was identified as the optimal model, achieving the greatest Expected log pointwise predictive density for leave-one-out cross-validation (elpd_loo) value of -26.89. Additionally, this model demonstrated an effective number of parameters (p_loo) of approximately 2 (Table S3). The posterior distributions of the model coefficients and their highest density intervals (HDIs) are summarized in Table 2 . β 1 has a mean of 0.791(95% HDI: -0.324 to 1.859), indicating that it is positively associated with malignancy prediction. In contrast, β 2 and β 3 have means of -0.592(95% HDI: -2.174 to 0.941) and -0.611(95% HDI: -2.165 to 0.951), respectively, suggesting negative influence. View this table: View inline View popup Download powerpoint Table 2: Coefficients of Bayesian Logistic Regression model with τ = 1 Baseline Lasso Logistic Regression Model An optimal value for the regularization parameter was determined to be C = 0.184. The Lasso method identified 8 features, with their corresponding coefficients detailed in Table 3 . Notably, two of the three features selected by SVSS —Annulus_GLRLM_SRLGLE_LLL and Annulus_GLCM_Entropy_LLL— were also chosen by Lasso. However, the third feature, Annulus_GLRLM_LGLRE_LLL, was not selected by Lasso. Similar to Bayesian logistic regression, the Lasso coefficients suggest that Annulus_GLRLM_SRLGLE_LLL has a negative effect on malignancy prediction. Additionally, Annulus_GLCM_Entropy_LLL was predicted by Lasso to increase the risk of malignancy. View this table: View inline View popup Download powerpoint Table 3: Selected features and their coefficients from Lasso logistic regression Model Evaluation The selected Bayesian logistic regression model achieved an AUROC score of 0.832 (95% CI: 0.704 to 0.933) on the training set and 0.795 (95% CI: 0.759 to 0.829) on the test set ( Figure 1 ). Additionally, the accuracy score was 0.738 (95% CI: 0.620 to 0.860) on the training set and 0.722 (95% CI: 0.688 to 0.755) on the test set. Download figure Open in new tab Figure 1. AUC-ROC plot of the Bayesian and Lasso logistic models on the (a) training set, (b) test set In comparison, the Lasso logistic regression model achieved an AUROC score of 0.868 (95% CI: 0.741 to 0.958) on the training set and 0.793 (95% CI: 0.757 to 0.827) on the test set ( Figure 1 ). The accuracy score for the Lasso model was 0.781 (95% CI: 0.660 to 0.900) on the training set and 0.728 (95% CI: 0.694 to 0.762) on the test set. The Precision, Recall and F1-Scores of both models are summarized in Table 4 . View this table: View inline View popup Download powerpoint Table 4: Precision, Recall, and F1-Scores of the Bayesian and Logistic regression models Discussion This study demonstrates that SVSS, in conjunction with bayesian logistic regression, is a viable approach to radiomic-based small lung nodule classification. Generally, the performance of this approach on the that from the baseline Lasso logistic regression model, but the performance on the test set is similar ( Figure 1 and Table 4 ). The Bayesian approach excels in its ability to integrate prior information into the model via priors. For instance, the small p assigned to the Bernoulli prior in the SVSS model suggests that most features are irrelevant and should be excluded. The mildly informative priors used in this study reflect the uncertainty in feature selection during SVSS and the strength of coefficients in Bayesian logistic regression. In the SVSS model, reducing τ below 1 led to divergences during sampling, which is expected given the small sample size used for training, necessitating the specification of informative priors [ 7 ]. Although previous research [ 2 ] provided prior knowledge on promising candidate features, equal weight was assigned to all features to investigate whether SVSS would select different ones. Indeed, out of the three features selected by SVSS, only Annulus GLCM Entrop LLL was common with the set of features selected by Hunter et al. [ 2 ]. This feature was consistently identified across all experiments and has generally been shown to increase malignancy prediction. Thus, future analyses using the bayesian approach should place greater emphasis on this feature to express confidence in it’s effect. Another benefit of the Bayesian approach is it’s ability to quantify uncertainty in parameter estimates. Unlike traditional frequentist approaches, such as Lasso logistic regression, which typically provide point estimates and confidence intervals, Bayesian methods generate posterior distributions for each parameter. These parameter estimates represent the range of plausible values for the parameters, given prior information combined with the likelihood of observed data. This capability can offer valuable insights in the context of medical research, where decisions often need to be made under conditions of uncertainty. The HDI of the coefficients estimated from the bayesian logistic regression model was relatively large ( Table 2 ). As more knowledge is acquired and increasingly informative priors are utilized for prediction, the coefficient estimates will improve. The utility of Bayesian methods is particularly pronounced in settings with limited data. Traditional statistical methods often face challenges with small sample sizes, resulting in unstable and unreliable estimates. For instance, the univariate logistic regression models used in the initial layer of feature selection encounter convergence issues when the training sample size drops below 50. In contrast, Bayesian approaches effectively address this issue by integrating prior information, which stabilizes the estimates and improves model performance [ 7 ]. This characteristic makes Bayesian methods a powerful tool for radiomic analysis, where obtaining large datasets can be challenging due to the rarity of certain conditions or the high cost of imaging. Consequently, the Bayesian approach provides reliable and interpretable results in medical image classification tasks, such as the classification of radiomic-based small lung nodules. Despite the advantages of incorporating prior information and improved interpretability, SVSS and Bayesian logistic regression can be computationally expensive, and scaling these methods to large datasets may present challenges. Furthermore, these methods are sensitive to the choice of priors, and poorly chosen priors can lead to biased or misleading conclusions. Therefore, careful consideration and tuning of priors are essential to ensure robust and accurate model performance. Additionally, leveraging advanced computational techniques, such as parallel processing and efficient sampling algorithms [ 1 ], can help mitigate the computational challenges and enhance scalability. Conclusion This study aimed to explore the utility of Bayesian methods, specifically Stochastic Variable Selection and Shrinkage (SVSS) and Bayesian logistic regression, in radiomics-based classification of small lung nodules with limited training data. Although these methods could not be evaluated on a sample size smaller than 50 due to convergence issues in the univariate logistic regressions during the initial layer of feature selection, the Bayesian approach successfully matched the performance of frequentist Lasso logistic regression on the test set. This demonstrates its viability as an alternative approach. Annulus_GLCM_Entrop_LLL was identified as a feature that consistently exerts a positive influence on small lung nodule malignancy prediction across various models. This finding enhances our confidence in the effect of this feature, suggesting that future Bayesian analyses can incorporate this information to achieve greater reliability in feature selection and coefficient estimates. In conclusion, this study highlights the potential of Bayesian methods to address the challenges of limited data in medical image analysis. By leveraging prior information, these methods can stabilize estimates and improve model performance, offering a robust alternative to traditional statistical approaches. Future research should focus on further refining these Bayesian techniques and exploring their application in other high-dimensional radiomic datasets to enhance their utility and effectiveness in clinical decision-making. Data Availability The radiomics data utilized in this study is publicly accessible in the Mendeley database under the accession code 10.17632/rxn95mp24d.1. Additionally, the python scripts for model development are available at: https://github.com/isaaclhk/Projects/tree/main/lung_nodule_SVSS https://data.mendeley.com/datasets/rxn95mp24d/1 https://github.com/isaaclhk/Projects/tree/main/lung_nodule_SVSS Supplementary Materials View this table: View inline View popup Download powerpoint Table S1: SVSS diagnostic statistics View this table: View inline View popup Download powerpoint Table S2: Bayesian logistic regression diagnostic statistics View this table: View inline View popup Download powerpoint Table S3: Comparison of Bayesian Logistic Regression Models with varying prior parameters τ Download figure Open in new tab Figure S1: Bayesian Logistic Regression trace plots with τ =0.01 (a), 0.1 (b), 1 (c) and 10 (d) Footnotes The abstract was updated from an unstructured format to a structured format. References [1]. ↵ Oriol Abril-Pla , Virgile Andreani , Colin Carroll , Larry Dong , Christopher J Fonnesbeck , Maxim Kochurov , Ravin Kumar , Junpeng Lao , Christian C Luhmann , Osvaldo A Martin , et al. Pymc: a modern, and comprehensive probabilistic programming framework in python . PeerJ Computer Science , 9 : e1516 , 2023 . OpenUrl CrossRef [2]. ↵ Benjamin Hunter , Christos Argyros , Marianna Inglese , Kristofer Linton-Reid , Ilaria Pulzato , Andrew G Nicholson , Samuel V Kemp , Pallav L. Shah , Philip L Molyneaux , Cillian McNamara , et al. Radiomics-based decision support tool assists radiologists in small lung nodule classification and improves lung cancer early diagnosis . British Journal of Cancer , 129 ( 12 ): 1949 – 1955 , 2023 . OpenUrl PubMed [3]. ↵ Isaac Lam , Shao Ming Koh , and Mai Nguyen Thanh . Radiomics-based lung nodule classification with stacking ensembles . medRxiv , 2025 . [4]. ↵ Anna Rita Larici , Alessandra Farchione , Paola Franchi , Mario Ciliberto , Giuseppe Cicchetti , Lucio Calandriello , Annemilia Del Ciello , and Lorenzo Bonomo . Lung nodules: size still matters . European respiratory review , 26 ( 146 ), 2017 . [5]. ↵ Jiaying Liu , Anna Corti , Valentina DA Corino , and Luca Mainardi . Lung nodule classification using radiomics model trained on degraded sdct images . Computer Methods and Programs in Biomedicine , 257 : 108474 , 2024 . OpenUrl PubMed [6]. ↵ Minmini Selvam , Anupama Chandrasekharan , Abjasree Sadanandan , Vikas Kumar Anand , Arunan Murali , and Ganapathy Krishnamurthi . Radiomics as a non-invasive adjunct to chest ct in distin-guishing benign and malignant lung nodules . Scientific Reports , 13 ( 1 ): 19062 , 2023 . OpenUrl PubMed [7]. ↵ Sanne C Smid and Yves Rosseel . Sem with small samples: Two-step modeling and factor score regression versus bayesian estimation with informative priors . In Small sample size solutions , pages 239 – 254 . Routledge, 2020 . [8]. ↵ Janita E Van Timmeren , Davide Cester , Stephanie Tanadini-Lang , Hatem Alkadhi , and Bettina Baessler . Radiomics in medical imaging—”how-to” guide and critical reflection . Insights into imaging , 11 ( 1 ): 91 , 2020 . OpenUrl PubMed View the discussion thread. Back to top Previous Next Posted May 05, 2025. Download PDF Data/Code Email Thank you for your interest in spreading the word about medRxiv. NOTE: Your email address is requested solely to identify you as the sender of this article. Your Email * Your Name * Send To * Enter multiple addresses on separate lines or separate them with commas. You are going to email the following Radiomics-Based Lung Nodule Classification with Stochastic Search Variable Selection and Bayesian Logistic Regression Message Subject (Your Name) has forwarded a page to you from medRxiv Message Body (Your Name) thought you would like to see this page from the medRxiv website. Your Personal Message CAPTCHA This question is for testing whether or not you are a human visitor and to prevent automated spam submissions. Share Radiomics-Based Lung Nodule Classification with Stochastic Search Variable Selection and Bayesian Logistic Regression Isaac Lam medRxiv 2025.04.29.25326704; doi: https://doi.org/10.1101/2025.04.29.25326704 Share This Article: Copy Citation Tools Radiomics-Based Lung Nodule Classification with Stochastic Search Variable Selection and Bayesian Logistic Regression Isaac Lam medRxiv 2025.04.29.25326704; doi: https://doi.org/10.1101/2025.04.29.25326704 Citation Manager Formats BibTeX Bookends EasyBib EndNote (tagged) EndNote 8 (xml) Medlars Mendeley Papers RefWorks Tagged Ref Manager RIS Zotero Tweet Widget Facebook Like Google Plus One Subject Area Oncology Subject Areas All Articles Addiction Medicine (570) Allergy and Immunology (863) Anesthesia (301) Cardiovascular Medicine (4442) Dentistry and Oral Medicine (444) Dermatology (383) Emergency Medicine (609) Endocrinology (including Diabetes Mellitus and Metabolic Disease) (1511) Epidemiology (15231) Forensic Medicine (30) Gastroenterology (1126) Genetic and Genomic Medicine (6610) Geriatric Medicine (668) Health Economics (998) Health Informatics (4542) Health Policy (1370) Health Systems and Quality Improvement (1613) Hematology (543) HIV/AIDS (1266) Infectious Diseases (except HIV/AIDS) (15924) Intensive Care and Critical Care Medicine (1103) Medical Education (623) Medical Ethics (147) Nephrology (668) Neurology (6608) Nursing (346) Nutrition (999) Obstetrics and Gynecology (1146) Occupational and Environmental Health (957) Oncology (3338) Ophthalmology (974) Orthopedics (369) Otolaryngology (420) Pain Medicine (436) Palliative Medicine (130) Pathology (665) Pediatrics (1693) Pharmacology and Therapeutics (692) Primary Care Research (712) Psychiatry and Clinical Psychology (5449) Public and Global Health (9240) Radiology and Imaging (2203) Rehabilitation Medicine and Physical Therapy (1370) Respiratory Medicine (1196) Rheumatology (596) Sexual and Reproductive Health (714) Sports Medicine (530) Surgery (712) Toxicology (99) Transplantation (289) Urology (265) (function(){function c(){var b=a.contentDocument||a.contentWindow.document;if(b){var d=b.createElement('script');d.innerHTML="window.__CF$cv$params={r:'a0207f54a8d458d3',t:'MTc3OTgzNzQ4OQ=='};var a=document.createElement('script');a.src='/cdn-cgi/challenge-platform/scripts/jsd/main.js';document.getElementsByTagName('head')[0].appendChild(a);";b.getElementsByTagName('head')[0].appendChild(d)}}if(document.body){var a=document.createElement('iframe');a.height=1;a.width=1;a.style.position='absolute';a.style.top=0;a.style.left=0;a.style.border='none';a.style.visibility='hidden';document.body.appendChild(a);if('loading'!==document.readyState)c();else if(window.addEventListener)document.addEventListener('DOMContentLoaded',c);else{var e=document.onreadystatechange||function(){};document.onreadystatechange=function(b){e(b);'loading'!==document.readyState&&(document.onreadystatechange=e,c())}}}})();
Text is read by the "Ask this paper" AI Q&A widget below.
Extraction quality varies by source — PMC NXML preserves structure
cleanly, OA-HTML may include some navigation residue, and OA-PDF can
have broken hyphenation. The publisher copy
(via DOI)
is the canonical version.