Full text
52,366 characters
· extracted from
preprint-html
· click to expand
Extracting Carotid Stenosis Severity from Clinical Notes Using Natural Language Processing: Development, Validation, and Application in a Nationwide Veteran Cohort | medRxiv /* */ /* */ <!-- <!-- /*! * yepnope1.5.4 * (c) WTFPL, GPLv2 */ (function(a,b,c){function d(a){return"[object Function]"==o.call(a)}function e(a){return"string"==typeof a}function f(){}function g(a){return!a||"loaded"==a||"complete"==a||"uninitialized"==a}function h(){var a=p.shift();q=1,a?a.t?m(function(){("c"==a.t?B.injectCss:B.injectJs)(a.s,0,a.a,a.x,a.e,1)},0):(a(),h()):q=0}function i(a,c,d,e,f,i,j){function k(b){if(!o&&g(l.readyState)&&(u.r=o=1,!q&&h(),l.onload=l.onreadystatechange=null,b)){"img"!=a&&m(function(){t.removeChild(l)},50);for(var d in y[c])y[c].hasOwnProperty(d)&&y[c][d].onload()}}var j=j||B.errorTimeout,l=b.createElement(a),o=0,r=0,u={t:d,s:c,e:f,a:i,x:j};1===y[c]&&(r=1,y[c]=[]),"object"==a?l.data=c:(l.src=c,l.type=a),l.width=l.height="0",l.onerror=l.onload=l.onreadystatechange=function(){k.call(this,r)},p.splice(e,0,u),"img"!=a&&(r||2===y[c]?(t.insertBefore(l,s?null:n),m(k,j)):y[c].push(l))}function j(a,b,c,d,f){return q=0,b=b||"j",e(a)?i("c"==b?v:u,a,b,this.i++,c,d,f):(p.splice(this.i++,0,a),1==p.length&&h()),this}function k(){var a=B;return a.loader={load:j,i:0},a}var l=b.documentElement,m=a.setTimeout,n=b.getElementsByTagName("script")[0],o={}.toString,p=[],q=0,r="MozAppearance"in l.style,s=r&&!!b.createRange().compareNode,t=s?l:n.parentNode,l=a.opera&&"[object Opera]"==o.call(a.opera),l=!!b.attachEvent&&!l,u=r?"object":l?"script":"img",v=l?"script":u,w=Array.isArray||function(a){return"[object Array]"==o.call(a)},x=[],y={},z={timeout:function(a,b){return b.length&&(a.timeout=b[0]),a}},A,B;B=function(a){function b(a){var a=a.split("!"),b=x.length,c=a.pop(),d=a.length,c={url:c,origUrl:c,prefixes:a},e,f,g;for(f=0;f<d;f++)g=a[f].split("="),(e=z[g.shift()])&&(c=e(c,g));for(f=0;f<b;f++)c=x[f](c);return c}function g(a,e,f,g,h){var i=b(a),j=i.autoCallback;i.url.split(".").pop().split("?").shift(),i.bypass||(e&&(e=d(e)?e:e[a]||e[g]||e[a.split("/").pop().split("?")[0]]),i.instead?i.instead(a,e,f,g,h):(y[i.url]?i.noexec=!0:y[i.url]=1,f.load(i.url,i.forceCSS||!i.forceJS&&"css"==i.url.split(".").pop().split("?").shift()?"c":c,i.noexec,i.attrs,i.timeout),(d(e)||d(j))&&f.load(function(){k(),e&&e(i.origUrl,h,g),j&&j(i.origUrl,h,g),y[i.url]=2})))}function h(a,b){function c(a,c){if(a){if(e(a))c||(j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}),g(a,j,b,0,h);else if(Object(a)===a)for(n in m=function(){var b=0,c;for(c in a)a.hasOwnProperty(c)&&b++;return b}(),a)a.hasOwnProperty(n)&&(!c&&!--m&&(d(j)?j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}:j[n]=function(a){return function(){var b=[].slice.call(arguments);a&&a.apply(this,b),l()}}(k[n])),g(a[n],j,b,n,h))}else!c&&l()}var h=!!a.test,i=a.load||a.both,j=a.callback||f,k=j,l=a.complete||f,m,n;c(h?a.yep:a.nope,!!i),i&&c(i)}var i,j,l=this.yepnope.loader;if(e(a))g(a,0,l,0);else if(w(a))for(i=0;i (function(w,d,s,l,i){w[l]=w[l]||[];w[l].push({'gtm.start':new Date().getTime(),event:'gtm.js'});var f=d.getElementsByTagName(s)[0];var j=d.createElement(s);var dl=l!='dataLayer'?'&l='+l:'';j.src='//www.googletagmanager.com/gtm.js?id='+i+dl;j.type='text/javascript';j.async=true;f.parentNode.insertBefore(j,f);})(window,document,'script','dataLayer','GTM-P4HH5NV'); Skip to main content Home About Submit ALERTS / RSS Search for this keyword Advanced Search Extracting Carotid Stenosis Severity from Clinical Notes Using Natural Language Processing: Development, Validation, and Application in a Nationwide Veteran Cohort Kyung Min Lee , Patrick R. Alba , Gina M. Biagetti , Anthony Gao , Ming Yin , Peter N. Danilov , Tia DiNatale , Cristina Perez , Katherine Hartmann , Gabrielle E. Shakt , Renae L. Judy , Tiffany R. Bellomo , Kathryn M. Pridgen , Philip S. Tsao , Naveen Balasundaram , View ORCID Profile Michael G. Levin , View ORCID Profile Scott M. Damrauer , View ORCID Profile Julie A. Lynch doi: https://doi.org/10.1101/2025.05.16.25327773 Kyung Min Lee 1 VA Informatics and Computing Infrastructure (VINCI), VA Salt Lake City Health Care System , Salt Lake City, UT, USA PhD, MPH Find this author on Google Scholar Find this author on PubMed Search for this author on this site Patrick R. Alba 1 VA Informatics and Computing Infrastructure (VINCI), VA Salt Lake City Health Care System , Salt Lake City, UT, USA 2 Division of Epidemiology, Department of Internal Medicine, University of Utah School of Medicine , Salt Lake City, UT, USA MS Find this author on Google Scholar Find this author on PubMed Search for this author on this site Gina M. Biagetti 3 Department of Surgery, Hospital of the University of Pennsylvania , Philadelphia, PA, USA MD Find this author on Google Scholar Find this author on PubMed Search for this author on this site Anthony Gao 1 VA Informatics and Computing Infrastructure (VINCI), VA Salt Lake City Health Care System , Salt Lake City, UT, USA BS Find this author on Google Scholar Find this author on PubMed Search for this author on this site Ming Yin 1 VA Informatics and Computing Infrastructure (VINCI), VA Salt Lake City Health Care System , Salt Lake City, UT, USA MS Find this author on Google Scholar Find this author on PubMed Search for this author on this site Peter N. Danilov 1 VA Informatics and Computing Infrastructure (VINCI), VA Salt Lake City Health Care System , Salt Lake City, UT, USA BA Find this author on Google Scholar Find this author on PubMed Search for this author on this site Tia DiNatale 1 VA Informatics and Computing Infrastructure (VINCI), VA Salt Lake City Health Care System , Salt Lake City, UT, USA MPH Find this author on Google Scholar Find this author on PubMed Search for this author on this site Cristina Perez 1 VA Informatics and Computing Infrastructure (VINCI), VA Salt Lake City Health Care System , Salt Lake City, UT, USA MS Find this author on Google Scholar Find this author on PubMed Search for this author on this site Katherine Hartmann 4 Department of Radiology, Hospital of the University of Pennsylvania , Philadelphia, PA, USA MD, PhD Find this author on Google Scholar Find this author on PubMed Search for this author on this site Gabrielle E. Shakt 5 Corporal Michael J. Crescenz VA Medical Center , Philadelphia, PA, USA 6 Department of Surgery, Perelman School of Medicine and the University of Pennsylvania , Philadelphia, PA, USA BS Find this author on Google Scholar Find this author on PubMed Search for this author on this site Renae L. Judy 5 Corporal Michael J. Crescenz VA Medical Center , Philadelphia, PA, USA 6 Department of Surgery, Perelman School of Medicine and the University of Pennsylvania , Philadelphia, PA, USA MS Find this author on Google Scholar Find this author on PubMed Search for this author on this site Tiffany R. Bellomo 7 Division of Vascular and Endovascular Surgery, Massachusetts General Hospital , Boston, MA, USA MD Find this author on Google Scholar Find this author on PubMed Search for this author on this site Kathryn M. Pridgen 1 VA Informatics and Computing Infrastructure (VINCI), VA Salt Lake City Health Care System , Salt Lake City, UT, USA MA Find this author on Google Scholar Find this author on PubMed Search for this author on this site Philip S. Tsao 8 Palo Alto Epidemiology Research and Information Center for Genomics , VA Palo Alto, CA, USA 9 Department of Medicine, Stanford University School of Medicine , Stanford, CA, USA PhD Find this author on Google Scholar Find this author on PubMed Search for this author on this site Naveen Balasundaram 5 Corporal Michael J. Crescenz VA Medical Center , Philadelphia, PA, USA 10 Department of Medicine, Perelman School of Medicine and the University of Pennsylvania , Philadelphia, PA, USA MD Find this author on Google Scholar Find this author on PubMed Search for this author on this site Michael G. Levin 5 Corporal Michael J. Crescenz VA Medical Center , Philadelphia, PA, USA 10 Department of Medicine, Perelman School of Medicine and the University of Pennsylvania , Philadelphia, PA, USA MD Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Michael G. Levin Scott M. Damrauer 5 Corporal Michael J. Crescenz VA Medical Center , Philadelphia, PA, USA 6 Department of Surgery, Perelman School of Medicine and the University of Pennsylvania , Philadelphia, PA, USA MD Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Scott M. Damrauer Julie A. Lynch 1 VA Informatics and Computing Infrastructure (VINCI), VA Salt Lake City Health Care System , Salt Lake City, UT, USA 2 Division of Epidemiology, Department of Internal Medicine, University of Utah School of Medicine , Salt Lake City, UT, USA PhD, RN, MBA Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Julie A. Lynch For correspondence: julie.lynch{at}va.gov Abstract Full Text Info/History Metrics Supplementary material Data/Code Preview PDF ABSTRACT Importance Carotid stenosis, which is atherosclerotic narrowing of the extracranial carotid arteries, is an important risk factor for ischemic stroke. The prevalence of asymptomatic carotid stenosis is generally low, with moderate and severe stenosis present in up to ~6% and ~2% of the population, respectively. Prior studies of carotid stenosis have been small, and risk factors for carotid stenosis severity have been incompletely described. We sought to leverage the rich electronic health record data within the Veterans Health Administration to assess the prevalence and risk factors for carotid stenosis at the population level. Objective Develop and validate a natural language processing (NLP) tool to extract the ratio of peak systolic velocity of the internal carotid artery to that of the common carotid artery (ICA/CCA ratio) from carotid duplex ultrasound reports. Identify significant risk factors, presence and severity of carotid stenosis. Design Retrospective cross-sectional analysis Setting Veterans Health Administration (VHA) from 2001 to 2020 Participants Veterans who underwent carotid artery duplex scans in the VHA from 2001 to 2020 and who had at least one valid ICA/CCA ratio. We excluded patients who had undergone carotid endarterectomy or stenting or who had a stroke or transient ischemic attack prior to the index date. Exposure(s) Carotid artery duplex scan and cardiovascular disease risk factors including age, sex, self-identified race and ethnicity, healthcare utilization, smoking status, body mass index (BMI), blood pressure, hypertension, coronary heart disease, type 2 diabetes, and selected laboratory measures (i.e., hemoglobin A1c, low-density lipoprotein cholesterol, high-density lipoprotein cholesterol, triglyceride, and creatinine). Main outcome A categorical variable indicating carotid stenosis severity (<50%, 50-69%, ≥70%) based on ICA/CCA ratio (<2, ≥2 to <4, ≥4). Results The harmonic F1 score of the NLP tool was 0.907 for right value, 0.882 for left value, and 0.920 for max value. Among the 290,517 Veterans in the cohort, the median age was 68.2 years (IQR 61.9–75.0). 277,934 (95.7%) were males and 28,348 (10%) were of self-reported Black race. Black patients had 16% decreased risk of more severe carotid stenosis (OR 0.84, 95% CI 0.81–0.87, p<0.001). Yet, sensitivity analysis showed that among those with hemodynamically significant carotid stenosis (≥70% vs. 50–69%), Black race was associated with a 33% increased risk of severe carotid stenosis compared to White race (OR 1.33, 95% CI 1.23-1.43, p<0.001). All patient-level risk factors except high-density lipoprotein cholesterol were significantly associated with carotid stenosis severity. Conclusion and relevance The NLP tool performed well, and the study performed with our NLP-created cohort largely validates the risk factors identified by previous smaller studies, speaking to the validity of our tool to create usable cohorts for future large-scale research. INTRODUCTION Carotid stenosis, which results from atherosclerotic plaque that causes a narrowing of the carotid artery, is a well-recognized risk factor for stroke, and the risk of stroke varies depending on the severity of stenosis. 1 – 3 Asymptomatic carotid stenosis occurs in the absence of stroke or transient ischemic attack (TIA) history. 4 The prevalence of asymptomatic carotid stenosis is generally low, with moderate and severe stenosis identified in up to ~6% and ~2% of the population, respectively. 5 Carotid stenosis is typically diagnosed via carotid duplex ultrasound, a noninvasive means of measuring vessel diameter, visualizing atherosclerotic plaque, and capturing secondary signs of stenosis including changes in blood flow velocity. Diagnosis and risk stratification of carotid stenosis is made primarily using measures of the peak systolic velocity (PSV) of the internal carotid artery (ICA) and the common carotid artery (CCA) as well as the ratio of the former to the latter (ICA/CCA PSV ratio). 6 , 7 Understanding carotid disease, particularly disease severity, is important because presence and severity of disease help guide intervention strategies. 8 Our current knowledge of asymptomatic carotid stenosis comes mainly from relatively small cohorts, 3 , 9 – 11 comprising only hundreds or thousands of participants. Using existing large datasets to create cohorts to study carotid stenosis severity has proved difficult because information about disease severity is generally included in patient notes and procedure reports as free text and not as structured data. As such, harnessing the power of natural language processing (NLP), which can be used to extract data from large electronic health records (EHR) datasets, may improve efficacy in epidemiologic research by making it easier to create larger, more diverse cohorts. 12 Advances in NLP have enabled large-scale studies of EHR data such as radiology reports to identify individuals with carotid stenosis. 13 – 16 In this study, we present the development and validation of an NLP tool to identify presence and severity of carotid stenosis within the Veteran’s Health Administration (VHA), the largest integrated healthcare system in the United States. This is the first NLP tool that extracts ICA/CCA ratio from carotid duplex ultrasound reports. Using the resulting cohort of Veterans, we performed the largest study of risk factors for asymptomatic carotid stenosis to date, demonstrating the utility of big data and NLP in carotid stenosis research. METHODS We conducted a cross-sectional analysis of Veterans who received care at the VHA from 2001 to 2020. This study was approved by the institutional review boards of the VA Salt Lake City Healthcare System and the Corporal Michael J. Crescenz VA Medical Center. Data sources Patient demographic and clinical data, including healthcare utilization, comorbidity, prescriptions, smoking status, body mass index (BMI), blood pressure, laboratory test results, and unstructured clinical notes containing reports of carotid artery ultrasounds were obtained from the Corporate Data Warehouse (CDW) of the VHA. The CDW is a national data repository that contains longitudinal clinical and administrative data for Veterans who received care at the VHA. Study sample We identified active users of the VA from 2001 to 2020 who underwent a carotid artery duplex scan of either one or both carotid arteries, identified by current procedural terminology codes 93880 and 93882. We restricted the analysis to patients who had at least one valid ICA/CCA ratio, defined as a patient’s same-day duplex measurement with laterality being only one of the following: 1 left, 1 right, 1 left 1 right, 1 bilateral. We then identified the first valid duplex result for each patient. The greatest value of the first valid duplex result for each patient is the value used in analysis. The index date represents the earliest date of all duplex scan results extracted by the NLP algorithm. We excluded patients who 1) had undergone carotid endarterectomy or stenting or 2) had a stroke or TIA prior to the index date. Development of NLP tool We used the java-based LEO framework 17 created by the VHA to develop and validate NLP tools that extracted and categorized duplex results based on whether these results were reported as quantitative, qualitative, or as the ICA/CCA ratio. The initial NLP system was designed to identify four key concepts from carotid duplex studies; anatomy (internal carotid artery, discerning other non-relevant anatomies such as external carotid artery), laterality (left, right or bilateral), degree of stenosis expressed in qualitative terms or percentages (no stenosis, mild, moderate, severe, occluded, 50% etc.), and presence of ICA/CCA ratios. Further development and validation of that NLP tool, which is reported here, focused on extracting ICA/CCA ratio results. The ICA/CCA ratio was extracted from the unstructured carotid artery duplex scan results using a rule-based NLP algorithm. All NLP code for the system can be found at the following git repository: https://github.com/VINCI-AppliedNLP/CarotidStenosis . Manual annotation Annotation was completed by two nurse annotators, with the training batches double annotated and adjudicated by the study team. For development of the initial NLP tool, there were 100 distinct carotid duplex studies reviewed by two independent reviewers, with any discrepancies being adjudicated by a third, resulting in a Cohens Kappa Inter-annotator agreement of 0.83. For the ICA/CCA ratio NLP tool, the annotation team documented the ICA/CCA ratios for the right and left carotid arteries from 300 carotid duplexes achieving an inter-annotator agreement with Cohen’s kappa greater than 0.85 across all batches annotated. NLP validation We assessed the performance of the NLP system using the following metrics: precision, recall (sensitivity), accuracy, and F-measure (F1 score) of the right value, the left value, and the maximum value found in a report. Performance was evaluated using the results of the 300 duplex scans that were manually annotated and held out from development. Ratios were rounded to the second decimal before being compared. For example, an annotated value 0.891 and an NLP extracted 0.89 would be counted as a true positive. Outcome The outcome variable was a categorical variable indicating carotid stenosis severity as defined by ICA/CCA PSV ratio according to the currently recommended criteria for carotid interpretation (<2: normal/4: ≥70% severe stenosis). 18 , 19 Less than 50% stenosis is non-hemodynamically significant. Risk factors The following patient-level risk factors were assessed at the index date (i.e., date of carotid duplex): age, sex, self-identified race and ethnicity, the total number of encounters (inpatient admissions or outpatient visits) in the prior two years, smoking status, BMI, systolic and diastolic blood pressures (SBP and DBP, respectively), indicator variables for pre-existing hypertension, coronary heart disease (CHD), and type 2 diabetes (T2D), and selected laboratory measures (i.e., hemoglobin A1c [HbA1c], low-density lipoprotein cholesterol [LDL-c], high-density lipoprotein cholesterol [HDL-c], triglyceride, and creatinine). We obtained the most recent laboratory measures in the five years preceding the index date to minimize missing values. LDL-c and triglyceride levels were adjusted for lipid lowering therapies including statins and ezetimibe. 20 We determined the receipt of prescriptions for selected drugs (statins, ezetimibe and other antilipemics, antiplatelets, anticoagulants, and acetylsalicylic acid; Table B1 ) in the 90 days prior to index date for descriptive analysis; however, we did not include them as risk factors in multivariable models due to the likely confounding by indication across the three categories of carotid stenosis severity. We included standardized BMI, blood pressures, and laboratory measures in all regression models to allow for comparisons of odds ratios of continuous variables with different units of measurement. We performed multiple imputation by predictive mean matching to impute missing BMI, blood pressures, and laboratory measures. 21 , 22 The “ Other” racial category included American Indian or Alaska Natives, Native Hawaiian or Other Pacific Islanders, and Asian individuals. Statistical analysis We performed Wilcoxon rank-sum tests for continuous variables and chi-squared tests for categorical variables to examine the differences in the included patient characteristics among carotid stenosis severity categories. We calculated bootstrap 95% confidence intervals of the differences in medians to compare the medians of continuous variables between two severity categories. We quantified the independent associations of patient-level risk factors on carotid stenosis severity by regressing carotid stenosis severity on each risk factor separately using ordinal logistic regression model. 23 , 24 We estimated a multivariable ordinal logistic regression model to determine the associations of the risk factors with carotid stenosis severity as a three-level categorical variable. Ordinal logistic regression, used to model outcomes with ordered categories, assumes that the odds ratios across all categories are the same; biased estimates may result when this proportional odds assumption is violated. 25 , 26 However, studies with large sample sizes such as the current analysis are less likely to violate the proportional odds assumption. 27 , 28 Therefore, we chose ordinal logistic regression to model the currently recommended carotid stenosis severity categories in this analysis. As a sensitivity analysis, we performed binary logistic regression analysis to make four pairwise comparisons of carotid stenosis severity categories: ≥50% vs. <50%, 50–69% vs. <50%, ≥70% vs. <50%, and ≥70% vs. 50–69%. By comparing ≥50% group (combination of 50–69% and ≥70% categories) with 2). We then quantified the associations of risk factors with the presence of hemodynamically significant stenosis of varying severity (moderate or severe) by comparing <50% category with 50–69% and ≥70% categories separately. Finally, we compared ≥70% category with 50-69% category to investigate the associations of patient-level risk factors with having more severe stenosis. We performed the Z-test to compare odds ratios across different comparisons. 29 We used SAS 9.4 to prepare the analytic dataset and R 4.4.1 to perform statistical tests and estimate regression models. All hypothesis tests were two-tailed with the significance level of 5%. RESULTS We identified 13,058,116 Veterans who were active recipients of healthcare in the VHA between 2001 and 2020. There were 1,340,075 patients with at least one carotid duplex from 2001-2020, which included 2,594,346 distinct procedures. There were 974,889 (72.7%) patients who had 2,335,802 (90.3%) procedures with relevant radiology or clinical notes available for processing by the NLP tools. Of those, 414,455 patients had a report that included a valid ICA/CCA ratio value with laterality documented as left, right, or bilateral. There were 560,434 patients excluded whose reports did not include a valid ICA/CCA ratio. The majority were excluded because the ratio was missing from the report. In some cases, the ratio or laterality was ambiguous or not documented. Among the 414,455 Veterans with ICA/CCA ratio results, 290,517 had no carotid endarterectomy or stent procedures, and no stroke or TIA prior to the index date ( Figure 1 ). Download figure Open in new tab Figure 1. Study sample derivation NLP performance Performance was evaluated against 300 held-out reports. Precision was >0.9 for all measurements (right value: 0.978; left value: 0.943; max value: 0.925), as was accuracy (right value: 0.940; left value: 0.927; max value: 0.943). Recall was 0.845 for right value, 0.828 for left value, and 0.916 for max value. F-measure was 0.907 for right value, 0.882 for left value, and 0.920 for max value. ( Table 1 ) See Appendix A for additional information. View this table: View inline View popup Download powerpoint Table 1. NLP validation results Patient characteristics Participants in the final study sample had a median age of 68.2 years (IQR 61.9–75.0). There were 277,934 (95.7%) men, 235,190 (81%) were of self-reported White race, and 28,348 (10%) were of self-reported Black race. The proportions of missing values for all imputed variables except HbA1c were less than 3% ( Table B2 ). The distributions of the imputed variables remained unchanged after imputation. Among the 290,517 Veterans with available duplex data and no symptoms of carotid disease 240,190 had ICA:CCA ratio <2, corresponding to a <50% stenosis, 38,971 had a ratio ≥2 and <4 corresponding to a 50% - 69% stenosis, and 11,356 had a ratio ≥4 corresponding to a ≥70% stenosis. Compared to those with <50% stenosis, patients with ≥70% stenosis were older (median difference 3.2 years, 95% CI 3.0–3.4) and more likely to have cardiovascular comorbidities (7%, 12%, and 3% higher rates of hypertension, CHD, and T2D, respectively; p<0.001). They were also more likely to be current smokers (28% vs. 23%, p<0.001), and had higher median levels of HbA1c (median difference 0.1%, 95% CI 0.1–0.1) and blood lipids except HDL-c (LDL-c: median difference 4.9 mg/dl, 95% CI 3.8–6.0; triglyceride: median difference 9.0 mg/dl, 95% CI 7.2–12.0; creatinine: median difference 0.1 mg/dl, 95% CI 0.1–0.1; Table 2 ). View this table: View inline View popup Table 2. Patient characteristics Associations of patient-level risk factors with severity of carotid stenosis All patient-level risk factors except HDL-c were significantly associated with carotid stenosis severity in a univariable analysis ( Table B3 ). Older age, comorbidities, higher laboratory measures (except HDL-c), SBP, and current or former smoking were associated with an increased risk for more severe carotid stenosis. The results of the multivariable ordinal logistic regression models are reported in Table 3 . Every 10-year increase in age conferred a 22% increase in the likelihood of more severe carotid stenosis (odds ratio [OR] 1.022, 95% confidence interval [CI] 1.020–1.023, p<0.001). Compared to White patients, Black patients and those in the Other racial category had 16% and 26% decreased risk of more severe carotid stenosis, respectively (OR 0.84, 95% CI 0.81–0.87, p<0.001 for Black; OR 0.74, 95% CI 0.68-0.80 for Other). Individuals with pre-existing hypertension or CHD had a 44% increased risk of more severe carotid stenosis (OR 1.44, 95% CI 1.38–1.51 for hypertension; OR 1.44, 95% CI 1.41–1.47, p<0.001 for CHD). Each one standard deviation increase in HbA1c, LDL-c, HDL-c, triglyceride, and creatinine levels was associated with a 1–5% increased risk of more severe carotid stenosis. Current smokers were 67% more likely to experience more severe carotid stenosis compared with never smokers (OR 1.67, 95% CI 1.62–1.74, p<0.001). View this table: View inline View popup Download powerpoint Table 3. Association of patient-level factors with carotid stenosis severity from a multivariable ordinal logistic regression model Our sensitivity analysis revealed that while the associations of patient-level risk factors remained practically unchanged when comparing patients with hemodynamically significant stenosis (≥50%) to those with non-hemodynamically significant stenosis (<50%), the associations of certain risk factors changed either in magnitude or in the direction of association in pairwise comparisons of carotid stenosis severity categories ( Table B4 ). Among those with hemodynamically significant carotid stenosis (≥70% vs. 50–69%), Black race was associated with a 33% increased risk of severe carotid stenosis compared to White race (OR 1.33, 95% CI 1.23-1.43, p<0.001)..Pre-existing hypertension and CHD conferred smaller increased risks of severe carotid stenosis among patients with hemodynamically significant stenosis (hypertension: OR 1.18, 95% CI 1.05–1.32, p=0.005 in ≥70% vs. 50–69%, OR 1.68, 95% CI 1.52–1.87, p<0.001 in ≥70% vs. <50%, Z-test p<0.001; CHD: OR 1.08, 95% CI 1.03–1.13, p=0.002 in ≥70% vs. 50–69%, OR 1.51, 95% CI 1.45–1.58, p<0.001 in ≥70% vs. <50%, Z-test p<0.001). In ≥70% vs. <50% comparison, current smokers had more than two-fold increase in the risk of severe carotid stenosis (OR 2.37, 95% CI 2.20–2.56, p<0.001), which is markedly higher than the risk of increase in the other two comparisons (OR 1.51, 95% CI 1.45–1.57, p<0.001 in 50–69% vs. <50%, Z-test p<0.001; OR 1.55, 95% CI 1.43–1.69, p<0.001 in ≥70% vs. 50–69%, Z-test p10-fold larger compared to previous studies. 13 – 16 We then performed ordinal logistic regression analysis within this cohort to examine the association of known patient-level risk factors for carotid stenosis with severity of carotid stenosis. The current study highlights the powerful potential of using NLP to mine data from emerging health record biobanks. This study leveraged EHR data to construct a cohort of patients screened for carotid stenosis using carotid duplex ultrasound and extract detailed phenotype data consisting of patients’ demographics, comorbidities, medication use, vitals, laboratory measures, and smoking status to facilitate the largest study to date of clinical risk factors for carotid stenosis. NLP algorithms have been used previously to extract documentation of a carotid stenosis diagnosis, however, to our knowledge this is the first study to extract more granular severity using ICA/CCA ratios. Further, the number of individuals in the current cohort is much larger compared to previous studies and may serve as a basis for further investigation in disease progression and outcomes. 13 – 16 There have been previous limited attempts to extract carotid stenosis information from the EHR using NLP. In 2016, Mowery et al created an NLP system to identify reports with finding of significant carotid stenosis from radiology reports; however, this algorithm did not differentiate between moderate and severe stenosis. 14 Our system builds up on this by now extracting quantitative measures of disease severity with high precision (right: 0.978; left: 0.943; max: 0.925) and accuracy (right: 0.940; left: 0.927; max: 0.943). A different NLP system created by Chang et al (2021) does stratify by severity and also specifies the laterality of each case. 16 This system identified normal carotid arteries with a precision of 0.98 and abnormal carotid arteries with a precision of 0.76, resulting in a cohort of over 15,000 patients and demonstrating the potential utility of NLP to create large cohorts. Our system, when applied to the VHA EHR, was able to generate a dataset approximately 20 times larger than that of Chang et al. An error analysis of the system performance when compared to the held-out data set revealed the most common errors emanating from random variation in the text format that was not accounted for in the training data. While values were accurately captured from many templates and semi-structured forms, these errors primarily resulted from ad hoc templates and document structures created within the note. The majority of false positives occurred due to clinical guidelines presented in the note being misinterpreted as test results. Despite this the overall false positive rate was low (2.2% to 7.6% depending on measure and laterality). Using our NLP extracted data we identified a cohort of 290,517 asymptomatic Veterans with carotid duplex measurements for analysis. We found that older age, pre-existing hypertension, CHD, and T2D, higher levels of HbA1c, LDL-c, HDL-c, triglyceride, creatinine, higher SBP, and smoking was associated with higher likelihood of experiencing severe carotid stenosis, largely validating the risk factors identified in previous, smaller studies. 10 , 11 , 30 , 31 The fact that the study done within our NLP-created cohort validates previous studies speaks to the legitimacy of our tool to create usable cohorts for large-scale research. Our findings indicated that the well-established risk factors for atherosclerotic cardiovascular disease (ASCVD) are also significant risk factors for not only the likelihood of having a carotid stenosis but also the likelihood of having a more severe carotid stenosis. The results of this study suggest that the general approaches to primary and secondary prevention of ASCVD should also be effective in preventing carotid stenosis across the disease severity spectrum. Except for age, sex, and race/ethnicity, many of the traditional atherosclerotic risk factors including dyslipidemia, hypertension, diabetes, and smoking are modifiable through lifestyle and behavioral changes. The largest odds ratios were seen with smoking, hypertension, and CHD, suggesting that management of these modifiable risk factors through established prevention strategies 32 may decrease severity of carotid stenosis. The associations of self-identified race and ethnicity with carotid stenosis severity suggests that individuals of non-White racial groups and Hispanic patients were less likely to experience severe carotid stenosis compared to White and non-Hispanic patients, respectively. The lower odds of having a hemodynamically significant carotid stenosis among Black patients and Hispanic patients compared to White patients and non-Hispanic patients, respectively, are consistent with previous studies that reported lower prevalence of carotid stenosis among Black patients and Hispanic patients. 33 – 36 However, results of the sensitivity analysis suggest that of those with hemodynamically significant stenosis (i.e., ≥50%), Black patients were more likely to present with severe rather than moderate stenosis compared to White patients. These seemingly paradoxical findings may be attributable to several reasons. First, index event bias is potentially present as Black patients may be less likely to receive carotid imaging. 37 Since the current study analyzed individuals who had received a clinical duplex scan, Black patients may have been disproportionately excluded from the study due to their lower likelihood of receiving a scan. 26 – 28 Additionally, the Black patients’ higher likelihood of experiencing a more severe carotid stenosis among a subset of patients with hemodynamically significant stenosis may be due to treatment disparity as Black patients may be less likely to undergo carotid endarterectomy 38 , 39 and more likely to experience delays in receiving treatment. 40 The weaker associations of age and comorbidities seen among those with hemodynamically significant stenosis in the sensitivity analysis are likely due to survivorship bias, as older patients are more likely to have died before developing severe carotid stenosis (≥70%). This study has other limitations as well. The VHA’s EHR data are subject to the limitations of any other large-scale EHR data including missing data, potential inconsistencies in coding practices across different medical centers and unreliability of self-reported race and ethnicity. We attempted to minimize the influence of missing data by implementing multiple imputation by predictive mean matching for continuous variables and including “ Unknown” categories for categorical variables. Despite the promising performance in identifying ICA/CCA ratios, our NLP system still exhibits some limitations, primarily related to occasional variations in report text formats that might cause false negatives or missed literalities. While racially and ethnically diverse, the Veteran patient population in the VHA consists of predominantly older men, thereby limiting the generalizability of the study results. CONCLUSIONS The rules-based NLP system reliably identified degree of stenosis in our patient population, allowing for the largest study of clinical risk factors for carotid stenosis to date. The risk factors we identified for both the presence and severity of carotid stenosis largely validated previous studies on the subject, suggesting that this NLP tool may be able to create large cohorts for future research studies. The risk factors were also similar to well-established risk factors ASCVD, suggesting that prevention strategies used for CVD may also reduce the risk of carotid stenosis across the disease spectrum. Data Availability Deidentified patient-level data are currently accessible to all VA researchers with appropriate IRB approvals. ACKNOWLEDGEMENTS This research was supported by the Department of Veterans Affairs, Veterans Health Administration, Office of Research and Development, Biomedical Laboratory Research and Development Service Award I01-BX0061459 and IK2-BX006551. This work was supported using resources and facilities of the Department of Veterans Affairs (VA) Informatics and Computing Infrastructure (VINCI), including data analytics conducted by its Precision Medicine research team, which is funded under the research priority to Put VA Data to Work for Veterans (VA ORD 24-D4V-02). The views expressed in this article are those of the authors and do not necessarily reflect the position or policy of the Department of Veterans Affairs or the United States government. JAL, PRA, PND, TD, and KMP report grants from Alnylam Pharmaceuticals, Inc., AstraZeneca Pharmaceuticals LP, Biodesix, Inc., Janssen Pharmaceuticals, Inc., Novartis International AG, Parexel International Corporation through the University of Utah or Western Institute for Veteran Research outside the submitted work. MGL reports grants from the Doris Duke Foundation (2023-0224, research funding to the institution from MyOme, and consulting fees from BridgeBio outside the submitted work. SMD reports grants from the National Heart Lung and Blood Institute, in kind support from Novo Nordisk, and consulting fees from Tourmaline Bio, outside the current work. Footnotes ↵ * Joint first authors ↵ ** Joint senior authors REFERENCES 1. ↵ Dharmakidari S , Bhattacharya P , Chaturvedi S. Carotid artery stenosis: Medical therapy, surgery, and stenting . Curr Neurol Neurosci Rep . 2017 ; 17 ( 10 ): 77 . OpenUrl CrossRef PubMed 2. Chang RW , Tucker LY , Rothenberg KA , et al. Incidence of ischemic stroke in patients with asymptomatic severe carotid stenosis without surgical intervention . JAMA . 2022 ; 327 ( 20 ): 1974 – 1982 . OpenUrl CrossRef PubMed 3. ↵ Howard DPJ , Gaziano L , Rothwell PM , Oxford Vascular Study . Risk of stroke in relation to degree of asymptomatic carotid stenosis: a population-based cohort study, systematic review, and meta-analysis . Lancet Neurol . 2021 ; 20 ( 3 ): 193 – 202 . doi: 10.1016/S1474-4422(20)30484-1 OpenUrl CrossRef PubMed 4. ↵ Kim HW , Regenhardt RW , D’Amato SA , et al. Asymptomatic carotid artery stenosis: a summary of current state of evidence for revascularization and emerging high-risk features . J Neurointerv Surg . 2023 ; 15 ( 7 ): 717 – 722 . doi: 10.1136/jnis-2022-018732 OpenUrl Abstract / FREE Full Text 5. ↵ de Weerd M , Greving JP , Hedblad B , et al. Prevalence of asymptomatic carotid artery stenosis in the general population: an individual participant data meta-analysis . Stroke . 2010 ; 41 ( 6 ): 1294 – 1297 . doi: 10.1161/STROKEAHA.110.581058 OpenUrl Abstract / FREE Full Text 6. ↵ Grant EG , Benson CB , Moneta GL , et al. Carotid artery stenosis: gray-scale and Doppler US diagnosis–Society of Radiologists in Ultrasound Consensus Conference . Radiology . 2003 ; 229 ( 2 ): 340 – 346 . OpenUrl CrossRef PubMed Web of Science 7. ↵ Hathout GM , Fink JR , El-Saden SM , Grant EG . Sonographic NASCET index: a new doppler parameter for assessment of internal carotid artery stenosis . AJNR Am J Neuroradiol . 2005 ; 26 ( 1 ): 68 – 75 . OpenUrl PubMed Web of Science 8. ↵ Hackam DG . Optimal Medical Management of Asymptomatic Carotid Stenosis . Stroke . 2021 ; 52 ( 6 ): 2191 – 2198 . doi: 10.1161/STROKEAHA.120.033994 OpenUrl CrossRef PubMed 9. ↵ Gasior SA , O’Donnell JPM , Davey M , et al. Optimal Management of Asymptomatic Carotid Artery Stenosis: A Systematic Review and Network Meta-Analysis . Eur J Vasc Endovasc Surg . 2023 ; 65 ( 5 ): 690 – 699 . doi: 10.1016/j.ejvs.2023.01.020 OpenUrl CrossRef PubMed 10. ↵ de Weerd M , Greving JP , de Jong Anne W F and Buskens E , Bots ML . Prevalence of asymptomatic carotid artery stenosis according to age and sex: systematic review and metaregression analysis . Stroke . 2009 ; 40 ( 4 ): 1105 – 1113 . OpenUrl Abstract / FREE Full Text 11. ↵ Song P , Fang Z , Wang H , et al. Global and regional prevalence, burden, and risk factors for carotid atherosclerosis: a systematic review, meta-analysis, and modelling study . Lancet Glob Health . 2020 ; 8 ( 5 ): e721 – e729 . OpenUrl PubMed 12. ↵ Pons E , Braun LMM , Hunink MGM , Kors JA . Natural Language Processing in Radiology: A Systematic Review . Radiology . 2016 ; 279 ( 2 ): 329 – 343 . doi: 10.1148/radiol.16142770 OpenUrl CrossRef PubMed 13. ↵ Chan C , Fort D , Velasco-Gonzalez C , et al. Rapid progression of carotid stenosis was rare in a large integrated healthcare system during an eight-year period . J Vasc Surg . 2021 ; 73 ( 5 ): 1623 – 1629 . OpenUrl PubMed 14. ↵ Mowery DL , Chapman BE , Conway M , et al. Extracting a stroke phenotype risk factor from Veteran Health Administration clinical reports: an information content analysis . J Biomed Semantics . 2016 ; 7 ( 1 ): 26 . OpenUrl PubMed 15. Wu X , Zhao Y , Radev D , Malhotra A. Identification of patients with carotid stenosis using natural language processing . Eur Radiol . 2020 ; 30 ( 7 ): 4125 – 4133 . OpenUrl PubMed 16. ↵ Chang RW , Tucker LY , Rothenberg KA , et al. Establishing a carotid artery stenosis disease cohort for comparative effectiveness research using natural language processing . J Vasc Surg . 2021 ; 74 ( 6 ): 1937 – 1947 .e3. OpenUrl PubMed 17. ↵ Cornia R , Patterson O V , Ginter T , Duvall SL . Rapid NLP Development with Leo . In: American Medical Informatics Association Annual Symposium .; 2014 . https://api.semanticscholar.org/CorpusID:45097230 18. ↵ Gornik HL , Rundek T , Gardener H , et al. Optimization of duplex velocity criteria for diagnosis of internal carotid artery (ICA) stenosis: A report of the Intersocietal Accreditation Commission (IAC) Vascular Testing Division Carotid Diagnostic Criteria Committee . Vasc Med . 2021 ; 26 ( 5 ): 515 – 525 . OpenUrl PubMed 19. ↵ IAC Vascular Testing Communication Updated Recommendations for Carotid Stenosis Interpretation Criteria . Intersocietal Accreditation Commission, Vascular Testing . October 2021 . Accessed December 4, 2024 . https://intersocietal.org/wp-content/uploads/2021/10/IAC-Vascular-Testing-Communication_Updated-Recommendations-for-Carotid-Stenosis-Interpretation-Criteria.pdf . 20. ↵ Arnold-Reed DE , Brett T , Troeung L , et al. Detection and management of familial hypercholesterolaemia in primary care in Australia: protocol for a pragmatic cluster intervention study with pre-post intervention comparisons . BMJ Open . 2017 ; 7 ( 10 ): e017539 . OpenUrl Abstract / FREE Full Text 21. ↵ Rubin DB . Statistical Matching Using File Concatenation With Adjusted Weights and Multiple Imputations . Journal of Business & Economic Statistics . 1986 ; 4 ( 1 ): 87 – 94 . doi: 10.1080/07350015.1986.10509497 OpenUrl CrossRef 22. ↵ Morris TP , White IR , Royston P. Tuning multiple imputation by predictive mean matching and local residual draws . BMC Med Res Methodol . 2014 ; 14 ( 1 ): 75 . OpenUrl CrossRef PubMed 23. ↵ Scott SC , Goldberg MS , Mayo NE . Statistical assessment of ordinal outcomes in comparative studies . J Clin Epidemiol . 1997 ; 50 ( 1 ): 45 – 55 . OpenUrl CrossRef PubMed Web of Science 24. ↵ Bender R , Grouven U. Ordinal logistic regression in medical research . J R Coll Physicians Lond . 1997 ; 31 ( 5 ): 546 – 551 . OpenUrl PubMed Web of Science 25. ↵ Edlinger M , van Smeden M , Alber Hannes F and Wanitschek M , Van Calster B. Risk prediction models for discrete ordinal outcomes: Calibration and the impact of the proportional odds assumption . Stat Med . 2022 ; 41 ( 8 ): 1334 – 1360 . OpenUrl PubMed 26. ↵ Bender R , Grouven U. Using binary logistic regression models for ordinal data with non-proportional odds . J Clin Epidemiol . 1998 ; 51 ( 10 ): 809 – 816 . OpenUrl CrossRef PubMed Web of Science 27. ↵ Liu A , He H , Tu XM , Tang W. On testing proportional odds assumptions for proportional odds models . Gen Psychiatr . 2023 ; 36 ( 3 ): e101048 . OpenUrl 28. ↵ Allison PD . Logistic Regression Using the SAS System: Theory and Application . 1st ed. SAS Publishing ; 1999 . 29. ↵ Clogg CC , Petkova E , Haritou A. Statistical Methods for Comparing Regression Coefficients Between Models . American Journal of Sociology . 1995 ; 100 ( 5 ): 1261 – 1293 . doi: 10.1086/230638 OpenUrl CrossRef Web of Science 30. ↵ Liu Y , Zhu Y , Jia W , et al. Association between lipid profiles and presence of carotid plaque . Sci Rep . 2019 ; 9 ( 1 ): 18011 . OpenUrl PubMed 31. ↵ Alsalmi DK , Abdeen R. Prevalence and risk factors of carotid artery stenosis (CAS) among cardiac surgery patients . Cureus . 2023 ; 15 ( 4 ): e37634 . OpenUrl 32. ↵ Arnett DK , Blumenthal RS , Albert MA , et al. 2019 ACC/AHA Guideline on the Primary Prevention of Cardiovascular Disease: Executive Summary: A Report of the American College of Cardiology/American Heart Association Task Force on Clinical Practice Guidelines . Circulation . 2019 ; 140 ( 11 ): e563 – e595 . doi: 10.1161/CIR.0000000000000677 OpenUrl CrossRef PubMed 33. ↵ Gil-Peralta A , Alter M , Lai SM , et al. Duplex Doppler and spectral flow analysis of racial differences in cerebrovascular atherosclerosis . Stroke . 1990 ; 21 ( 5 ): 740 – 744 . doi: 10.1161/01.str.21.5.740 OpenUrl Abstract / FREE Full Text 34. Lal BK , Meschia JF , Brott TG , et al. Race differences in high-grade carotid artery stenosis . Stroke . 2021 ; 52 ( 6 ): 2053 – 2059 . OpenUrl PubMed 35. Rockman CB , Hoang H , Guo Y , et al. The prevalence of carotid artery stenosis varies significantly by race . J Vasc Surg . 2013 ; 57 ( 2 ): 327 – 337 . OpenUrl CrossRef PubMed 36. ↵ Renedo D , Acosta JN , Sujijantarat N , et al. Carotid Artery Disease Among Broadly Defined Underrepresented Groups: The All of Us Research Program . Stroke . 2022 ; 53 ( 3 ): e88 – e89 . doi: 10.1161/STROKEAHA.121.037554 OpenUrl CrossRef PubMed 37. ↵ Oddone EZ , Horner RD , Sloane R , et al. Race, presenting signs and symptoms, use of carotid artery imaging, and appropriateness of carotid endarterectomy . Stroke . 1999 ; 30 ( 7 ): 1350 – 1356 . OpenUrl Abstract / FREE Full Text 38. ↵ Hicks CW , Daya NR , Black 3rd JH , Matsushita K , Selvin E. Race and sex-based disparities associated with carotid endarterectomy in the Atherosclerosis Risk in Communities (ARIC) study . Atherosclerosis . 2020 ; 292 : 10 – 16 . OpenUrl PubMed 39. ↵ Pothof AB , Soden PA , Deery SE , et al. The impact of race on outcomes after carotid endarterectomy in the United States . J Vasc Surg . 2018 ; 68 ( 2 ): 426 – 435 . OpenUrl PubMed 40. ↵ Wise ES , Ladner TR , Song J , et al. Race as a predictor of delay from diagnosis to endarterectomy in clinically significant carotid stenosis . J Vasc Surg . 2015 ; 62 ( 1 ): 49 – 56 . doi: 10.1016/j.jvs.2015.01.057 OpenUrl CrossRef PubMed View the discussion thread. Back to top Previous Next Posted May 16, 2025. Download PDF Supplementary Material Data/Code Email Thank you for your interest in spreading the word about medRxiv. NOTE: Your email address is requested solely to identify you as the sender of this article. Your Email * Your Name * Send To * Enter multiple addresses on separate lines or separate them with commas. You are going to email the following Extracting Carotid Stenosis Severity from Clinical Notes Using Natural Language Processing: Development, Validation, and Application in a Nationwide Veteran Cohort Message Subject (Your Name) has forwarded a page to you from medRxiv Message Body (Your Name) thought you would like to see this page from the medRxiv website. Your Personal Message CAPTCHA This question is for testing whether or not you are a human visitor and to prevent automated spam submissions. Share Extracting Carotid Stenosis Severity from Clinical Notes Using Natural Language Processing: Development, Validation, and Application in a Nationwide Veteran Cohort Kyung Min Lee , Patrick R. Alba , Gina M. Biagetti , Anthony Gao , Ming Yin , Peter N. Danilov , Tia DiNatale , Cristina Perez , Katherine Hartmann , Gabrielle E. Shakt , Renae L. Judy , Tiffany R. Bellomo , Kathryn M. Pridgen , Philip S. Tsao , Naveen Balasundaram , Michael G. Levin , Scott M. Damrauer , Julie A. Lynch medRxiv 2025.05.16.25327773; doi: https://doi.org/10.1101/2025.05.16.25327773 Share This Article: Copy Citation Tools Extracting Carotid Stenosis Severity from Clinical Notes Using Natural Language Processing: Development, Validation, and Application in a Nationwide Veteran Cohort Kyung Min Lee , Patrick R. Alba , Gina M. Biagetti , Anthony Gao , Ming Yin , Peter N. Danilov , Tia DiNatale , Cristina Perez , Katherine Hartmann , Gabrielle E. Shakt , Renae L. Judy , Tiffany R. Bellomo , Kathryn M. Pridgen , Philip S. Tsao , Naveen Balasundaram , Michael G. Levin , Scott M. Damrauer , Julie A. Lynch medRxiv 2025.05.16.25327773; doi: https://doi.org/10.1101/2025.05.16.25327773 Citation Manager Formats BibTeX Bookends EasyBib EndNote (tagged) EndNote 8 (xml) Medlars Mendeley Papers RefWorks Tagged Ref Manager RIS Zotero Tweet Widget Facebook Like Google Plus One Subject Area Cardiovascular Medicine Subject Areas All Articles Addiction Medicine (572) Allergy and Immunology (864) Anesthesia (302) Cardiovascular Medicine (4448) Dentistry and Oral Medicine (444) Dermatology (383) Emergency Medicine (609) Endocrinology (including Diabetes Mellitus and Metabolic Disease) (1515) Epidemiology (15240) Forensic Medicine (30) Gastroenterology (1130) Genetic and Genomic Medicine (6614) Geriatric Medicine (669) Health Economics (1000) Health Informatics (4550) Health Policy (1372) Health Systems and Quality Improvement (1613) Hematology (543) HIV/AIDS (1268) Infectious Diseases (except HIV/AIDS) (15928) Intensive Care and Critical Care Medicine (1106) Medical Education (624) Medical Ethics (147) Nephrology (668) Neurology (6621) Nursing (346) Nutrition (999) Obstetrics and Gynecology (1147) Occupational and Environmental Health (957) Oncology (3343) Ophthalmology (977) Orthopedics (369) Otolaryngology (421) Pain Medicine (436) Palliative Medicine (130) Pathology (665) Pediatrics (1695) Pharmacology and Therapeutics (693) Primary Care Research (714) Psychiatry and Clinical Psychology (5459) Public and Global Health (9248) Radiology and Imaging (2205) Rehabilitation Medicine and Physical Therapy (1371) Respiratory Medicine (1197) Rheumatology (597) Sexual and Reproductive Health (715) Sports Medicine (530) Surgery (714) Toxicology (99) Transplantation (289) Urology (265) (function(){function c(){var b=a.contentDocument||a.contentWindow.document;if(b){var d=b.createElement('script');d.innerHTML="window.__CF$cv$params={r:'a0287b83acef300f',t:'MTc3OTkyMTIxOQ=='};var a=document.createElement('script');a.src='/cdn-cgi/challenge-platform/scripts/jsd/main.js';document.getElementsByTagName('head')[0].appendChild(a);";b.getElementsByTagName('head')[0].appendChild(d)}}if(document.body){var a=document.createElement('iframe');a.height=1;a.width=1;a.style.position='absolute';a.style.top=0;a.style.left=0;a.style.border='none';a.style.visibility='hidden';document.body.appendChild(a);if('loading'!==document.readyState)c();else if(window.addEventListener)document.addEventListener('DOMContentLoaded',c);else{var e=document.onreadystatechange||function(){};document.onreadystatechange=function(b){e(b);'loading'!==document.readyState&&(document.onreadystatechange=e,c())}}}})();
Text is read by the "Ask this paper" AI Q&A widget below.
Extraction quality varies by source — PMC NXML preserves structure
cleanly, OA-HTML may include some navigation residue, and OA-PDF can
have broken hyphenation. The publisher copy
(via DOI)
is the canonical version.