Developing A Data Pipeline to Quantify Ventilator Waveforms

preprint OA: closed
📄 Open PDF Full text JSON View at publisher
Full text 50,227 characters · extracted from preprint-html · click to expand
Developing A Data Pipeline to Quantify Ventilator Waveforms | medRxiv /* */ /* */ <!-- <!-- /*! * yepnope1.5.4 * (c) WTFPL, GPLv2 */ (function(a,b,c){function d(a){return"[object Function]"==o.call(a)}function e(a){return"string"==typeof a}function f(){}function g(a){return!a||"loaded"==a||"complete"==a||"uninitialized"==a}function h(){var a=p.shift();q=1,a?a.t?m(function(){("c"==a.t?B.injectCss:B.injectJs)(a.s,0,a.a,a.x,a.e,1)},0):(a(),h()):q=0}function i(a,c,d,e,f,i,j){function k(b){if(!o&&g(l.readyState)&&(u.r=o=1,!q&&h(),l.onload=l.onreadystatechange=null,b)){"img"!=a&&m(function(){t.removeChild(l)},50);for(var d in y[c])y[c].hasOwnProperty(d)&&y[c][d].onload()}}var j=j||B.errorTimeout,l=b.createElement(a),o=0,r=0,u={t:d,s:c,e:f,a:i,x:j};1===y[c]&&(r=1,y[c]=[]),"object"==a?l.data=c:(l.src=c,l.type=a),l.width=l.height="0",l.onerror=l.onload=l.onreadystatechange=function(){k.call(this,r)},p.splice(e,0,u),"img"!=a&&(r||2===y[c]?(t.insertBefore(l,s?null:n),m(k,j)):y[c].push(l))}function j(a,b,c,d,f){return q=0,b=b||"j",e(a)?i("c"==b?v:u,a,b,this.i++,c,d,f):(p.splice(this.i++,0,a),1==p.length&&h()),this}function k(){var a=B;return a.loader={load:j,i:0},a}var l=b.documentElement,m=a.setTimeout,n=b.getElementsByTagName("script")[0],o={}.toString,p=[],q=0,r="MozAppearance"in l.style,s=r&&!!b.createRange().compareNode,t=s?l:n.parentNode,l=a.opera&&"[object Opera]"==o.call(a.opera),l=!!b.attachEvent&&!l,u=r?"object":l?"script":"img",v=l?"script":u,w=Array.isArray||function(a){return"[object Array]"==o.call(a)},x=[],y={},z={timeout:function(a,b){return b.length&&(a.timeout=b[0]),a}},A,B;B=function(a){function b(a){var a=a.split("!"),b=x.length,c=a.pop(),d=a.length,c={url:c,origUrl:c,prefixes:a},e,f,g;for(f=0;f<d;f++)g=a[f].split("="),(e=z[g.shift()])&&(c=e(c,g));for(f=0;f<b;f++)c=x[f](c);return c}function g(a,e,f,g,h){var i=b(a),j=i.autoCallback;i.url.split(".").pop().split("?").shift(),i.bypass||(e&&(e=d(e)?e:e[a]||e[g]||e[a.split("/").pop().split("?")[0]]),i.instead?i.instead(a,e,f,g,h):(y[i.url]?i.noexec=!0:y[i.url]=1,f.load(i.url,i.forceCSS||!i.forceJS&&"css"==i.url.split(".").pop().split("?").shift()?"c":c,i.noexec,i.attrs,i.timeout),(d(e)||d(j))&&f.load(function(){k(),e&&e(i.origUrl,h,g),j&&j(i.origUrl,h,g),y[i.url]=2})))}function h(a,b){function c(a,c){if(a){if(e(a))c||(j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}),g(a,j,b,0,h);else if(Object(a)===a)for(n in m=function(){var b=0,c;for(c in a)a.hasOwnProperty(c)&&b++;return b}(),a)a.hasOwnProperty(n)&&(!c&&!--m&&(d(j)?j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}:j[n]=function(a){return function(){var b=[].slice.call(arguments);a&&a.apply(this,b),l()}}(k[n])),g(a[n],j,b,n,h))}else!c&&l()}var h=!!a.test,i=a.load||a.both,j=a.callback||f,k=j,l=a.complete||f,m,n;c(h?a.yep:a.nope,!!i),i&&c(i)}var i,j,l=this.yepnope.loader;if(e(a))g(a,0,l,0);else if(w(a))for(i=0;i (function(w,d,s,l,i){w[l]=w[l]||[];w[l].push({'gtm.start':new Date().getTime(),event:'gtm.js'});var f=d.getElementsByTagName(s)[0];var j=d.createElement(s);var dl=l!='dataLayer'?'&l='+l:'';j.src='//www.googletagmanager.com/gtm.js?id='+i+dl;j.type='text/javascript';j.async=true;f.parentNode.insertBefore(j,f);})(window,document,'script','dataLayer','GTM-P4HH5NV'); Skip to main content Home About Submit ALERTS / RSS Search for this keyword Advanced Search Developing A Data Pipeline to Quantify Ventilator Waveforms Peter D Sottile , Lenny Larchick , J.N. Stroh , David Albers , Bradford Smith doi: https://doi.org/10.1101/2025.10.28.25339000 Peter D Sottile 1 Division of Pulmonary, Allergy, and Critical Care Medicine, University of Colorado | Anschutz School of Medicine MD Find this author on Google Scholar Find this author on PubMed Search for this author on this site For correspondence: peter.sottile{at}cuanschutz.edu Lenny Larchick 2 UCHealth Find this author on Google Scholar Find this author on PubMed Search for this author on this site J.N. Stroh 3 Department of Bioinformatics, University of Colorado | Anschutz School of Medicine PhD Find this author on Google Scholar Find this author on PubMed Search for this author on this site David Albers 3 Department of Bioinformatics, University of Colorado | Anschutz School of Medicine PhD Find this author on Google Scholar Find this author on PubMed Search for this author on this site Bradford Smith 4 Department of Bioengineering, University of Colorado Denver | Anschutz Medical Campus 5 Department of Pediatrics, University of Colorado | Anschutz School of Medicine PhD Find this author on Google Scholar Find this author on PubMed Search for this author on this site Abstract Full Text Info/History Metrics Supplementary material Data/Code Preview PDF A bstract O bjective To automatically collect ventilator waveforms and integrate them with curated electronic health record data from thousands of patients to provide the data necessary to analyze the complex interactions between lung injury, patient effort, ventilator dyssynchrony, and ventilator mechanics. Such datasets do not currently exist, hampering the understanding of ventilator trajectories. D esign A prospective, observational study which utilizes a multidisciplinary team of data scientists, biomedical engineers, and clinicians to develop an automated pipeline collecting high-fidelity ventilator waveform data and integrating these data with electronic health record data, including vital signs, sedation and agitation scores, lab results, and medications (drug, dose, and route). Importantly, electronic health record data are collected over a patient’s entire hospital course, allowing for a complete description of patient trajectories. S ettings The Medical Intensive Care Unit at the University of Colorado. P atients All mechanically ventilated adult patients. I nterventions None. M easurements Automated collection of high-fidelity ventilator waveforms and electronic health record data. R esults Between July 2023 and May 2025, we collected data from 1,116 patients, 968 (87%) of whom had >12 hours of mechanical ventilation. These patients generated 4,767 ventilator days (>13 ventilator years) of analyzable ventilator waveforms and had a median duration of ventilation of 2.6[1.25, 6.06] days. Over 146 million breaths were segmented from the waveforms, of which 49 million breaths were able to fit the linear single-compartment model accurately and had a median compliance of 35.7 [25.2, 45.3] mL/H 2 O. Electronic health record data was linked to the waveforms to provide 8,511 [3,835, 17,040] records per patient. These data constitute a comprehensive database for studying the effects of mechanical ventilation, patient effort, ventilator dyssynchrony, and key non-ventilator covariates, such as sedation, across a large and heterogeneous cohort of patients. C onclusion We created a fully automated data pipeline to continuously collect mechanical ventilation waveform data and integrate it with detailed EHR data to generate a unique, high-fidelity dataset that will be crucial for understanding the complex relationships among lung injury, patient effort, sedation, ventilator dyssynchrony, and ventilator mechanics. Q uestion To create an automated data pipeline to collect and integrate continuous ventilator waveform data with electronic health record data. F indings Between July 2023 and May 2025, we automatically collected data from 1,116 patients, 968 (87%) of whom received mechanical ventilation for more than 12 hours. M eaning This fully automated data collection pipeline will facilitate advances in understanding the complex relationships between lung injury, patient effort, sedation, ventilator dyssynchrony, and ventilator mechanics. I ntroduction Invasive mechanical ventilation is a life-saving intervention. Continuous ventilator waveforms of airway pressure, flow, and volume are routinely displayed on modern ventilators, providing detailed diagnostic and prognostic information at the bedside related to lung physiology and injury, patient respiratory effort, ventilator dyssynchrony, and ventilator mechanics, which can rapidly change over time.( 1 ) However, systematic and longitudinal analysis of these data have historically been limited to a few descriptive variables, such as tidal volume, peak inspiratory pressure, or respiratory rate. Such variables are recorded relatively infrequently in the electronic health record (EHR) and inadequately capture the feature-rich, high-fidelity waveform data observed at the bedside. Importantly, mechanical ventilation can injure the lungs.( 2 ) Ventilator-induced lung injury (VILI) is caused by increases in lung strain (approximated as volumetric lung deformation) and stress (approximated as the force per unit area or transpulmonary pressure).( 3 , 4 ). Low-tidal volume ventilation is one strategy to decrease lung strain and stress in patients, thereby improving outcomes in patients both at risk for and with acute respiratory distress syndrome (ARDS).( 5 – 9 ) However, low-tidal volume ventilation does not always prevent VILI, especially in the presence of respiratory efforts.(10– 13) Indeed, ventilator dyssynchrony is defined as the inappropriate timing and delivery of a ventilator breath in response to respiratory effort and is associated with increased markers of lung strain and stress, as well as increased mortality.( 14 – 21 ) Consequently, to understand the complex interactions between lung injury, patient effort, ventilator dyssynchrony, sedation, and ventilator mechanics, it is essential to analyze complete waveforms of each breath, as details related to lung mechanics, patient effort, and ventilator dyssynchrony are not well captured in traditional descriptive electronic health record (EHR) data. Such detailed data have been unavailable for analysis due to several reasons. First, the average patient receiving mechanical ventilation receives over 25,000 breaths daily. Historically, nearly 40% of intensive care unit (ICU) admissions require mechanical ventilation, resulting in millions of mechanically ventilated breaths daily in a single hospital.( 22 ) To recapitulate the details of airway pressure, flow, and volume waveforms, data must be captured at a sufficient resolution, typically 30-50 Hz for each waveform, over the entire course of mechanical ventilation (typically several days). Moreover, to fully understand a patient’s clinical course, data must be collected throughout their entire duration of mechanical ventilation. For instance, snapshots of data miss short but critical events (i.e., clusters of dyssynchrony) that define a patient’s clinical trajectory, while the development and resolution of VILI occurs over days.( 23 ) The technology to capture, transmit, and store these data has only recently been introduced to the ICU, generating tremendous amounts of data that healthcare systems have traditionally been ill-equipped to collect. Second, elucidating meaningful interpretations of these waveform data throughout mechanical ventilation requires the development of automated analysis pipelines. A single patient generates approximately 25,000 breaths in a day, which rapidly scales to millions when studying hundreds or thousands of patients. Tasks range from the seemingly simple to the complex, including 1) extracting waveform data from different ventilators, 2) securely transmitting that data to secure servers, 3) transforming waveform data into usable data streams, 4) segmenting continuous waveforms into individual breaths, 5) aligning timestamps from different sources (ventilator and EHR), and 6) developing methods to analyze individual breaths, including the creation and validation of automated machine learning algorithms to identify dyssynchrony and quantify critical features observed in ventilator waveforms.( 15 , 24 – 33 ) Only in the last decade has the computational capacity to handle such tasks become readily available. Third, waveform data only partially describes the respiratory system and lacks the context of the patient’s condition, treatments, and outcomes. Ventilation strategies often require a delicate balance between optimizing respiratory targets, minimizing sedation, and ensuring adequate hemodynamics. In other words, the ventilator is not utilized in isolation from the rest of the patient. Consequently, accurately interpreting ventilator waveform data requires quantifying the broader context of the patient’s condition. To accomplish this, ventilator waveform data must be integrated into the larger EHR, including vital signs, sedation and agitation scores, lab results, positioning, fluid balance, and medication strategies (e.g., sedation). Finally, developing such pipelines requires a multidisciplinary team of data scientists, biomedical engineers, health system information technology (IT) experts, and clinicians to build, test, and validate the end-to-end data pipeline. Integrating waveform pipelines with EHR data requires motivated and persistent individuals with expertise in wrangling incomplete and “messy” EHR data. Building such teams has only recently become a priority for healthcare systems. O bjective The inability to automatically capture ventilator waveform data and integrate it with curated EHR results throughout a patient’s entire hospital encounter impairs our understanding of the complex interactions between lung injury, patient effort, ventilator dyssynchrony, sedation strategies, and ventilator mechanics. Prior data are limited to short durations of mechanical ventilation or lack integration with the EHR to obtain key non-ventilator covariates. Large, heterogeneous databases with such data do not exist for analysis. Moreover, building such a pipeline is the first step in leveraging these data streams for real-time clinical utilization by developing, testing, and validating predictive models to inform clinical decision-making. Consequently, we sought to develop a secure computational pipeline to automatically collect high-fidelity ventilator waveform data on all mechanically ventilated patients in the Medical Intensive Care Unit (MICU) at the University of Colorado, a quaternary-care university hospital. We integrated these data with EHR data, including vital signs, sedation and agitation scores, lab results, and medications (drug, dose, and route) from the entire hospitalization. This pipeline conforms to modern data exchange standards (Health Level Seven International (HL7)) and regulatory requirements (Health Insurance Portability and Accountability Act (HIPAA)), satisfying both US regulatory requirements and international interoperability expectations.( 34 – 36 ) Previously, such a dataset did not exist to aid ventilator research. This study presents a computational pipeline and describes the dataset collected to facilitate future studies aimed at reducing ventilation-related morbidity and mortality, providing insight into the effects of ventilator dyssynchrony and key non-ventilatory covariates, such as sedation, in a large and heterogeneous patient cohort. M aterials and M ethods P atients I ncluded The data pipeline was developed at the UCHealth University of Colorado Hospital to capture data from all patients admitted to the Medical Intensive Care Unit (MICU) who receive mechanical ventilation. The UCHealth University of Colorado Hospital is a multi-specialty, quaternary hospital with over 800 beds and 2.6 million annual patient visits. The MICU provides sub-specialty care for adult patients, ages greater than 14 years old, with a variety of critical illnesses, including septic shock, ARDS, and general respiratory failure (i.e., pneumonia, asthma, interstitial lung disease (ILD), chronic obstructive pulmonary disease (COPD)), gastrointestinal hemorrhage, and a variety of oncological disorders. The MICU does not routinely care for postoperative patients or patients with primary cardiac pathology. Patients are ventilated in the MICU with either a Hamilton G5 or a C6 ventilator (Hamilton Medical AG, Switzerland). This data pipeline was approved by the University of Colorado Combined Institutional Review Board (COMIRB, #20-2160) with waived consent, allowing the collection of clinical waveform and EHR data from all mechanically ventilated patients. D evelopment of A D ata M odel Ventilator data, including continuous airway pressure, flow, and volume measured at 50 Hz, are included to recapitulate ventilator waveforms. Ventilator settings are captured once per minute, including set ventilator mode, tidal volume, inspiratory pressure, positive end-expiratory pressure (PEEP), rate, inspiratory to expiratory time ratio (I:E ratio), rise time, flow pattern, and other mode-specific settings (i.e., high time (t-high) if the patient was in an airway pressure release ventilation (APRV) mode of ventilation). EHR data included patient age, sex, race, ethnicity, vital signs (i.e, temperature, blood pressure, heart rate, observed respiratory rate, pulse oximetry), physiologic data (i.e, Richmond Agitation and Sedation Score (RASS), hourly urine output, patient positioning, and nursing and respiratory therapist assessments), all laboratory test results, medication administration times, route, and dosages (i.e., vasopressors, sedatives, anxiolytics, and neuromuscular blockage agents), in-hospital transfers between units, and outcomes (i.e., discharge location and mortality). These data were deemed necessary by the clinical team to understand the effects of mechanical ventilation, especially ventilator dyssynchrony, and key non-ventilator covariates, such as sedation, on a large and heterogeneous patient cohort. W aveform D ata C ollection We established a team within UCHealth comprising data scientists, biomedical engineers, health system information technology (IT) experts, and clinicians to collect high-fidelity waveform data as outlined in Figure 1 . Each bed in the MICU uses the Capsule Neuron 3 (Philips, Cambridge, MA) to automate data collection from accessory devices, including IV pumps, dialysis machines, and mechanical ventilators. The Capsule management software is part of the on-site hospital computing infrastructure, running on a local virtual machine (VM) (VM1 in Figure 1 ). This software allows for the management of the Neurons (including updating software and changing settings), facilitates the translation of proprietary ventilator data streams to HL7, and has ‘output connectors’ for transferring the data to the desired data sink. The Capsule management software sends clinical production data to the local Epic instance (Epic, Verona, WI, US) and the research waveform data through our research pipeline. The details of our research data pipeline, including data transfer, transformation, breath segmentation, and pipeline monitoring, are described in Appendix I: Waveform Data Processing. Download figure Open in new tab Figure 1: Data pipeline flowchart: Ventilator waveform data travels through the Capsule Neuron in-room devices to a management server (Virtual Machine 1). This pathway shares infrastructure with the production EHR pipeline. The data are then sent to Virtual Machine 2, where they are aggregated and uploaded to an Azure Cloud Storage instance. This infrastructure is hospital-managed but not part of the production EHR pipeline. Our research server downloads those waveforms once daily for the Azure Cloud. EHR data is provided by Health Data Compass on request and linked to the waveforms using bed occupancy. E hr I ntegration We leverage Health Data Compass (HDC) ( healthdatacompass.org ), a multi-institutional health data warehouse at UCHealth, to link time-stamped patient-specific EHR data to the ventilator waveform data. Patient data is integrated into the HDC enterprise data warehouse through processes developed by software engineers to extract data from various source systems, transform that data into a standard schema (OMOP CDM V5), and load the data into the data warehouse. Relevant administrative and clinical data are then extracted into data marts. The details of our research EHR data pipeline are described in Appendix II: EHR Integration. R egulatory C ompliance This data pipeline was primarily designed to maintain HIPAA and HL7 compliance. Importantly, HDC data analysts provide institutional honest-broker services for investigators requiring access to limited data sets, de-identified data sets, or data marts, which are critical to this project. The Colorado Clinical and Translational Sciences Institute (CCTSI) ensures the HIPAA compliance of the research computational server. W aveform A nalysis Basic individual-breath descriptive variables, such as peak pressure, peak flow, delivered tidal volume, respiratory rate, and observed PEEP, are readily calculated from the raw waveform data. The continuous waveform data also allows for the calculation of more advanced metrics. For example, the linear single compartment model (SCM) model was efficiently fit to each breath using matrix inversion, yielding accurate estimates of resistance and compliance independent of specific ventilator maneuvers performed at the bedside to measure these values.( 37 ) Moreover, continuous mechanical power was directly calculated as the time-based integral of the pressure flow product for each breath. Patient characteristics or other EHR derived variables can then stratify these data. To demonstrate the power of these data, we utilized International Classification of Diseases, 10th revision (ICD-10) codes to identify patients with ARDS or ARDS risk factors, as previously described. We compared them with patients with other causes of respiratory failure.( 38 – 40 ) Values were compared with logistic regressions for binomial tests, Wilcoxon rank sum for non-normally distributed variables, t-tests for normally distributed variables, and mixed-effects models to account for repeated measurements within a patient for breath characteristics. Importantly, these data lend themselves to much more nuanced, time-based analysis. R esults This rich, unique data pipeline yields a substantial amount of harmonized data detailing the entire patient encounter. Between July 2023 and May 2025, we collected data from 1116 patients, 968 (87%) of whom had received mechanical ventilation for more than 12 hours. Of these patients, 704 (72%) have ARDS or ARDS risk factors as defined by ICD-10 codes, and 421 were female (43%); demographics are detailed in Table 1 . Patients had an average age of 55.2 ± 17.4 and an in-hospital mortality of 33.8%. View this table: View inline View popup Download powerpoint Table 1: Descriptive characteristics (demographics, IV infusions for analgesia, sedation, and neuromuscular blockade, RASS, and mortality) of patients captured by the data pipeline between July 2023 and May 2025 and stratified by patients with ARDS or ARDS risk factors compared to other patients. * p < 0.05, *** p 13 ventilator years) of analyzable ventilator waveforms and had a median duration of ventilation of 2.6 [IQR 1.25, 6.06] days. Waveform data generated 146 million individual breaths. Our rule-based segmentation algorithm achieved an accuracy of over 97.1% in matching the start and stop points of breaths within 0.1 seconds, compared with the approach used by the Hamilton DataLogger software, which identifies when the ventilator’s inspiratory and expiratory valves open and close. Equally important, our pipeline monitoring tools improved and ensured the collection of complete data, as demonstrated in Figure 2 . Download figure Open in new tab Figure 2: Ventilator Utilization and Data Pipeline Uptime: Time series of the number of simultaneous MICU ventilator waveforms collected over time (blue). Red bands show pipeline outages. The linkage of EHR to waveform data was effective, and 98.3% of 2024 waveforms were assigned to a patient with waveform data, as shown in Figure 3 . Temporal alignment of EHR and waveform data was checked by comparing the waveform-estimated and EHR-reported PEEP. The median difference was −0.06 [−0.25, 0.03] cmH 2 O, and inspection of breaths with substantial errors shows many instances of respiratory efforts pulling the waveforms below the set (EHR-reported) PEEP. Download figure Open in new tab Figure 3: Ventilator Utilization vs Bed Occupancy Overlap between ventilator waveform data (heavy black lines) and patient bed occupancy from the EHR (narrower colored lines). Each patient is shown in a unique color. EHR data is only received for discharged patients, which explains the ventilator waveforms without corresponding patients from April 2025 onward. Hamilton’s dual-mode ventilation (adaptive pressure ventilation with controlled mandatory ventilation (APVcmv)) was the most commonly utilized (59.4% of breaths), followed by pressure control (16.6% of breaths) and pressure support (14.2% of breaths). The SCM was fit to each breath. The SCM coefficient of determination (COD) is a measure of fit quality for which we assigned an empirical threshold COD = 0.985 based on visual inspection of the data to identify breaths with signs of respiratory effort. Using this threshold, respiratory effort (or other factors) decreased model fit in 97 million breaths. In the 49 million breaths with accurate fits, the compliance was 35.7 [25.2, 45.3] mL/cmH 2 O and the resistance was 11.4 [9.7, 13.8] cmH 2 O/L/s. Table 2 shows basic descriptors calculated for each breath. These SCM calculated compliance values correlated with clinical values recorded by the RT (Pearson Correlation: 0.86) and could be calculated more frequently; a median of every 0.046 minutes [0.038, 0.056] compared to RT documentation (a median of every 255 minutes [195, 390]). Finally, mechanical power was calculated for every breath from pressure and flow waveforms, with each breath dissipating a median of 8.8 [6.2, 12.5] J/s. View this table: View inline View popup Download powerpoint Table 2: Descriptive Properties of Breaths of in Patients with ARDS or ARDS Risk factors compared to other etiologies of respiratory failure. E rs : respiratory system elastance which is the inverse of compliance, R rs : respiratory system resistance. RR : respiratory rate, V t : observed tidal volume, normalized to predicted body weight, PIP : peak inspiratory pressure, PEEP : positive end expiratory pressure. All reported values are median [25%, 75% inter-quartile range]. EHR data was similarly rich, with a median of 8,511 [3,835, 17,040] records per patient. For instance, a total of 12,351 ABGs were collected during these patients’ care, a median of 6 [2, 16] per patient, with a mean pH of 7.37 ± 0.078, P a CO 2 of 37.1 ± 9.1, and P a O 2 of 97.7 ± 27.3. Moreover, an hourly ratio could be easily calculated from documented clinical flow sheet data, yielding 122,000 data points with a mean of 185.7 ± 67.2 and generating a high fidelity measure of respiratory failure severity that is highly correlated with mortality.( 41 – 45 ) Finally, the Richmond Agitation and Sedation Score (RASS) is documented a median of 75 times per patient [IQR 30-134] and a median score of −0.87 [−1.71, −0.41]. A total of 96% of patients received continuous analgesics with fentanyl drips, and 93% received sedation with propofol drips. A total of 7.2% of patients received neuromuscular blockade (NMB) during their course of mechanical ventilation. D iscussion This paper describes a comprehensive data pipeline for integrating continuous ventilator waveform data with detailed EHR data necessary to describe the complex interactions between lung injury, patient effort, ventilator dyssynchrony, sedation, and ventilator mechanics. The data pipeline and resulting dataset have several unique aspects. First, the dataset captures the patient’s entire hospital course. This facilitates detailed analysis of patient trajectories. Second, we capture both ventilator and EHR data. With this dense data collection, we can define high-fidelity subphenotypes and treatable traits, delineate sophisticated lung state markers, and track intermediate, short-term markers of VILI. This allows us to investigate how clinical interventions affect short-term changes, such as those observed 6 or 12 hours later, as well as classic long-term outcomes, including ventilator length of stay and mortality. Third, the dataset includes numerous time-varying covariates, such as markers of lung physiology, evolving sedation strategies, and temporal changes in the severity of illness. This enables complex time-series analysis that surpasses traditional multivariable adjustments based on variables collected at admission and analyzed in relation to discharge outcomes. Finally, these data include all mechanically ventilated patients in the MICU, a rich and heterogeneous population with causes of acute respiratory failure, including, but not limited to, ARDS. Moreover, this data pipeline represents a significant multidisciplinary investment. A skilled team of data scientists, biomedical engineers, health system information technology experts, and clinicians was necessary to build, test, and validate the end data. Indeed, without HDC, obtaining EHR data would have been infinitely more difficult. Even with the HDC team in place, building and refining the waveform data pipeline took over 2 years and was only possible with the UCHealth team’s gracious and skilled assistance. This study has several limitations. First, we record waveform data only in the MICU. While EHR data is available, periods of mechanical ventilation in other units (i.e., emergency department, operating room, time in other ICUs, or during transport) are missing from the waveform data. Expansion to include other departments is feasible in future iterations of our data pipeline and requires simply expanding the Capsule licensing to these units. Transportation periods are generally short — less than 10 minutes — and unlikely to significantly alter a patient’s clinical course. Second, that data is observational, limiting causal analysis. Although the data set is rich, unmeasured confounders are present. Particularly, it is difficult to capture the reasoning behind a given clinical intervention. Third, this dataset is from a single ICU (MICU) at a single hospital, using a single brand of ventilator. Thus, any observations may not be generalizable beyond our institute. Finally, this data is derived from the EHR. Finally, these data incorporate elements of the EHR, such as vital signs and ICD-10 codes, that are manually entered and susceptible to error. Similarly, because data are entered irregularly during clinical care, it is impossible to quantify missingness from the dataset. Many of these limitations can be overcome by generating large-scale, multi-site ventilator waveforms and EHR datasets containing a spectrum of ventilator types and care practices. This requires first establishing standards for data formatting, structure, and file types. For the EHR, we must determine a set of necessary covariates with defined data types and units. For categorical variables, such as ventilator mode, standard definitions must be established and consistently applied. Definitions related to waveforms will be more challenging. They should start with a common language for breath types (e.g., ventilator dyssynchrony types) that clearly delineates the start and end of every kind of breath. We must then establish a standard methodology for segmenting breaths to enable interoperability between data collected from and analyses performed at multiple sites. C onclusion For the first time, we created a fully automated data pipeline to continuously collect mechanical ventilation waveform data and integrate it with detailed EHR data to generate a unique, high-fidelity dataset. This dataset will facilitate future observational studies to delineate the complex relationships between lung injury, patient effort, sedation, ventilator dyssynchrony, and ventilator mechanics. Moreover, creating such a data pipeline is the first step in leveraging these data streams for real-time clinical utilization, which involves building, testing, and validating predictive models to inform clinical decision-making. Data Availability All data produced in the present study are available upon reasonable request to the authors D eclarations E thics A pproval This data pipeline and study were approved by the University of Colorado Combined Institutional Review Board (COMIRB, #20-2160). A vailability of data and materials The datasets generated and/or analyzed during the current study are not publicly available due to PHI. Nevertheless, a subset of de-identified and time-shifted data is available from the corresponding author upon reasonable request. A uthors’ contributions BS contributed to pipeline design and management, data analysis, and manuscript preparation and revision. PS contributed to pipeline design, data analysis, and manuscript preparation and revision. LL contributed to the design and development of the pipeline and to manuscript revision. DA and JS contributed to data analysis, manuscript preparation, and revision. A cknowledgements We would like to acknowledge Corey Montano, Michele Edelman, Michael Kahn, and Bujia Zhang at HDC for their work and assistance in building the HDC component of this data pipeline. Daniel Hoberecht and Tom Libric at UCHealth provided essential contributions to the development, testing, and deployment of the waveform infrastructure. Footnotes F inancial S upport Dr. Smith is supported by an NIH NHLBI R01 HL151630. Dr. Sottile was supported by an NIH NHLBI K23 HL145011. F inancial D isclosures and C onflicts of I nterest None G lossary ADT Admit, Discharge, Transfer s5 APRV airway pressure release ventilation 6 APVcmv adaptive pressure ventilation with controlled mandatory ventilation 7 ARDS acute respiratory distress syndrome 4, 5, 7, 8 CCTSI Colorado Clinical and Translational Sciences Institute 7, s2 COD coefficient of determination 7 COPD chronic obstructive pulmonary disease 5 EHR electronic health record 2, 3, 4, 5, 6, 7, 8, 9, 12, s1, s2, s5 HDC Health Data Compass 6, 8, 10, s5 HIPAA Health Insurance Portability and Accountability Act 5, 6 HL7 Health Level Seven International 5, 6, s2 I:E ratio inspiratory to expiratory time ratio 6 ICD-10 International Classification of Diseases, 10th revision 7 ICU intensive care unit 4, 8, 9 ILD interstitial lung disease 5 MICU Medical Intensive Care Unit 2, 5, 6, 8, 9, s5 PEEP positive end-expiratory pressure 6, 7 PHI protected health information s5 RASS Richmond Agitation and Sedation Score 6, 15 SCM single compartment model 7, 8 TCP Transmission Control Protocol s2 VILI ventilator-induced lung injury 4, 8 VM virtual machine 6, s2 B ibliography 1. ↵ Principles and Practice of Mechanical Ventilation . 3rd ed. New York : McGraw-Hill Medical ; 2013 . 2. ↵ Slutsky AS , Ranieri VM : Ventilator-Induced Lung Injury [Internet] . N Engl J Med 2013 ; 369 : 2126 – 2136 Available from: https://www.ncbi.nlm.nih.gov/pubmed/24283226%20 http://www.nejm.org/doi/pdf/10.1056/NEJMra1208707 OpenUrl CrossRef PubMed Web of Science 3. ↵ Protti A , Andreis DT , Milesi M , et al : Lung Anatomy, Energy Load, and Ventilator-Induced Lung Injury [Internet] . Intensive Care Med Exp 2015 ; 3 : 34 Available from: https://www.ncbi.nlm.nih.gov/pubmed/26671060%20 https://air.unimi.it/retrieve/handle/2434/348619/557196/40635_2015_Article_70.pdf OpenUrl PubMed 4. ↵ Bates JHT , Smith BJ : Ventilator-Induced Lung Injury and Lung Mechanics . Annals of Translational Medicine 2018 ; 6 : 378 OpenUrl PubMed 5. ↵ Webb HH , Tierney DF : Experimental Pulmonary Edema Due to Intermittent Positive Pressure Ventilation with High Inflation Pressures. Protection by Positive End-Expiratory Pressure . The American review of respiratory disease 1974 ; 110 : 556 – 565 OpenUrl PubMed Web of Science 6. Brower RG , Matthay MA , Morris A , et al : Ventilation with Lower Tidal Volumes as Compared with Traditional Tidal Volumes for Acute Lung Injury and the Acute Respiratory Distress Syndrome [Internet] . N Engl J Med 2000 ; 342 : 1301 – 1308 Available from: https://www.ncbi.nlm.nih.gov/pubmed/10793162%20 http://www.nejm.org/doi/pdf/10.1056/NEJM200005043421801 OpenUrl CrossRef PubMed Web of Science 7. Futier E , Constantin J-M , Paugam-Burtz C , et al : A Trial of Intraoperative Low-Tidal-Volume Ventilation in Abdominal Surgery . The New England journal of medicine 2013 ; 369 : 428 – 437 OpenUrl CrossRef PubMed Web of Science 8. Guay J , Ochroch EA : Intraoperative Use of Low Volume Ventilation to Decrease Postoperative Mortality, Mechanical Ventilation, Lengths of Stay and Lung Injury in Patients Without Acute Lung Injury [Internet] . Cochrane Database Syst Rev 2015 ; 12 :CD11151Available from: https://www.ncbi.nlm.nih.gov/pubmed/26641378%20 http://onlinelibrary.wiley.com/store/10.1002/14651858.CD011151.pub2/asset/CD011151.pdf?v=1&t=j6yaomf7&s=dc54d8b3e5e971cdc2dac8fda3a2c24879dff324 9. ↵ Determann RM , Royakkers A , Wolthuis EK , et al : Ventilation with Lower Tidal Volumes as Compared with Conventional Tidal Volumes for Patients Without Acute Lung Injury: A Preventive Randomized Controlled Trial [Internet] . Crit Care 2010 ; 14 : R1 Available from: https://www.ncbi.nlm.nih.gov/pubmed/20055989%20 https://www.ncbi.nlm.nih.gov/pmc/articles/PMC2875503/pdf/cc8230.pdf OpenUrl CrossRef PubMed 10. Yoshida T , Uchiyama A , Fujino Y : The Role of Spontaneous Effort During Mechanical Ventilation: Normal Lung Versus Injured Lung [Internet] . J Intensive Care 2015 ; 3 : 18 Available from: https://www.ncbi.nlm.nih.gov/pubmed/27408729%20 https://www.ncbi.nlm.nih.gov/pmc/articles/PMC4940771/pdf/40560_2015_Article_83.pdf OpenUrl PubMed 11. Yoshida T , Fujino Y , Amato MBP , et al : Fifty Years of Research in ARDS. Spontaneous Breathing during Mechanical Ventilation. Risks, Mechanisms, and Management [Internet] . Am J Respir Crit Care Med 2017 ; 195 : 985 – 992 [cited 2023 Sept 26 ] Available from: https://www.atsjournals.org/doi/10.1164/rccm.201604-0748CP OpenUrl PubMed 12. Telias I , Madorno M , Pham T , et al : Magnitude of Synchronous and Dyssynchronous Inspiratory Efforts during Mechanical Ventilation: A Novel Method . Am J Respir Crit Care Med 2023 ; 207 : 1239 – 1243 OpenUrl PubMed 13. Bertoni M , Telias I , Urner M , et al : A Novel Non-Invasive Method to Detect Excessively High Respiratory Effort and Dynamic Transpulmonary Driving Pressure during Mechanical Ventilation . Crit Care 2019 ; 23 : 346 OpenUrl PubMed 14. ↵ Gilstrap D , Davies J : Patient-Ventilator Interactions . Clin Chest Med 2016 ; 37 : 669 – 681 OpenUrl PubMed 15. ↵ Sottile PD , Albers D , Higgins C , et al : The Association Between Ventilator Dyssynchrony, Delivered Tidal Volume, and Sedation Using a Novel Automated Ventilator Dyssynchrony Detection Algorithm . Crit Care Med 2018 ; 46 : e151 – e157 OpenUrl PubMed 16. Sottile PD , Smith B , Stroh JN , et al : Flow-Limited and Reverse-Triggered Ventilator Dyssynchrony Are Associated With Increased Tidal and Dynamic Transpulmonary Pressure [Internet] . Critical Care Medicine 2024 ; 52 : 743 – 751 [cited 2025 Feb 13 ] Available from: https://journals.lww.com/10.1097/CCM.0000000000006180 OpenUrl PubMed 17. Gilstrap D , Macintyre N : Patient-Ventilator Interactions. Implications for Clinical Management [Internet] . Am J Respir Crit Care Med 2013 ; 188 : 1058 – 1068 Available from: https://www.ncbi.nlm.nih.gov/pubmed/24070493 OpenUrl CrossRef PubMed 18. Docci M , Rodrigues A , Dubo S , et al : Does Patient-Ventilator Asynchrony Really Matter? [Internet] . Current Opinion in Critical Care 2025 ; 31 : 21 [cited 2025 Feb 24 ] Available from: https://journals.lww.com/co-criticalcare/abstract/2025/02000/does_patient_ventilator_asynchrony_really_matter_.5.aspx OpenUrl PubMed 19. Blanch L , Villagra A , Sales B , et al : Asynchronies During Mechanical Ventilation Are Associated with Mortality [Internet] . Intensive Care Med 2015 ; 41 : 633 – 641 Available from: https://link.springer.com/content/pdf/10.1007%2Fs00134-015-3692-6.pdf OpenUrl PubMed 20. Thille AW , Rodriguez P , Cabello B , et al : Patient-Ventilator Asynchrony during Assisted Mechanical Ventilation [Internet] . Intensive Care Med 2006 ; 32 : 1515 – 1522 Available from: https://link.springer.com/content/pdf/10.1007%2Fs00134-006-0301-8.pdf OpenUrl CrossRef PubMed Web of Science 21. ↵ De Wit M , Pedram S , Best AM , et al : Observational Study of Patient-Ventilator Asynchrony and Relationship to Sedation Level [Internet] . J Crit Care 2009 ; 24 : 74 – 80 Available from: https://www.ncbi.nlm.nih.gov/pubmed/19272542%20 http://www.jccjournal.org/article/S0883-9441(08)00193-7/pdf OpenUrl CrossRef PubMed 22. ↵ Wunsch H , Wagner J , Herlim M , et al : ICU Occupancy and Mechanical Ventilator Use in the United States [Internet] . Crit Care Med 2013 ; 41 : doi: 10.1097/CCM.0b013e318298a139 [cited 2023 Jan 25 ] Available from: https://www.ncbi.nlm.nih.gov/pmc/articles/PMC3840149/ OpenUrl CrossRef PubMed 23. ↵ Sousa MLEA , Magrans R , Hayashi FK , et al : Clusters of Double Triggering Impact Clinical Outcomes: Insights From the EPIdemiology of Patient-Ventilator aSYNChrony (EPISYNC) Cohort Study [Internet] . Critical Care Medicine 2021 ; 49 : 1460 – 1469 [cited 2023 Dec 19 ] Available from: https://journals.lww.com/10.1097/CCM.0000000000005029 OpenUrl PubMed 24. ↵ Sottile PD , Smith BJ , Moss M , et al : The Development, Optimization, and Validation of Four Different Machine Learning Algorithms to Identify Ventilator Dyssynchrony . medRxiv [Preprint] 2023 ; 25. Agrawal DK , Smith BJ , Sottile PD , et al : A Damaged-Informed Lung Ventilator Model for Ventilator Waveforms . Front Physiol 2021 ; 12 : 724046 OpenUrl PubMed 26. Agrawal DK , Smith BJ , Sottile PD , et al : Quantifiable Identification of Flow-Limited Ventilator Dyssynchrony with the Deformed Lung Ventilator Model . Comput Biol Med 2024 ; 173 : 108349 OpenUrl PubMed 27. Stroh JN , Smith BJ , Sottile PD , et al : Hypothesis-Driven Modeling of the Human Lung-Ventilator System: A Characterization Tool for Acute Respiratory Distress Syndrome Research . J Biomed Inform 2023 ; 137 : 104275 OpenUrl PubMed 28. Hripcsak G , Albers DJ , Perotte A : Exploiting Time in Electronic Health Record Correlations . J Am Med Inform Assoc 2011 ; i109 – 115 29. Albers DJ , Hripcsak G : Estimation of Time-Delayed Mutual Information and Bias for Irregularly and Sparsely Sampled Time-Series [Internet] . Chaos Solitons Fractals 2012 ; 45 : 853 – 860 [cited 2023 Dec 12 ] Available from: https://www.ncbi.nlm.nih.gov/pmc/articles/PMC3332129/ OpenUrl PubMed 30. Albers DJ , Hripcsak G : Using Time-Delayed Mutual Information to Discover and Interpret Temporal Correlation Structure in Complex Populations [Internet] . Chaos 2012 ; 22 : 13111 Available from: https://www.ncbi.nlm.nih.gov/pubmed/22462987%20 https://www.ncbi.nlm.nih.gov/pmc/articles/PMC3277606/pdf/CHAOEH-000022-013111_1.pdf OpenUrl 31. Levine ME , Albers DJ , Hripcsak G : Comparing Lagged Linear Correlation, Lagged Regression, Granger Causality, and Vector Autoregression for Uncovering Associations in EHR Data . AMIA Annu Symp Proc 2016 ; 2016 : 779 – 788 OpenUrl PubMed 32. Levine ME , Albers DJ , Hripcsak G : Methodological Variations in Lagged Regression for Detecting Physiologic Drug Effects in EHR Data . J Biomed Inform 2018 ; 86 : 149 – 159 OpenUrl PubMed 33. ↵ Peterson RA , Cavanaugh JE : Ranked Sparsity: A Cogent Regularization Framework for Selecting and Estimating Feature Interactions and Polynomials [Internet] . AStA Adv Stat Anal 2022 ; 106 : 427 – 454 [cited 2025 Feb 13 ] Available from: https://link.springer.com/10.1007/s10182-021-00431-7 OpenUrl 34. ↵ Hammond W : HL7–more than a communications standard . Advanced Health Telematics and Telemedicine 2003 ; 266 – 271 35. Stang PE , Ryan PB , Racoosin JA , et al : Advancing the science for active surveillance: rationale and design for the Observational Medical Outcomes Partnership . Annals of internal medicine 2010 ; 153 : 600 – 606 OpenUrl CrossRef PubMed Web of Science 36. ↵ Hripcsak G , Duke JD , Shah NH , et al : Observational Health Data Sciences and Informatics (OHDSI): opportunities for observational researchers . MEDINFO 2015: eHealth-enabled Health 2015 ; 574 – 578 37. ↵ Bates JHT : Lung Mechanics [Internet] . Cambridge : Cambridge University Press ; 2009 . Available from: http://ebooks.cambridge.org/ref/id/CBO9780511627156 38. ↵ Sottile PD , Kiser TH , Burnham EL , et al : An Observational Study of the Efficacy of Cisatracurium Compared with Vecuronium in Patients with or at Risk for Acute Respiratory Distress Syndrome . Am J Respir Crit Care Med 2018 ; 197 : 897 – 904 OpenUrl PubMed 39. Dunbar PJ , Peterson R , McGrath M , et al : Analgesia and sedation use during noninvasive ventilation for acute respiratory failure . Critical Care Medicine 2024 ; 52 : 1043 – 1053 OpenUrl CrossRef PubMed 40. ↵ Dunbar PJ , Peterson RA , McGrath M , et al : Sedation practices during continuous neuromuscular blockade for acute respiratory distress syndrome . Annals of the American Thoracic Society 2025 ; 41. ↵ Ranieri VM , Rubenfeld GD , Thompson BT , et al : Acute Respiratory Distress Syndrome: The Berlin Definition . JAMA 2012 ; 307 : 2526 – 2533 OpenUrl CrossRef PubMed Web of Science 42. Bellani G , Laffey JG , Pham T , et al : Epidemiology, Patterns of Care, and Mortality for Patients with Acute Respiratory Distress Syndrome in Intensive Care Units in 50 Countries [Internet] . JAMA 2016 ; 315 : 788 – 800 Available from: https://www.ncbi.nlm.nih.gov/pubmed/26903337%20 http://jama.jamanetwork.com/data/journals/jama/935012/joi160008.pdf OpenUrl CrossRef PubMed 43. Brown SM , Grissom CK , Moss M , et al : Nonlinear Imputation of Pao2/Fio2 From Spo2/Fio2 Among Patients With Acute Respiratory Distress Syndrome . Chest 2016 ; 150 : 307 – 313 OpenUrl CrossRef PubMed 44. Chen W , Janz DR , Shaver CM , et al : Clinical Characteristics and Outcomes Are Similar in ARDS Diagnosed by Oxygen Saturation/Fio2 Ratio Compared With Pao2/Fio2 Ratio . Chest 2015 ; 148 : 1477 – 1483 OpenUrl CrossRef PubMed 45. ↵ Rice TW , Wheeler AP , Bernard GR , et al : Comparison of the SpO2/FIO2 Ratio and the PaO2/FIO2 Ratio in Patients with Acute Lung Injury or ARDS . Chest 2007 ; 132 : 410 – 417 OpenUrl CrossRef PubMed Web of Science View the discussion thread. Back to top Previous Next Posted October 30, 2025. Download PDF Supplementary Material Data/Code Email Thank you for your interest in spreading the word about medRxiv. NOTE: Your email address is requested solely to identify you as the sender of this article. Your Email * Your Name * Send To * Enter multiple addresses on separate lines or separate them with commas. You are going to email the following Developing A Data Pipeline to Quantify Ventilator Waveforms Message Subject (Your Name) has forwarded a page to you from medRxiv Message Body (Your Name) thought you would like to see this page from the medRxiv website. Your Personal Message CAPTCHA This question is for testing whether or not you are a human visitor and to prevent automated spam submissions. Share Developing A Data Pipeline to Quantify Ventilator Waveforms Peter D Sottile , Lenny Larchick , J.N. Stroh , David Albers , Bradford Smith medRxiv 2025.10.28.25339000; doi: https://doi.org/10.1101/2025.10.28.25339000 Share This Article: Copy Citation Tools Developing A Data Pipeline to Quantify Ventilator Waveforms Peter D Sottile , Lenny Larchick , J.N. Stroh , David Albers , Bradford Smith medRxiv 2025.10.28.25339000; doi: https://doi.org/10.1101/2025.10.28.25339000 Citation Manager Formats BibTeX Bookends EasyBib EndNote (tagged) EndNote 8 (xml) Medlars Mendeley Papers RefWorks Tagged Ref Manager RIS Zotero Tweet Widget Facebook Like Google Plus One Subject Area Respiratory Medicine Subject Areas All Articles Addiction Medicine (568) Allergy and Immunology (863) Anesthesia (297) Cardiovascular Medicine (4421) Dentistry and Oral Medicine (443) Dermatology (381) Emergency Medicine (606) Endocrinology (including Diabetes Mellitus and Metabolic Disease) (1507) Epidemiology (15212) Forensic Medicine (30) Gastroenterology (1121) Genetic and Genomic Medicine (6581) Geriatric Medicine (667) Health Economics (996) Health Informatics (4520) Health Policy (1366) Health Systems and Quality Improvement (1611) Hematology (539) HIV/AIDS (1264) Infectious Diseases (except HIV/AIDS) (15906) Intensive Care and Critical Care Medicine (1103) Medical Education (620) Medical Ethics (144) Nephrology (667) Neurology (6580) Nursing (345) Nutrition (998) Obstetrics and Gynecology (1141) Occupational and Environmental Health (956) Oncology (3324) Ophthalmology (970) Orthopedics (369) Otolaryngology (420) Pain Medicine (435) Palliative Medicine (129) Pathology (663) Pediatrics (1689) Pharmacology and Therapeutics (691) Primary Care Research (710) Psychiatry and Clinical Psychology (5431) Public and Global Health (9212) Radiology and Imaging (2193) Rehabilitation Medicine and Physical Therapy (1368) Respiratory Medicine (1194) Rheumatology (593) Sexual and Reproductive Health (709) Sports Medicine (529) Surgery (709) Toxicology (99) Transplantation (288) Urology (265) (function(){function c(){var b=a.contentDocument||a.contentWindow.document;if(b){var d=b.createElement('script');d.innerHTML="window.__CF$cv$params={r:'9ff0da8eabb209d6',t:'MTc3OTMzNzkwOQ=='};var a=document.createElement('script');a.src='/cdn-cgi/challenge-platform/scripts/jsd/main.js';document.getElementsByTagName('head')[0].appendChild(a);";b.getElementsByTagName('head')[0].appendChild(d)}}if(document.body){var a=document.createElement('iframe');a.height=1;a.width=1;a.style.position='absolute';a.style.top=0;a.style.left=0;a.style.border='none';a.style.visibility='hidden';document.body.appendChild(a);if('loading'!==document.readyState)c();else if(window.addEventListener)document.addEventListener('DOMContentLoaded',c);else{var e=document.onreadystatechange||function(){};document.onreadystatechange=function(b){e(b);'loading'!==document.readyState&&(document.onreadystatechange=e,c())}}}})();

Text is read by the "Ask this paper" AI Q&A widget below. Extraction quality varies by source — PMC NXML preserves structure cleanly, OA-HTML may include some navigation residue, and OA-PDF can have broken hyphenation. The publisher copy (via DOI) is the canonical version.

My notes (saved in your browser only)

Ask this paper AI returns verbatim quotes from the full text · source: preprint-html

Answers must be backed by verbatim quotes from this paper's full text. Hallucinated quotes are dropped automatically; if no verbatim passage answers the question, we say so. How this works

Citation neighborhood (no data yet)

We don't have any in-corpus citations linked to this paper yet. This is a recent paper (2025) — citers typically take a year or two to land, and the OpenAlex reference graph may still be filling in.

Source provenance

europepmc
last seen: 2026-05-20T01:45:00.602351+00:00