Model-Based Assessment of Photoplethysmogram Signal Quality in Real-Life Environments

doi:10.1101/2024.06.07.24308621

Model-Based Assessment of Photoplethysmogram Signal Quality in Real-Life Environments

2024 · doi:10.1101/2024.06.07.24308621

preprint OA: closed

📄 Open PDF Full text JSON View at publisher

Full text 44,162 characters · extracted from preprint-html · click to expand

Model-Based Assessment of Photoplethysmogram Signal Quality in Real-Life Environments | medRxiv /* */ /* */ <!-- <!-- /*! * yepnope1.5.4 * (c) WTFPL, GPLv2 */ (function(a,b,c){function d(a){return"[object Function]"==o.call(a)}function e(a){return"string"==typeof a}function f(){}function g(a){return!a||"loaded"==a||"complete"==a||"uninitialized"==a}function h(){var a=p.shift();q=1,a?a.t?m(function(){("c"==a.t?B.injectCss:B.injectJs)(a.s,0,a.a,a.x,a.e,1)},0):(a(),h()):q=0}function i(a,c,d,e,f,i,j){function k(b){if(!o&&g(l.readyState)&&(u.r=o=1,!q&&h(),l.onload=l.onreadystatechange=null,b)){"img"!=a&&m(function(){t.removeChild(l)},50);for(var d in y[c])y[c].hasOwnProperty(d)&&y[c][d].onload()}}var j=j||B.errorTimeout,l=b.createElement(a),o=0,r=0,u={t:d,s:c,e:f,a:i,x:j};1===y[c]&&(r=1,y[c]=[]),"object"==a?l.data=c:(l.src=c,l.type=a),l.width=l.height="0",l.onerror=l.onload=l.onreadystatechange=function(){k.call(this,r)},p.splice(e,0,u),"img"!=a&&(r||2===y[c]?(t.insertBefore(l,s?null:n),m(k,j)):y[c].push(l))}function j(a,b,c,d,f){return q=0,b=b||"j",e(a)?i("c"==b?v:u,a,b,this.i++,c,d,f):(p.splice(this.i++,0,a),1==p.length&&h()),this}function k(){var a=B;return a.loader={load:j,i:0},a}var l=b.documentElement,m=a.setTimeout,n=b.getElementsByTagName("script")[0],o={}.toString,p=[],q=0,r="MozAppearance"in l.style,s=r&&!!b.createRange().compareNode,t=s?l:n.parentNode,l=a.opera&&"[object Opera]"==o.call(a.opera),l=!!b.attachEvent&&!l,u=r?"object":l?"script":"img",v=l?"script":u,w=Array.isArray||function(a){return"[object Array]"==o.call(a)},x=[],y={},z={timeout:function(a,b){return b.length&&(a.timeout=b[0]),a}},A,B;B=function(a){function b(a){var a=a.split("!"),b=x.length,c=a.pop(),d=a.length,c={url:c,origUrl:c,prefixes:a},e,f,g;for(f=0;f<d;f++)g=a[f].split("="),(e=z[g.shift()])&&(c=e(c,g));for(f=0;f<b;f++)c=x[f](c);return c}function g(a,e,f,g,h){var 
i=b(a),j=i.autoCallback;i.url.split(".").pop().split("?").shift(),i.bypass||(e&&(e=d(e)?e:e[a]||e[g]||e[a.split("/").pop().split("?")[0]]),i.instead?i.instead(a,e,f,g,h):(y[i.url]?i.noexec=!0:y[i.url]=1,f.load(i.url,i.forceCSS||!i.forceJS&&"css"==i.url.split(".").pop().split("?").shift()?"c":c,i.noexec,i.attrs,i.timeout),(d(e)||d(j))&&f.load(function(){k(),e&&e(i.origUrl,h,g),j&&j(i.origUrl,h,g),y[i.url]=2})))}function h(a,b){function c(a,c){if(a){if(e(a))c||(j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}),g(a,j,b,0,h);else if(Object(a)===a)for(n in m=function(){var b=0,c;for(c in a)a.hasOwnProperty(c)&&b++;return b}(),a)a.hasOwnProperty(n)&&(!c&&!--m&&(d(j)?j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}:j[n]=function(a){return function(){var b=[].slice.call(arguments);a&&a.apply(this,b),l()}}(k[n])),g(a[n],j,b,n,h))}else!c&&l()}var h=!!a.test,i=a.load||a.both,j=a.callback||f,k=j,l=a.complete||f,m,n;c(h?a.yep:a.nope,!!i),i&&c(i)}var i,j,l=this.yepnope.loader;if(e(a))g(a,0,l,0);else if(w(a))for(i=0;i (function(w,d,s,l,i){w[l]=w[l]||[];w[l].push({'gtm.start':new Date().getTime(),event:'gtm.js'});var f=d.getElementsByTagName(s)[0];var j=d.createElement(s);var dl=l!='dataLayer'?'&l='+l:'';j.src='//www.googletagmanager.com/gtm.js?id='+i+dl;j.type='text/javascript';j.async=true;f.parentNode.insertBefore(j,f);})(window,document,'script','dataLayer','GTM-P4HH5NV'); Skip to main content Home About Submit ALERTS / RSS Search for this keyword Advanced Search Model-Based Assessment of Photoplethysmogram Signal Quality in Real-Life Environments Yan-Wei Su , Chia-Cheng Hao , Gi-Ren Liu , Yuan-Chung Sheu , View ORCID Profile Hau-Tieng Wu doi: https://doi.org/10.1101/2024.06.07.24308621 Yan-Wei Su 1 Department of Applied Mathematics, National Yang Ming Chiao Tung University , Hsinchu, Taiwan Find this author on Google Scholar Find this author on PubMed Search for this author on this site Chia-Cheng Hao 2 Data Science Degree Program, National 
Taiwan University and Academia Sinica , Taipei, Taiwan Find this author on Google Scholar Find this author on PubMed Search for this author on this site Gi-Ren Liu 3 Department of Mathematics, National Cheng-Kung University , Tainan, Taiwan 4 National Center for Theoretical Sciences, National Taiwan University , Taipei, Taiwan Find this author on Google Scholar Find this author on PubMed Search for this author on this site Yuan-Chung Sheu 1 Department of Applied Mathematics, National Yang Ming Chiao Tung University , Hsinchu, Taiwan Find this author on Google Scholar Find this author on PubMed Search for this author on this site Hau-Tieng Wu 5 Courant Institute of Mathematical Sciences, New York University , New York, NY, 10012 USA Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Hau-Tieng Wu For correspondence: hauwu{at}cims.nyu.edu Abstract Full Text Info/History Metrics Data/Code Preview PDF A bstract Assessing signal quality is crucial for photoplethysmogram analysis, yet a precise mathematical model for defining signal quality is often lacking, posing challenges in the quantitative analysis. To tackle this problem, we propose a Signal Quality Index (SQI) based on the adaptive non-harmonic model (ANHM) and a Signal Quality Assessment (SQA) model, which is trained using the boosting learning algorithm. The effectiveness of the proposed SQA model is tested on publicly available databases with experts’ annotations. Result: The DaLiA database [ 20 ] is used to train the SQA model, which achieves favorable accuracy and macro-F1 scores in other public databases (accuracy 0.83, 0.76 and 0.87 and macro-F1 0.81, 0.75 and 0.87 for DaLiA-testing dataset, TROIKA dataset [ 31 ], and WESAD dataset [ 23 ], respectively). This preliminary result shows that the ANHM model and the model-based SQI have potential for establishing an interpretable SQA system. 1. 
Introduction Photoplethysmogram (PPG) is widely utilized in clinical and consumer devices for its non-invasive and cost-effective nature [ 1 ]. Initially employed to measure blood oxygen saturation and monitor resting heart rate (HR), the PPG signal also holds rich information on the cardiovascular, respiratory, autonomic nervous systems, or even blood pressure, which has not been routinely exploited but has started to gain attention in the digital health era. However, like other biomedical signals, PPG information’s accuracy relies on signal quality, which is high at rest but usually diminishes with movement [ 2 , 10 ]. Therefore, a robust signal quality assessment method is crucial to identify noise-corrupted segments, ensuring reliable measurements of parameters like heart rate and oxygen saturation from high-quality signal segments [ 19 ]. Various methods exist for assessing the quality of a PPG signal [ 15 ] under different criteria, such as the presence of clear pulse peaks [ 19 , 8 ] for HR extraction or clean pulse waveforms, cardiac component, or visible systolic and diastolic waves [ 16 ] for diagnosis demands. Additional considerations include pulse amplitude and width consistency with adjacent pulses and adherence to typical PPG pulse morphology [ 28 ]. Alternatively, simultaneous recording of other signals, as demonstrated in [ 17 ], can be employed to define quality. To automatically quantify PPG quality, signal processing techniques are needed. This can be achieved through time-domain, frequency-domain, or hybrid approaches, guided by predefined rules or machine learning techniques. See [ 19 ] for a review. To our knowledge, experts seem to rely on the visibility of the cardiac component to label the quality of a PPG segment. 
Despite implicitly consented PPG signal quality criteria among experts and numerous proposed PPG signal quality assessments (SQA), there is, to our knowledge, no precise definition of PPG signal quality with a mathematical model, particularly in a free-living environment. We model the PPG signal by the adaptive non-harmonic model (ANHM), which incorporates respiration-induced intensity variation (RIIV) [ 25 ] and motion rhythm (non-sinusoidal when it exists), and apply time-frequency (TF) analysis to recover harmonics of the cardiac component. Based on these, we introduce our model-based signal quality index (SQI) to evaluate the quality of cardiac component residing in a PPG signal and an interpretable learning based SQA model based on the proposed and existing signal quality indices. We apply the SQA model to publicly available databases with expert annotations, showcasing its applicability. 2. Mathematical model and signal decomposition It is well known that a PPG signal is composed of possibly multiple components, including a cardiac component, a respiratory component [ 25 ], and a motion rhythm when a subject is exercising. The oscillatory morphology of the cardiac component changes from cycle to cycle, encoding the underlying physiological status [ 7 ], and the similar observation might hold for other components. Also, noise is inevitable. Jointly, we consider the adaptive non-harmonic model (ANHM) [ 13 ] to model the PPG signal. Fix small constants ϵ,ϵ ′ > 0 and Δ > 0. We model a clean PPG signal by the ANHM [ 13 ]: $$f(t) = \sum_{\ell=1}^{L} f_{\ell}(t) + T(t), \qquad (1)$$ where $f_{\ell}(t) = \sum_{j=1}^{D_{\ell}} b_{\ell,j}(t)\cos(2\pi\phi_{\ell,j}(t))$ is called the intrinsic model type (IMT) function, ϕ 𝓁 ,1 and $\phi'_{\ell,1}$ are called the phase and the instantaneous frequency (IF) of the 𝓁 -th IMT function, b 𝓁,j ( t ) > 0 is the amplitude modulation (AM), and T ( · ) is a smooth function so that its Fourier transform is compactly supported in [−Δ, Δ]. For each 𝓁 ∈ {1, …, L }, we assume the following additionally: (C1) ϕ 𝓁,j ∈ C 2 (ℝ) for j = 1, …, D 𝓁 . 
When for all t ∈ ℝ; when and for all t ∈ ℝ. (C2) b 𝓁,j ∈ C 1 (ℝ) for j = 1, …, D 𝓁 . When j ≥ 2, b 𝓁,j ( t ) ≤ c 𝓁,j b 𝓁 ,1 ( t ) and for all t ∈ ℝ, where c 𝓁 ,1 > 0, c 𝓁,j ≥ 0 and (C3) When L > 1, for any t ∈ ℝ, for 𝓁 = 2, …, L , and for any 𝓁 < 𝓁 𝓁 . When ϵ ′ = 0 and b 𝓁,j ( t ) = c 𝓁,j b 𝓁 ,1 ( t ) for all j ≥ 2, the ANHM can be expressed as a function with fixed wave-shape functions (WSF); that is, where s 𝓁 is a 1-periodic function [ 13 ]. For each 𝓁 ∈ {1, …, L }, D 𝓁 ∈ ℕ is called the harmonic order for the 𝓁 -th IMT function. When D 𝓁 = 1, the 𝓁 -th IMT function oscillates with a sinusoidal WSF. Note that in general it is possible that for 𝓁 ≠ 𝓁 ′ and some j, k ∈ ℕ. We call b 𝓁 ,1 ( t ) cos(2 πϕ 𝓁 ,1 ( t )) the fundamental component of the 𝓁 -th IMT function, and for j > 1, we call b 𝓁,j ( t ) cos(2 πϕ 𝓁,j ( t )) the j-th harmonic of the 𝓁 -th IMT function. We refer readers to [ 13 ] for more detailed discussion of the model and these conditions. When L = 1, the only IMT function is the cardiac component, which usually can be well modeled by D 1 = 6. When respiration and/or walking patterns exist, L > 1, and their harmonic orders are lower, like 3. In a PPG example shown in Figure 5 , it is difficult to visualize the cardiac oscillation in the raw signal, even if it exists and is of high quality after decomposition. In practice, we can remove the trend component T by applying a high-pass filter, so from now on we assume T = 0. With the ANHM model, we consider the time-frequency (TF) analysis approach to decompose the signal, due to the time-varying frequency and amplitude nature of PPG signals. This approach has been applied to solve several signal processing problems, such as the extraction of the phase and the amplitude information, signal decomposition into essential components (IMT functions and their harmonics), denoising, and dynamic feature extraction. 
While there are several choices, we consider the short-time Fourier transform (STFT) based synchrosqueezing transform (SST) [ 5 , 18 ]. SST generates a TF representation (TFR) of the PPG signal. It has been theoretically established that when a signal adheres to the ANHM with sinusoidal WSFs, the ridges of STFT closely approximate the IFs of all IMT functions [ 6 ], and SST utilizes the phase information of STFT to sharpen the TFR and hence the performance of ridge detection (RD) is enhanced [ 14 ]. When we decompose a signal, we assume the knowledge of L . In general, estimating L is still a challenging problem, but estimating D 𝓁 could be achieved by the trigonometric regression [ 22 ]. Under the ANHM, by the RD and reconstruction formula for SST [ 5 ], we could robustly and accurately estimate the complex-valued harmonics $b_{1,j}(t)e^{i2\pi\phi_{1,j}(t)}$ for $j = 1, \ldots, D_1$ [ 3 ], and the first IMT function can be reconstructed via taking the real part of the superposition of these estimated harmonic components. By subtracting the first IMT function from the PPG signal, we proceed with reconstructing the second IMT function by the same approach. By iteration, we obtain a decomposition of all IMT functions. The overall flowchart of ridge detection and harmonic decomposition algorithm, shape-adaptive mode decomposition (SAMD), is shown in Figure 1 . Download figure Open in new tab Figure 1. The overall flowchart of ridge detection and harmonic decomposition algorithm. (a) A segment of PPG signal that contains a cardiac component and a respiratory component. (b) The time-frequency representation of (a) determined by the second-order SST. (c) The detected ridges are superimposed as red-dashed curves on the TFR shown in (b). (d) The reconstructed harmonics of the cardiac component, which are related to the detected ridges shown in (c). (e) The reconstructed cardiac component, which comes from the superposition of reconstructed harmonics shown in (d). 
(f) The reconstructed fundamental component of the respiratory component that is related to the ridge shown as the blue-dashed curve in (c). (g) The superposition of (e) and (f). 3. Signal quality indices for a PPG signal To our understanding, “signal quality” is a broad term typically described and quantified by implicitly equating it with the visibility of the cardiac component, sometimes considering conditions like systolic or diastolic phase behavior as indicators of high quality. Let us now quantify this traditional idea. To quantify this idea precisely, we model a PPG signal by (1), assume 𝓁 = 1 is the cardiac component, and define the SQI by where n ( t ) is the inevitable noise, and In other words, we view non-cardiac components as “noise”. Clearly, when the cardiac component as the signal is strong and the noise is weak, is large and SQI M ( t ) is close to 1. Otherwise it is close to 0. In the ideal situation when L = 1, ñ ( t ) = n ( t ) and which is the relationship between the cardiac component and the noise. In practice, the PPG signal is uniformly sampled at a fixed sampling rate, f s Hz, and saved as a vector x ∈ ℝ N ; that is, $x[i] = f(i/f_s) + n_i$ for 1 ≤ i ≤ N , where n i is a mean zero noise with finite variance. Clearly, each component of f is also uniformly sampled as an ℝ N vector. For example, the cardiac component is given by $f_1[i] = \sum_{k=1}^{D_1} b_{1,k}[i]\cos(2\pi\phi_{1,k}[i])$, where 1 ≤ i ≤ N , and b 1, k , ϕ 1, k ∈ ℝ N are uniformly sampled from b 1, k ( t ) and ϕ 1, k ( t ). Numerically, the estimation of b 1, k , ϕ 1, k and noise n from the PPG signal is achieved by the reconstruction formula for SST [ 5 ]. Then, compute SQI M every d/f s s, where d ∈ ℕ is chosen by the user; that is, where The Matlab implementation of SQI M can be found in https://github.com/yanweiSu/PPG-SQIm . 
We also compare SQI M with existing SQIs, including the skewness (SQI S ) [ 12 , 8 ] computed for each 4 s PPG segment, the entropy ( SQI E ) [ 24 , 8 ] for each 4 s PPG, and harmonic integrity index of order n ∈ ℕ, H n , motivated by studying the strength dynamics of various harmonics of ambulatory blood pressure signal (ABP) [ 30 , 4 ]. Let f 1, k ∈ ℝ N be the k -th harmonics component of the cardiac component, H of the j -th sample is defined as The perfusion index [ 8 ] is not considered since the databases we use have gone through a high pass filter. 3.1. Implementation details Each PPG segment is 30 s in this paper. With f s = 64 Hz, we used a 6th-order Butterworth bandpass filter with cutoff frequencies at 20 Hz and 0.5 Hz. Denote the pre-processed PPG segment as . We used the second-order STFT- based synchrosqueezed transformation (SST) [ 18 ] with the window function , which leads to a N -by- M complex-valued matrix S ∈ ℂ N×M as the discretized TFR, where N = 30 f s , , and Δ ξ = 0.02 Hz. Then apply the multiple harmonics RD (MHRD) [ 26 ] on S with two ridges and parameters ( λ 1 , λ 2 ) = (1, 1) and ( µ 1 , µ 2 ) = (0, 0.07) to obtain IFs of the first two harmonics, followed by the single curve RD [ 26 ] with λ = 1 to obtain IFs of remaining higher harmonics, where we apply the masking technique; that is, at time i/f s , the band ranging from Hz to Hz is masked. Finally, set Δ = 0.2 to reconstruct b 1, k ( t ) cos(2 πϕ 1, k ( t )), where k = 1, …, 5, denoted as f 1, k ∈ ℂ N , which leads to b 1, k , ϕ 1, k ∈ ℝ N , where b 1, k [ i ] = | f 1, k [ i ]| and ϕ 1, k comes from phase unwrapping f 1, k . 3.2. Train an interpretable signal quality assessment model For each 30 s PPG segment, the label sequence is a {0, 1}-valued sequence, , where 1 indicates “with artifact” (low quality) and 0 indicates “no-artifact” (high quality). To avoid the boundary effect, the first and last 5 seconds are discarded. 
This is not a serious problem since in practice the PPG signal is usually much longer than 30 seconds. To speed up, downsample y to 2Hz by the voting process over each 0.5s. The features defined by different SQIs are converted correspondingly by taking the median over each 0.5s. With SQIs and labels from all 30-second segments in the training dataset, we apply an interpretable learner, Light Gradient Boosting Machine (LightGBM) [ 11 ], to train an SQA model, with the learning rate of 0.1, the max number of leaves of each tree 7, the max number of bins for the feature values 255, and the cross-entropy as the loss function. 4. Materials and statistics 4.1. Dataset We employed the publicly available dataset from [ 9 ] for validating the proposed SQA model. There are 7,306 segments with quality annotations in total. The labels are binary (1 for “artifact” or “low quality”, and 0 for “clean”, “no artifact” or “high quality”) and are assigned to each sample point in the segment. These segments are derived from three public datasets: DaLiA [ 20 ], TROIKA [ 31 ], and WESAD [ 23 ]. Details of data preparation and labeling can be found in [ 9 ]. 4.2. More details about the public databases The employed publicly available datasets with experts’ labels [ 9 ] can be downloaded from https://github.com/chengstark/Segade/tree/main/data . There are 7,306 30-second PPG recordings in total, each accompanied by quality annotations. The labels assign binary values (1 for “artifact” or “low quality”, and 0 for “clean”, “no artifact” or “high quality”) to each sample point in the segment. These segments are derived from processing PPG signals from three public datasets: DaLiA [ 20 ], TROIKA [ 31 ], and WESAD [ 23 ], and the set that comes from DaLiA is split further into one training set, called the DaLiA-training (DTrain) set, and one testing set, called the DaLiA-testing (DTest) set. 
All 30-second PPG segments are uniformly sampled at the sampling rate 64 Hz, and the signal values are normalized to the range [0, 1]. A second-order Butterworth filter with a low end cutoff of 0.9 Hz and a high end cutoff of 5 Hz was applied to the segments of both DaLiA and WESAD dataset 1 by the authors in [ 9 ]. The TROIKA dataset was pre-processed by its original author in [ 31 ] with bandpass from 0.4 Hz to 5 Hz. 2 To be consistent, we pre-process the databases used in [ 9 ] by applying a 6th-order Butterworth filter with a low end cutoff of 0.5 Hz and a high end cutoff of 20 Hz. In the TROIKA dataset, both the PPG signal and triaxial acceleration signal were recorded from the wrist. Subjects performed treadmill running with changing speeds during data collection. For datasets labeled as TYPE01 , running speeds changed as follows: rest (30 s) → 8 km/hr (1 minute) → 15 km/hr (1 minute) → 8 km/hr (1 minute) → 15 km/hr (1 minute) → rest (30 s). For datasets labeled as TYPE02 , illustrated in Figure 1 in the main article, running speeds changed as follows: rest (30 s) → 6 km/hr (1 minute) → 12 km/hr (1 minute) → 6 km/hr (1 minute) → 12 km/hr (1 minute) → rest (30 s) [ 31 ]. In the DaLiA dataset, subjects performed 8 activity statuses plus one transient status: sitting, ascending and descending stairs, table soccer, cycling, car driving, lunch break, walking, and working, marked by IDs 1 to 8, respectively. The transient state, representing transitions between statuses, is marked by ID 0. Both the PPG signal used for analysis and the accelerometer signal plotted in Figure 1 in the main article were recorded from the wrist-worn device. Both TROIKA and DaLiA datasets provide ECG signals and the detected R peaks as ground truth for HR estimation. 
The WESAD dataset was recorded from both wrist- and chest-worn devices, from 15 subjects (age ranging from 21 to 55 years old, median 28 years old) during a lab study under different emotional states, including neutral, stress, and amusement. Subjects were allowed to move freely while performing tasks. The signals include ECG signals, tri-axis accelerometer signal, electrodermal activities record and PPG signals. The PPG signals in WESAD dataset are recorded from the wrist at the sampling rate 64 Hz [ 23 ]. The label generation procedure used in [ 9 ] is summarized here for readers’ convenience. Binary labels were created based on annotators’ observations of the three-axis acceleration signal, examining the correlation between ECG heartbeats and PPG heartbeats, and assessing the regularity of the PPG signals to identify artifacts. Two scenarios were considered for artifact annotations: (1) If the accelerometer shows motion and irregularities in the PPG signal align with the accelerometer data, the segment is marked as an artifact. (2) If the accelerometer shows no obvious motion, ECG displays a normal sinus rhythm, but irregularities are observed in the PPG signal, the segment is marked as an artifact. Each signal was annotated by at least one annotator. In the initial annotation trial phase, fifty 30-second segments were randomly selected and independently annotated by three annotators. Annotations from each pair of annotators were compared and analyzed, and the group of annotators collectively made decisions on correct annotations, improving agreement. The remaining data were annotated by a single annotator thereafter. 4.3. Learning process We followed the procedure outlined in [ 9 ] to construct the training and testing sets. Specifically, 3436 segments from 12 subjects (ID 2 to ID 13) in the DaLiA dataset constitute the DaLiA-training (DTrain) set; 869 segments from the remaining subjects in the DaLiA dataset form the DaLiA-testing (DTest) set. 
Additional testing sets include 2888 segments from the WESAD dataset and 113 segments from the TROIKA dataset. We allocate DaLiA-training for training and reserve DaLiA-testing, TROIKA, and WESAD for testing. 4.4. Statistical analysis We first run a 10-fold cross-validation on the DTrain set following the 10-fold splitting in [ 9 ]. Then, train the SQA model on the entire DTrain set, and test on DTest, TROIKA and WESAD datasets separately. By viewing label 1 as the positive class, and 0 as the negative class, we report accuracy, sensitivity, precision, macro-F1 score, and the DICE score, which is defined as 2TP / (TP + FP + FN), where TP, FP and FN are true positive, false positive and false negative, respectively. 5. R esult In DTrain (DTest, TROIKA and WESAD respectively), the overall length of the PPG signal is 103,080 s (26,070 s, 3,390 s and 86,640 s respectively) and the overall length of artifact is 60,478.48 s (13,298.47 s, 1,784.58 s and 43,020.41 s respectively). Among all recordings, the ratio of labeled artifact in each recording is 0.59 ± 0.34 (0.51 ± 0.31, 0.53 ± 0.34 and 0.50 ± 0.39 respectively). 5.1. Basic statistics for signal quality indices The mean and standard deviation of different SQIs are reported in Table 1 . Overall, SQI M and SQI S are higher when the signal quality is high, which fits our expectation. H 1 and H 6 have opposite behavior, which can be explained by the fact that the higher order harmonic in PPG is weaker, and hence easily perturbed and “enhanced” by the high frequency component of artifacts. View this table: View inline View popup Download powerpoint Table 1. The mean and standard deviation of different SQIs. 5.2. Performance of each SQI The Wilcoxon rank sum test on each testing dataset shows that all SQIs are significantly different ( p < 10 −10 ) on the artifact and the non-artifact groups. 
In DTrain (DTest, TROIKA and WESAD respectively), the Pearson correlation coefficients between SQI M and H 1 , H 6 , SQI S and SQI E are 0.64, 0.07, 0.36 and −0.04 (0.59, 0.13, 0.40 and −0.09, 0.27, 0.24, 0.04 and 0.23, and 0.72, −0.04, 0.43 and −0.14 respectively) respectively. Except for TROIKA, the correlation coefficient between SQI M and H 1 is usually higher than 0.5. The area under the receiver operating characteristic curve (AUROC) and optimal threshold for the binary classification are reported in Table 2 . Overall, except for TROIKA, the AUROC of SQI M is the highest, and those of H 1 and SQI S are also high. Signals in TROIKA were recorded during running and were expected to be more challenging. Since SQI M has the highest AUROC in general, we evaluate its ability as a single index to classify the signal quality. First, we learn the optimal threshold of SQI M from the AUROC from DTrain using the experts’ labels. Then apply this threshold to the testing databases. Overall, the accuracy, macro-F1 and DICE are 0.78, 0.77 and 0.80 (0.64, 0.61 and 0.72, 0.85, 0.85 and 0.85, respectively) for DTest (TROIKA and WESAD, respectively). View this table: View inline View popup Download powerpoint Table 2. AUROC and the best thresholds of each feature for each testing datasets. The negative sign preceding an index emerges when the AUROC with the original index is below 0.5, prompting us to invert the sign of the index and report the resulting AUROC. View this table: View inline View popup Download powerpoint Table 3. The confusion matrices and the performance metrics of the trained SQA model on different testing sets. NPV: negative predictive value; SEN: sensitivity; SPE: specificity; PRE: precision; mF1: macro-F1. 5.3. Performance of the SQA model The proposed SQA model achieves accuracy 0.86 ± 0.01 and macro-F1 score 0.85 ± 0.01 on DTrain under the 10-folds cross-validation scheme. 
When the trained model is tested on DTest (TROIKA and WESAD respectively), it achieves accuracy 0.83 (0.76 and 0.87 respectively), macro-F1 score 0.82 (0.75 and 0.87 respectively). See Table 6 for details. Note that DICE does not outperform the neural network based algorithm proposed in [ 9 ], which achieves 0.87, 0.81 and 0.91 in DTest, TROIKA and WESAD respectively, and we will come back to this in Discussion. 5.4. More analysis results The histogram and receiver operating characteristic curve (ROC) of various SQIs over different databases are shown in Figures 2 , 3 and 4 . Download figure Open in new tab Figure 2. Histograms and AUROC curves of different SQIs on the DaLiA-testing dataset. Download figure Open in new tab Figure 3. Histograms and AUROC curves of different SQIs on the TROIKA dataset. Download figure Open in new tab Figure 4. Histograms and AUROC curves of different SQIs on the WESAD dataset. Download figure Open in new tab Figure 5. Two PPG signals recorded from two subjects’ wrists while they were running. Top row: the raw PPG signal that has been bandpass filtered with the 0.4 − 5Hz band. Middle row: the cardiac component decomposed from the raw PPG signal is shown as the black curve, and the simultaneously recorded ECG signal and the detected R-peaks are shown as the red curve and the grey lines, respectively. Bottom row: the motion rhythm decomposed from the raw PPG signal is shown as the black curve, and the magnitude of the simultaneously recorded accelerometer signal is shown as the red curve. Among various SQIs, since SQI M has the highest AUROC in general, we evaluate its ability as a single index to classify the signal quality in different databases. First, we learn the optimal threshold of SQI M from the AUROC curve from DTrain using the experts’ labels. We then apply this threshold to DTest, TROIKA and WESAD. The result is shown in Table 4 . 
Overall, accuracy and macro-F1 are 0.78 and 0.77 (0.64 and 0.61, 0.85 and 0.85, respectively) for DTest (TROIKA and WESAD, respectively). View this table: View inline View popup Download powerpoint Table 4. Performance evaluation of SQI M . We apply the threshold determined by DaLiA-training set on the other three testing datasets, and report the confusion matrices and standard metrics. NPV: negative predictive value; SEN: sensitivity; SPE: specificity; PRE: precision; mF1: macro- F1. The proposed SQA model achieves accuracy 0.86 ± 0.01 and macro-F1 score 0.85 ± 0.01 on DTrain under the 10-folds cross-validation scheme, which is shown in Table 5 . We follow the 10-fold splitting proposed in [ 9 ]. View this table: View inline View popup Download powerpoint Table 5. The 10-folds cross-validation of the proposed SQA model on DaLiA-training set. The total sum of 10 confusion matrices is shown above. NPV: negative predictive value; SEN: sensitivity; SPE: specificity; PRE: precision; mF1: macro-F1. View this table: View inline View popup Download powerpoint Table 6. Sum of the confusion matrices and the performance metrics of testing the SQA models on each testing sets. The SQA model is trained from the DaLiA-training database. NPV: negative predictive value; SEN: sensitivity; SPE: specificity; PRE: precision; mF1: macro-F1. When the trained model is tested on DTest (TROIKA and WESAD respectively), it achieves accuracy 0.83 (0.76 and 0.87 respectively) and macro-F1 score 0.82 (0.75 and 0.87 respectively). See Table 6 for details. Finally, we compare the performance of the proposed signal quality indices with the Segade model proposed in [ 9 ]. The DICE scores of the proposed SQA model, SQI M , and Segade are reported in Table 7 , where the DICE score is defined as 2TP / (TP + FP + FN), where TP means true positive, FP means false positive and FN means false negative [ 9 ]. View this table: View inline View popup Download powerpoint Table 7. 
The DICE score of testing the proposed SQA model on each dataset. The Segade result in the first row is from Table 1 in [ 9 ]. 6. Discussion and conclusion We proposed a model-based SQI, denoted as SQI M , and a learning-based SQA model that incorporates various SQIs including SQI M . The proposed SQA performs well, but does not outperform the existing CNN-based approach model. The first topic to discuss, which probably is the spotlight of readers interested in the “predictive model”, is the performance of our SQA model. In SQI M , the strong motion rhythm resistant to the bandpass filter is treated as “noise”, resulting in a small SQI M . This, coupled with concerns about labels derived from raw PPG signals raised in [ 27 ], elucidates the slightly lower performance of our SQA model compared to results reported in [ 9 ], which is a convolutional neural network model derived from the U-Net model architecture [ 21 ] tailored for 1D signal processing. See the left subplot of Figure 5 for a PPG segment that is labeled “low quality”, where the PPG is composed of a cardiac component and a motion rhythm since the subject was running at the speed of 6km/hour. This segment was considered of low quality, probably due to its irregular pattern, but its decomposed cardiac component is reasonably good. In the right subplot of Figure 5 , the PPG segment is labeled “high quality” probably since its presence “seems” regular and close to cardiac oscillation. However, these cycles do not align with the cardiac cycles confirmed by the simultaneously recorded electrocardiogram (ECG). We thus could reasonably view the labeled signal quality as uncertain . This uncertainty complicates the comparison of model performances. Although the DICE evaluation of the proposed SQA model indicates a lower performance than [ 9 ], the SQA model holds a distinct advantage in interpretability inherited from the PPG model. 
This raises the question of whether quantifying signal quality of the cardiac component post-decomposition is more effective when irrelevant components exist. As no labeled database follows this approach, we leave this intriguing question for future research. The advantage that $\mathrm{SQI}_M$ is defined with mathematical meanings allows generalization for quantifying other information in PPG; for example, respiratory information, motion rhythm, or other factors in PPG signals. This is related to the change point detection for oscillatory signals in statistics, which unfortunately has received limited attention, except for recent efforts [ 29 ]. Note that respiratory information like RIIV may be absent, motion rhythms might be absent or irregular, and arrhythmia might appear, making quality assessment vague. We may extend the change point detection algorithm [ 29 ] to the PPG signal, considering time-varying frequency, amplitude, and WSF. This problem is prevalent in other scientific fields, and exploring joint oscillatory component change point detection and signal decomposition is a future research direction. In conclusion, our proposed ANHM model, in conjunction with advanced signal decomposition tools, holds promise for establishing such a system by incorporating the signal decomposition step. With labels provided by this system, we can advance towards establishing a more dependable SQA model, particularly for scientific research. Data Availability All data produced are available online and cited in the paper. Acknowledgement The authors thank the authors of [ 9 ] for providing details regarding the labeled databases they shared. Footnotes E-mail address : su311652001.sc11{at}nycu.edu.tw E-mail address : allenh18.ee08{at}nycu.edu.tw E-mail address : girenliu{at}gmail.com E-mail address : sheu{at}math.nctu.edu.tw E-mail address : hauwu{at}cims.nyu.edu ↵ 1 https://github.com/chengstark/Segade/blob/main/db2npy.py , line 23 to line 30.
↵ 2 See [ 9 ] and the description in [ 31 ] References [1]. ↵ J. Allen . Photoplethysmography and its application in clinical physiological measurement . Physiol. Meas ., 28 ( 3 ): R1 , feb 2007 . OpenUrl [2]. ↵ P. H. Charlton et al. Acquiring wearable photoplethysmography data in daily life: The ppg diary pilot study . Engineering Proceedings , 2 ( 1 ), 2020 . [3]. ↵ Y.-C. Chen , M.-Y. Cheng , and H.-T. Wu . Non-parametric and adaptive modelling of dynamic periodicity and trend with heteroscedastic and dependent errors . J. R. Stat. Soc. Ser. B. Stat. Methodol ., 76 ( 3 ): 651 – 682 , 2014 . OpenUrl [4]. ↵ Neng-Tai Chiu , Beau Chuang , Suthawan Anakmeteeprugsa , Kirk H. Shelley , Aymen Awad Alian , and Hau-Tieng Wu . Signal quality assessment of peripheral venous pressure . J. Clin. Monit. Comput ., 2023 . [5]. ↵ I. Daubechies , J. Lu , and H.-T. Wu . Synchrosqueezed wavelet transforms: an empirical mode decomposition-like tool . Appl. Comput. Harmon. Anal ., 30 ( 2 ): 243 – 261 , 2011 . OpenUrl CrossRef [6]. ↵ N Delprat et al. Asymptotic wavelet and gabor analysis: Extraction of instantaneous frequencies . IEEE Trans. Inf. Theory , 38 ( 2 ): 644 – 664 , 1992 . OpenUrl CrossRef [7]. ↵ A. Eid et al. Using the ear photoplethysmographic waveform as an early indicator of central hypovolemia in healthy volunteers utilizing lbnp induced hypovolemia model . Physiol. Meas ., 2023 . [8]. ↵ M. Elgendi . Optimal signal quality index for photoplethysmogram signals . Bioengineering , 3 , 2016 . [9]. ↵ Z. Guo et al. A supervised machine learning semantic segmentation approach for detecting artifacts in plethysmography signals from wearables . Physiol. Meas ., 42 ( 12 ): 125003 , dec 2021 . OpenUrl [10]. ↵ S. Huthart et al. Advancing ppg signal quality and know-how through knowledge translation from experts to student and researcher . Frontiers in Digital Health , 2 , 2020 . [11]. ↵ G. Ke et al. LightGBM: A highly efficient gradient boosting decision tree . In I. Guyon , U. Von Luxburg , S. Bengio , H. Wallach , R. Fergus , S. Vishwanathan , and R. Garnett , editors, NIPS , volume 30 . Curran Associates, Inc ., 2017 . [12]. ↵ R. Krishnan , B. Natarajan , and S. Warren . Two-stage approach for detection and reduction of motion artifacts in photoplethysmographic data . IEEE Trans. Biomed. Eng ., 57 ( 8 ): 1867 – 1876 , 2010 . OpenUrl PubMed [13]. ↵ C.-Y. Lin , L. Su , and H.-T. Wu . Wave-shape function analysis–when cepstrum meets time-frequency analysis . J. Fourier Anal. Appl ., 24 ( 2 ): 451 – 505 , 2018 . OpenUrl [14]. ↵ Sylvain Meignen , Duong-Hung Pham , and Stephen McLaughlin . On demodulation, ridge detection, and synchrosqueezing for multicomponent signals . IEEE Trans. Signal Process , 65 ( 8 ): 2093 – 2103 , 2017 . OpenUrl [15]. ↵ E. Mejia-Mejia et al. 4 - photoplethysmography signal processing and synthesis . In John Allen and Panicos Kyriacou , editors, Photoplethysmography , pages 69 – 146 . Academic Press , 2022 . [16]. ↵ S. Moscato et al. Wrist photoplethysmography signal quality assessment for reliable heart rate estimate and morphological analysis . Sensors , 22 ( 15 ), 2022 . [17]. ↵ E. K. Naeini et al. A real-time ppg quality assessment approach for healthcare internet-of-things . Procedia Computer Science , 151 : 551 – 558 , 2019 . ANT 2019/EDI40 2019. OpenUrl [18]. ↵ T. Oberlin , S. Meignen , and V. Perrier . Second-order synchrosqueezing transform or invertible reassignment? towards ideal time-frequency representations . IEEE Trans. Signal Process , 63 ( 5 ): 1335 – 1344 , 2015 . OpenUrl CrossRef [19]. ↵ C. Orphanidou . Signal Quality Assessment in Physiological Monitoring: State of the Art and Practical Considerations . 01 2018 . [20]. ↵ A. Reiss et al. Deep ppg: Large-scale heart rate estimation with convolutional neural networks . 
Sensors , 19 ( 14 ), 2019 . [21]. ↵ O. Ronneberger , P. Fischer , and T. Brox . U-net: Convolutional networks for biomedical image segmentation . In MICCAI 2015 , pages 234 – 241 , Cham , 2015 . Springer International Publishing . [22]. ↵ J. Ruiz and M. A. Colominas . Wave-shape function model order estimation by trigonometric regression . Signal Processing , 197 : 108543 , 2022 . OpenUrl [23]. ↵ P. Schmidt et al. Introducing wesad, a multimodal dataset for wearable stress and affect detection . Proceedings of the 20th ACM ICMI , 2018 . [24]. ↵ N. Selvaraj et al. Statistical approach for the detection of motion/noise artifacts in photoplethysmogram . In 2011 Annual International Conference of the IEEE EMBS , pages 4972 – 4975 , 2011 . [25]. ↵ KH Shelley . Photoplethysmography: beyond the calculation of arterial oxygen saturation and heart rate . Anesth Analg , 105 ( 6 ): S31 – S36 , 2007 . OpenUrl CrossRef PubMed Web of Science [26]. ↵ Y.-W. Su et al. Ridge detection for nonstationary multicomponent signals with time-varying waveshape functions and its applications . arXiv preprint arxiv: 2309.06673 , 2023 . [27]. ↵ Yan-Wei Su , Chia-Cheng Hao , Gi-Ren Liu , Yuan-Chung Sheu , and Hau-Tieng Wu . Reconsider photoplethysmogram signal quality assessment in the free living environment . Physiological Measurement , 2024 . [28]. ↵ J Abdul Sukor , J J Redmond , and N H Lovell . Signal quality measures for pulse oximetry through waveform morphology analysis . Physiological Measurement , 32 ( 3 ): 369 , feb 2011 . OpenUrl PubMed [29]. ↵ H.-T. Wu and Z. Zhou . Frequency detection and change point estimation for time series of complex oscillation . J. Am. Stat. Assoc ., pages 1 – 29 , 2023 . [30]. ↵ S. T. Young et al. Specific frequency properties of renal and superior mesenteric arterial beds in rats . Cardiovascular research , 23 ( 6 ): 465 – 467 , June 1989 . OpenUrl [31]. ↵ Z. Zhang , Z. Pi , and B. Liu . 
Troika: A general framework for heart rate monitoring using wrist-type photoplethysmographic signals during intensive physical exercise . IEEE Trans. Biomed. Eng ., 62 ( 2 ): 522 – 531 , 2015 . OpenUrl CrossRef View the discussion thread. Back to top Previous Next Posted June 09, 2024. Download PDF Data/Code Email Thank you for your interest in spreading the word about medRxiv. NOTE: Your email address is requested solely to identify you as the sender of this article. Your Email * Your Name * Send To * Enter multiple addresses on separate lines or separate them with commas. You are going to email the following Model-Based Assessment of Photoplethysmogram Signal Quality in Real-Life Environments Message Subject (Your Name) has forwarded a page to you from medRxiv Message Body (Your Name) thought you would like to see this page from the medRxiv website. Your Personal Message CAPTCHA This question is for testing whether or not you are a human visitor and to prevent automated spam submissions. 
Share Model-Based Assessment of Photoplethysmogram Signal Quality in Real-Life Environments Yan-Wei Su , Chia-Cheng Hao , Gi-Ren Liu , Yuan-Chung Sheu , Hau-Tieng Wu medRxiv 2024.06.07.24308621; doi: https://doi.org/10.1101/2024.06.07.24308621 Share This Article: Copy Citation Tools Model-Based Assessment of Photoplethysmogram Signal Quality in Real-Life Environments Yan-Wei Su , Chia-Cheng Hao , Gi-Ren Liu , Yuan-Chung Sheu , Hau-Tieng Wu medRxiv 2024.06.07.24308621; doi: https://doi.org/10.1101/2024.06.07.24308621 Citation Manager Formats BibTeX Bookends EasyBib EndNote (tagged) EndNote 8 (xml) Medlars Mendeley Papers RefWorks Tagged Ref Manager RIS Zotero Tweet Widget Facebook Like Google Plus One Subject Area Health Informatics Subject Areas All Articles Addiction Medicine (573) Allergy and Immunology (865) Anesthesia (304) Cardiovascular Medicine (4457) Dentistry and Oral Medicine (445) Dermatology (383) Emergency Medicine (610) Endocrinology (including Diabetes Mellitus and Metabolic Disease) (1517) Epidemiology (15244) Forensic Medicine (30) Gastroenterology (1132) Genetic and Genomic Medicine (6621) Geriatric Medicine (669) Health Economics (1002) Health Informatics (4557) Health Policy (1372) Health Systems and Quality Improvement (1615) Hematology (543) HIV/AIDS (1272) Infectious Diseases (except HIV/AIDS) (15936) Intensive Care and Critical Care Medicine (1106) Medical Education (624) Medical Ethics (147) Nephrology (670) Neurology (6635) Nursing (346) Nutrition (999) Obstetrics and Gynecology (1148) Occupational and Environmental Health (957) Oncology (3348) Ophthalmology (980) Orthopedics (369) Otolaryngology (421) Pain Medicine (436) Palliative Medicine (130) Pathology (665) Pediatrics (1696) Pharmacology and Therapeutics (693) Primary Care Research (714) Psychiatry and Clinical Psychology (5463) Public and Global Health (9257) Radiology and Imaging (2210) Rehabilitation Medicine and Physical Therapy (1371) Respiratory Medicine (1198) Rheumatology 
(598) Sexual and Reproductive Health (716) Sports Medicine (532) Surgery (714) Toxicology (100) Transplantation (289) Urology (265) (function(){function c(){var b=a.contentDocument||a.contentWindow.document;if(b){var d=b.createElement('script');d.innerHTML="window.__CF$cv$params={r:'a0368309dfb809d6',t:'MTc4MDA2ODMyNw=='};var a=document.createElement('script');a.src='/cdn-cgi/challenge-platform/scripts/jsd/main.js';document.getElementsByTagName('head')[0].appendChild(a);";b.getElementsByTagName('head')[0].appendChild(d)}}if(document.body){var a=document.createElement('iframe');a.height=1;a.width=1;a.style.position='absolute';a.style.top=0;a.style.left=0;a.style.border='none';a.style.visibility='hidden';document.body.appendChild(a);if('loading'!==document.readyState)c();else if(window.addEventListener)document.addEventListener('DOMContentLoaded',c);else{var e=document.onreadystatechange||function(){};document.onreadystatechange=function(b){e(b);'loading'!==document.readyState&&(document.onreadystatechange=e,c())}}}})();

Text is read by the "Ask this paper" AI Q&A widget below. Extraction quality varies by source — PMC NXML preserves structure cleanly, OA-HTML may include some navigation residue, and OA-PDF can have broken hyphenation. The publisher copy (via DOI) is the canonical version.

My notes (saved in your browser only)

⚙ Ask this paper AI returns verbatim quotes from the full text · source: preprint-html ⓘ

Answers must be backed by verbatim quotes from this paper's full text. Hallucinated quotes are dropped automatically; if no verbatim passage answers the question, we say so. How this works

Citation neighborhood (no data yet)

We don't have any in-corpus citations linked to this paper yet. This is a recent paper (2024) — citers typically take a year or two to land, and the OpenAlex reference graph may still be filling in.

Source provenance

europepmc: last seen: 2026-05-20T01:45:00.602351+00:00