Comparing Wastewater-Based and Case-Based R t Estimates of SARS-CoV-2 Transmission in Georgia Using Generalized Linear Mixed Models

preprint OA: closed
📄 Open PDF Full text JSON View at publisher
Full text 45,947 characters · extracted from preprint-html · click to expand
Comparing Wastewater-Based and Case-Based Rt Estimates of SARS-CoV-2 Transmission in Georgia, USA Using Generalised Linear Mixed Models | medRxiv /* */ /* */ <!-- <!-- /*! * yepnope1.5.4 * (c) WTFPL, GPLv2 */ (function(a,b,c){function d(a){return"[object Function]"==o.call(a)}function e(a){return"string"==typeof a}function f(){}function g(a){return!a||"loaded"==a||"complete"==a||"uninitialized"==a}function h(){var a=p.shift();q=1,a?a.t?m(function(){("c"==a.t?B.injectCss:B.injectJs)(a.s,0,a.a,a.x,a.e,1)},0):(a(),h()):q=0}function i(a,c,d,e,f,i,j){function k(b){if(!o&&g(l.readyState)&&(u.r=o=1,!q&&h(),l.onload=l.onreadystatechange=null,b)){"img"!=a&&m(function(){t.removeChild(l)},50);for(var d in y[c])y[c].hasOwnProperty(d)&&y[c][d].onload()}}var j=j||B.errorTimeout,l=b.createElement(a),o=0,r=0,u={t:d,s:c,e:f,a:i,x:j};1===y[c]&&(r=1,y[c]=[]),"object"==a?l.data=c:(l.src=c,l.type=a),l.width=l.height="0",l.onerror=l.onload=l.onreadystatechange=function(){k.call(this,r)},p.splice(e,0,u),"img"!=a&&(r||2===y[c]?(t.insertBefore(l,s?null:n),m(k,j)):y[c].push(l))}function j(a,b,c,d,f){return q=0,b=b||"j",e(a)?i("c"==b?v:u,a,b,this.i++,c,d,f):(p.splice(this.i++,0,a),1==p.length&&h()),this}function k(){var a=B;return a.loader={load:j,i:0},a}var l=b.documentElement,m=a.setTimeout,n=b.getElementsByTagName("script")[0],o={}.toString,p=[],q=0,r="MozAppearance"in l.style,s=r&&!!b.createRange().compareNode,t=s?l:n.parentNode,l=a.opera&&"[object Opera]"==o.call(a.opera),l=!!b.attachEvent&&!l,u=r?"object":l?"script":"img",v=l?"script":u,w=Array.isArray||function(a){return"[object Array]"==o.call(a)},x=[],y={},z={timeout:function(a,b){return b.length&&(a.timeout=b[0]),a}},A,B;B=function(a){function b(a){var a=a.split("!"),b=x.length,c=a.pop(),d=a.length,c={url:c,origUrl:c,prefixes:a},e,f,g;for(f=0;f<d;f++)g=a[f].split("="),(e=z[g.shift()])&&(c=e(c,g));for(f=0;f<b;f++)c=x[f](c);return c}function g(a,e,f,g,h){var i=b(a),j=i.autoCallback;i.url.split(".").pop().split("?").shift(),i.bypass||(e&&(e=d(e)?e:e[a]||e[g]||e[a.split("/").pop().split("?")[0]]),i.instead?i.instead(a,e,f,g,h):(y[i.url]?i.noexec=!0:y[i.url]=1,f.load(i.url,i.forceCSS||!i.forceJS&&"css"==i.url.split(".").pop().split("?").shift()?"c":c,i.noexec,i.attrs,i.timeout),(d(e)||d(j))&&f.load(function(){k(),e&&e(i.origUrl,h,g),j&&j(i.origUrl,h,g),y[i.url]=2})))}function h(a,b){function c(a,c){if(a){if(e(a))c||(j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}),g(a,j,b,0,h);else if(Object(a)===a)for(n in m=function(){var b=0,c;for(c in a)a.hasOwnProperty(c)&&b++;return b}(),a)a.hasOwnProperty(n)&&(!c&&!--m&&(d(j)?j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}:j[n]=function(a){return function(){var b=[].slice.call(arguments);a&&a.apply(this,b),l()}}(k[n])),g(a[n],j,b,n,h))}else!c&&l()}var h=!!a.test,i=a.load||a.both,j=a.callback||f,k=j,l=a.complete||f,m,n;c(h?a.yep:a.nope,!!i),i&&c(i)}var i,j,l=this.yepnope.loader;if(e(a))g(a,0,l,0);else if(w(a))for(i=0;i (function(w,d,s,l,i){w[l]=w[l]||[];w[l].push({'gtm.start':new Date().getTime(),event:'gtm.js'});var f=d.getElementsByTagName(s)[0];var j=d.createElement(s);var dl=l!='dataLayer'?'&l='+l:'';j.src='//www.googletagmanager.com/gtm.js?id='+i+dl;j.type='text/javascript';j.async=true;f.parentNode.insertBefore(j,f);})(window,document,'script','dataLayer','GTM-P4HH5NV'); Skip to main content Home About Submit ALERTS / RSS Search for this keyword Advanced Search Comparing Wastewater-Based and Case-Based R t Estimates of SARS-CoV-2 Transmission in Georgia, USA Using Generalised Linear Mixed Models View ORCID Profile Seth Edmunds , View ORCID Profile Doug Landsittel , View ORCID Profile Marco Ajelli , View ORCID Profile Maria Litvinova doi: https://doi.org/10.1101/2025.10.24.25338734 Seth Edmunds 1 Department of Epidemiology and Biostatistics, Indiana University School of Public Health , Bloomington, IN, USA Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Seth Edmunds For correspondence: shedmund{at}iu.edu Doug Landsittel 1 Department of Epidemiology and Biostatistics, Indiana University School of Public Health , Bloomington, IN, USA 3 Department of Biostatistics, State University of New York at Buffalo , Buffalo, NY, USA Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Doug Landsittel Marco Ajelli 2 Laboratory for Computational Epidemiology and Public Health, Indiana University School of Public Health , Bloomington, IN, USA Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Marco Ajelli Maria Litvinova 1 Department of Epidemiology and Biostatistics, Indiana University School of Public Health , Bloomington, IN, USA Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Maria Litvinova Abstract Full Text Info/History Metrics Data/Code Preview PDF Abstract The COVID-19 pandemic has highlighted limitations in case-based surveillance due to inconsistent testing and reporting. Wastewater-based epidemiology (WBE) has emerged as a complementary surveillance approach for tracking SARS-CoV-2 transmission, capturing both symptomatic and asymptomatic infections. The aim of this study is to evaluate the effectiveness of WBE in estimating the effective reproduction number ( R t ) of SARS-CoV-2 in Georgia, USA. We used a Generalised Linear Mixed Model to analyse viral concentration data from multiple wastewater treatment plants (WWTPs) collected between June 1, 2022 and December 15, 2022. After controlling for flow rates and site-level heterogeneity, model residuals were transformed into a non-negative incidence-like series used to estimate wastewater-based R t . Wastewater-based R t was compared with case-based R t estimates using Spearman correlation. The two R t estimates showed concordant temporal patterns across most sites, with stronger correlations in areas with higher case counts (Spearman correlations ranging from 0.39 to 0.84, p < 0.001). Wastewater-based R t tracked increases and decreases in transmission over similar time scales as case-based estimates, while exhibiting reduced sensitivity to short-term changes in clinical testing and reporting behaviour. These findings suggest that WBE can support estimation of transmission trends and complement traditional case-based surveillance for public health monitoring. Introduction The COVID-19 pandemic has underscored the need for effective surveillance systems to monitor disease transmission at the population level. Initially, case-based surveillance was critical for tracking the spread of COVID-19. However, fluctuations in testing rates and the changes in reporting practices gradually undermined its reliability. By late 2022, the shift by the Centers for Disease Control and Prevention (CDC) from daily to weekly aggregated case and death reporting reduced the temporal resolution of data available for public health monitoring. This change was intended to reduce the reporting burden and improve operational efficiency, but it limited the ability to assess localised and short-term transmission dynamics. After the expiration of the public health emergency on May 11, 2023, the U.S. Department of Health and Human Services (HHS) could no longer require laboratories to submit COVID-19 testing results; subsequently, hospital COVID-19 reporting requirements were discontinued effective May 1, 2024 ( 1 ). Together, these changes highlight the need for complementary surveillance approaches capable of monitoring population-level transmission when clinical reporting is incomplete or delayed. In response to these challenges, wastewater-based epidemiology (WBE) has re-emerged as a promising complementary approach, providing a non-invasive, scalable method to track viral RNA in community wastewater, capturing both symptomatic and asymptomatic infections. WBE offers a unique opportunity to supplement traditional case-based surveillance, particularly by providing a population-level signal that is less dependent on individual testing behaviour and can reflect changes in community transmission. Because wastewater surveillance occurs at the community level, it is less sensitive to biases arising from uneven access to testing and underreporting, making WBE especially valuable in settings with limited healthcare access or inconsistent clinical testing ( 2 , 3 ). With the rise of at-home COVID-19 testing, which is largely not reported, comparing wastewater-based and clinical estimates of the effective reproduction number ( R t ) has become increasingly important for understanding transmission dynamics while recognizing that each data stream reflects different processes and sources of spatio-temporal heterogeneity. Recent studies have begun to leverage wastewater data alongside clinical surveillance to infer transmission dynamics and develop early-warning systems under varying assumptions about shedding, reporting, and observation processes ( 4 ). By capturing SARS-CoV-2 RNA at the community level, wastewater-based epidemiology (WBE) provides a population-scale signal that is less influenced by biases in clinical data, such as uneven testing access, changing individual behaviour, or reporting delays, though it is subject to its own sources of variability (5 Several studies have estimated wastewater-based SARS-CoV-2 effective reproduction numbers using various assumptions, preprocessing, and model complexities ( 2 , 6 ) While county-level estimations have shown high concordance with traditional case-based estimates ( 7 ), there is a need to validate these methods at finer scales. Using a unique dataset that includes both reported cases and wastewater surveillance at the level of individual sewersheds, we demonstrate the concordance of R t estimations on a disaggregated level. This study provides evidence for the operational utility of wastewater-based R t estimations and offers a practical pipeline accounting for sewershed-related heterogeneity. The aim of this study is to evaluate the effectiveness of WBE in estimating R t of SARS-CoV-2 at a sewershed level. We focus on data collected between June 1 and December 15, 2022 - a period during which routine case reporting via electronic laboratory and provider reports remained available, enabling a contemporaneous comparison of wastewater-based and case-based R t estimates. To compare these signals, we apply a Generalised Linear Mixed Model (GLMM) to wastewater concentrations, adjusting for temporal trends, flow-related dilution, and persistent sewershed differences. This approach allows us to assess the degree to which wastewater-derived transmission dynamics align with contemporaneous case-based R t estimates at the sewershed level, and to evaluate the role of WBE as a complementary surveillance signal for clinical data at finer scales. ( 1 , 8 ). Methods Data Collection Wastewater Data Sources WWTP employees collected twice-weekly wastewater samples, which were shipped to two university laboratories for analysis. Sampling frequency was typically twice weekly across sites, though exact schedules varied by facility and operational constraints (summarized in Appendix Table A1). Viral RNA concentrations were quantified using PCR, specifically targeting the N2 gene for its widespread use and comparable performance to the N1 target (Huisman et al., 2022). RT-qPCR was used at WWTP 9 following the method detailed by Lott et al. (2023) due to logistical constraints, while dPCR, preferred for its higher sensitivity to low viral concentrations, was used at all other sites following the protocol described by Sablon et al. (2022) (Sablon et al. 2022). Differences in analytical platform across sites were treated as time-invariant site characteristics and accounted for through site-level random effects in downstream modelling. Flow rate data were obtained from routine facility records and aligned with wastewater sampling dates; depending on facility practice, measurements corresponded to composite (time- or flow-weighted) or grab sampling approaches, consistent with standard wastewater surveillance reporting practices ( 11 ). Concurrent flow rates were incorporated to account for dilution-related variability in wastewater volume. Case Data Sources Case data were obtained from routine provider and electronic laboratory reports submitted to the Department of Public Health (DPH) and stored within an electronic disease reporting system. Residential addresses were geocoded to obtain XY coordinates. Sewershed shapefiles were provided by the facilities. Case-to-sewershed assignment assumes accurate residential geocoding and alignment with sewershed boundaries, consistent with standard public health surveillance practice. Case data were aggregated daily by sewershed geography using symptom onset date when available; specimen collection date was used otherwise. Data Processing Case Data Processing Cases were assigned to sewersheds based on geocoded residential addresses and the spatial overlap with sewershed boundaries. Epidemic curves were generated using either the date of symptom onset or, if unavailable, the date of the first positive specimen (including asymptomatic cases). Missing daily case counts were imputed using Kalman filtering to provide smoothed estimates, ensuring the preservation of temporal sequences while handling reporting fluctuations. Imputation primarily reflects completion of a daily time series from routine non-daily reporting rather than filling extended gaps in surveillance and the Kalman approach was selected based on comparative performance in preserving temporal structure, as summarized in the Appendix. Data were restricted to the study period from June 1, 2022, to December 15, 2022, and the processed case data were used in conjunction with wastewater viral concentrations for analysis. Wastewater Data Processing All data are from 8 sewersheds in Georgia, USA. Outliers in wastewater viral concentrations and flow rates were detected using the Interquartile Range (IQR) method, with outliers replaced by the median to reduce their influence on downstream analysis. Flagged values were treated as transient spikes for robustness rather than assumed measurement errors, and the number of flagged observations by site is reported in Appendix Table A2. While Appendix Table A1 summarizes the characteristics of all 10 facilities participating in the broader state surveillance program, two facilities, WWTP 4 and WWTP 7, lacked sufficient data during the study period window (June 1 – December 15, 2022). Because only observations exceeding the IQR threshold were modified, minimum and maximum values could remain unchanged if those extremes did not meet the outlier criterion. This method was selected based on a sensitivity analysis comparing multiple outlier detection techniques, including Median Absolute Deviation (MAD), using agreement with case-based R t (Spearman correlation and RMSE) as evaluation criteria. Samples were predominantly 24-hour composite, collected twice weekly. Population served by individual sewersheds varied from 10,000 (WWTP 10) to 650,000 (WWTP 1) Sewershed locations spanned urban, suburban, and rural areas across Georgia; specific geographic coordinates are not disclosed to protect facility identities, but site-level population, flow, and sample characteristics are summarized in Appendix Table A1. Concentrations were not pre-normalised. Instead, by including flow as a fixed effect in the GLMM, the model inherently adjusts for flow-related dilution, with the resulting residuals representing viral signal fluctuations independent of flow variation. Preprocessing method selection was guided by comparative evaluation across multiple approaches. Outlier detection using the IQR method flagged 27 concentration values and 57 flow values across sites, compared with 27, and 123 respectively for the MAD approach. Missing data imputation using Kalman filtering (71.8% of the daily time series) reflected completion to daily resolution from approximately twice-weekly sampling; inter-sample gaps had a median of 2 days. Sensitivity analyses across rolling window lengths showed that 14-day windows achieved the highest concordance with case-based R t estimates (median Spearman ρ = 0.608, IQR = 0.121), comparable to 10-day windows (ρ = 0.612, IQR = 0.184) and superior to 7-day windows (ρ = 0.593, IQR = 0.254). The selected preprocessing combination (IQR outlier detection, Kalman imputation, 14-day rolling average) balanced noise reduction with preservation of transmission trends and minimized data loss (flagging fewer than half as many flow outliers as the MAD approach), as assessed by correlation with case-based estimates (median RMSE = 0.098). Complete site-level characteristics, outlier counts, missingness patterns, and sensitivity results are provided in Appendix Tables A1-A4. Missing data were interpolated using Kalman filtering, chosen for its performance relative to linear and spline interpolation methods in preserving temporal structure during routine non-daily sampling. (Miyazawa et al. 2024; Narci et al. 2021) Both viral concentrations and flow rates were log-transformed to stabilise variance and normalise the data distribution. Comparisons of raw and processed data are presented in Appendix Table A5. These preprocessing steps were implemented to stabilise the time series for downstream transmission trend estimation rather than to reconstruct true incidence or shedding processes. Statistical Modelling Model Specification A Generalised Linear Mixed Model (GLMM) was employed (significance level set to α=0.05) to analyse viral concentrations in wastewater, with both fixed and random effects to capture the hierarchical and temporal structure of the data. The fixed effects included time and flow rate, while the random effects accounted for site-level variability across WWTPs. Model diagnostics were used to assess statistical fit and stability of the mixed-effects model, including residual behaviour and random-effect variance. While these diagnostics ensure the statistical robustness of the framework, they do not, by themselves, imply the biological validity of the resulting residual time series as a direct and comprehensive measure of the number of infections. By accounting for both site-specific and time-based variability, the model provided a flexible framework for analyzing transmission dynamics signal. ( 14 , 15 ) Where: Y it is the viral concentration in wastewater at time t for WWTP i . β 0 is the fixed intercept representing the global baseline concentration. β 1 is the coefficient for the linear temporal trend. β 2 is the coefficient adjusting for the log-transformed wastewater flow rate. t is a daily time variable to account for temporal trends. flow it is the flow rate of wastewater at time t for WWTP i . γ 0i is the random intercept for WWTP i , capturing time-invariant site-specific differences where . ϵ it is the residual error term. The primary specification includes a fixed effect for temporal trend and a site-specific random intercept, implying a common temporal trend with persistent site-specific differences. By utilizing a GLMM instead of manual flow-normalization, we provide a unified framework to adjust simultaneously for flow-related dilution, shared temporal trends, and site-level heterogeneity (e.g., variations in measurement and sampling approaches) that are captured by the random intercept (γ 0i ). By intentionally omitting site-specific random slopes for time, we ensure that localised deviations from the regional trend are preserved within the residuals (ϵ it ) rather than being absorbed into the model parameters. This approach allows the residuals to more accurately reflect the site-level dynamics necessary for subsequent R t estimations while accommodating the nested data structure. It is important to note that the linear time covariate is specified as a global fixed effect across a geographically diverse set of sewersheds. It is intended to control for shared baseline trend without absorbing localised epidemic waves. However, researchers applying this framework should note that if applied to highly synchronized, homogeneous sites over a short period, the global time effect may absorb the epidemic signal, especially during the period of consistent epidemic growth or decline. In such cases, the approach should be implemented without the time trend fixed effects. Empirical demonstrations of the model’s robustness across varying observation windows and distinct transmission phases are provided in Appendix Figures A1 and A2, respectively. Residual Extraction and Smoothing Residuals ϵ it from the GLMM were extracted to capture variability in viral concentrations not explained by the fixed effects of time, flow rate, and site-specific differences in wastewater concentrations, including measurement differences. The inclusion of site-specific random intercepts accounts for persistent between-site differences in baseline viral concentration, allowing within-site temporal deviations to be examined on a comparable scale. To reduce high-frequency noise, a 14-day rolling average was applied to the residual series. While rolling averages introduce additional temporal smoothing and may attenuate short-term changes, this window length reflects a pragmatic balance between noise reduction and trend interpretability and was evaluated through sensitivity analyses reported in Appendix Table A4. This approach ensures that critical transmission patterns are preserved while minimizing the impact of daily fluctuations. Accordingly, residual-based analyses are intended to support inference on transmission trends rather than to reconstruct individual-level infection, shedding processes, case or hospitalization incidence. Estimation of the Effective Reproduction Number (Rt) Rt Calculation The effective reproduction number ( R t ) was estimated using the EpiEstim package in R. ( 16 , 17 ) A parametric serial interval distribution was specified with a mean of 2.75 days and a standard deviation of 2.53 days, utilizing updated parameters specific to the SARS-CoV-2 Omicron variant. (Kremer et al., 2022) To align with the requirements for R t estimation, the GLMM residuals were exponentiated to back-transform the values from the log-link model and ensure the non-negativity required for an incidence proxy. Two estimates of R t were calculated: one based on case-derived incidence, and one based on a transformed wastewater-derived residual series. Both case-based and wastewater-based series were smoothed using a 14-day rolling average prior to R t estimation to reduce short-term noise, with the understanding that this additional smoothing further convolves the underlying signal; the impact of window length on R t concordance was evaluated through sensitivity analyses reported in the Appendix Table A4. ( 2 , 3 ) As a result, wastewater-derived R t estimates are interpreted as a signal of relative transmission dynamics rather than as direct estimates of intrinsic incidence-based reproduction parameters. Sensitivity Analysis: Rolling Average Window A sensitivity analysis was performed to assess the impact of rolling average window length on both case-based and wastewater-based R t estimates. Rolling windows ranging from 3 to 30 days were evaluated, with performance assessed based on agreement with case-based R t (Spearman correlation and RMSE) and qualitative stability of inferred trends. The 14-day window was selected for primary analysis because it provided a pragmatic balance between noise reduction and temporal responsiveness across sites, as summarized in Appendix Table A4. Longer windows further reduced noise but increasingly attenuated short-term changes during periods of rapid transmission change. ( 19 ) Estimate Alignment To quantify concordance between wastewater-based and case-based R t estimates, we computed Spearman rank correlation coefficients across sites. Analyses were restricted to the period prior to December 2022, after which changes in case reporting requirements substantially altered the reliability and completeness of case-based surveillance. Alignment was further assessed by comparing the temporal co-movement of wastewater-based R t , case-based R t , and reported case counts, focusing on direction and timing of major transmission changes rather than pointwise equality. This approach emphasizes concordance in transmission trends under differing observation processes rather than validation against a presumed ground truth. ( 20 ) Results The initial dataset comprised 294 observations for both PCR target average concentration and flow rate measurements across eight WWTPs. After data preprocessing, which included outlier handling and missing data imputation, the number of observations increased to 1,019. Detailed statistics on preprocessing outcomes are presented in the Appendix. A total of 749 data points (72% of the dataset) were imputed using Kalman smoothing reflecting routine completion of a daily time series from non-daily (typically twice-weekly) sampling rather than extended gaps in surveillance. Kalman smoothing was employed because it effectively estimates missing values in time series data by modelling the underlying stochastic processes. This method accounts for variability by incorporating both the observed data and the process noise, allowing for smoothed estimates of the underlying temporal signal amidst measurement uncertainty and routine sampling variability. (Narci et al. 2021) An overview of the R t estimates derived from both case-based and wastewater-based surveillance is provided in Table 1 . This table includes the duration of data collection, total case counts, median R t values, and Spearman correlation coefficients across the eight wastewater treatment plants (WWTPs). All statistically significant results illustrate notable positive correlation between the two R t estimations, with the highest correlation being observed for WWTP 5 (0.84, p < 0.001) and the lowest for WWTP 3 (0.39, p < 0.001). The results ( Table 1 ) indicate that average case burden influenced both correlation strength and statistical significance ( Figure 1 ). For example, no statistically significant correlation was observed for WWTP 9; while its data collection duration was comparable to WWTP 1, its average case burden was substantially lower. Generally, correlation strength and statistical significance aligned with overall case burden. Sewersheds with very low daily case counts frequently lacked the temporal variability required to power rank-based correlation (e.g., WWTP 9 and WWTP 6). However, statistically significant correlations were occasionally observed even in low-incidence settings (e.g., WWTP 10, averaging approximately 2 cases per day). The overall pattern is illustrated in Figure 1 , where R t concordance generally increases as a function of the average number of cases. View this table: View inline View popup Download powerpoint Table 1. Core Statistics of R t Estimates, Correlations and Sewershed Characteristics (ordered by descending case burden) Download figure Open in new tab Figure 1. Average Number of Cases and Spearman Correlation Coefficient Between Case-Based and Wastewater-Based R t Estimates by Wastewater Treatment Plant Sewershed The vertical dashed line indicates approximately five average daily cases (log scale), below which rank-based correlation was generally underpowered in our data, though exceptions were observed (e.g., WWTP 10). Download figure Open in new tab Figure 2. Comparison of Wastewater-Based and Case-Based R t Estimates for WWTP 1 At WWTP 1, the wastewater-based and case-based R t estimates closely tracked from June through August, both peaking in mid-July, which aligns with the peaks in the interpolated wastewater signal and clinical case incidence ( Figure 2 ). By late August, both estimates fell below the epidemic threshold (Rt=1). From mid-October onward, the wastewater-based climbed above epidemic threshold earlier than the case-based estimate in this sewershed. Download figure Open in new tab Figure 3. Comparison of Wastewater-Based and Case-Based R t Estimates for WWTP 3 In WWTP 3, the wastewater-based estimates sometimes lagged peaks in the case-based R t ( Figure 3 ). In mid-October, the wastewater-based R t increased to approximately 1.1−1.3, with comparatively narrower confidence intervals, while the case-based estimates exhibited wider uncertainty that encompassed the threshold of 1.0. Download figure Open in new tab Figure 4. Comparison of Wastewater-Based and Case-Based R t Estimates for WWTP 5 For WWTP 5, the wastewater-based R t initially aligned with case-based trends during early summer, with values above 1.0 ( Figure 4 ). In mid-September, the wastewater-based R t declined below 0.8 prior to a similar decline in the case-based estimate. A subsequent increase in the wastewater-based R t in mid-October preceded a rise in cases. Download figure Open in new tab Figure 5. Comparison of Wastewater-Based and Case-Based R t Estimates for WWTP 8 At WWTP 8, the wastewater-based R t remained above 1.0 from early July, with brief dips ( Figure 5 ). Case-based R t exhibited broadly similar temporal patterns but with shifts in timing consistent with differences in smoothing and observation processes. Download figure Open in new tab Figure 6. Comparison of Wastewater-Based and Case-Based R t Estimates for WWTP 2 At WWTP 2, over the shorter study period, the wastewater-based R t remained consistently above 1.0, while the case-based R t rose above 1.0 in early December ( Figure 6 ). An initial elevation in the wastewater-based estimate was interpreted as a transient anomaly consistent with preprocessing and smoothing effects rather than sustained transmission change. Overview of Rt Estimates Across All Sites Table 2 . Percent of Days with R t Confidence Intervals Above or Below 1 (ordered by descending case burden) View this table: View inline View popup Download powerpoint Table 2. illustrates the percentage of days on which lower and upper bounds of the R t confidence intervals (CIs) were either above or below the epidemic threshold (1.0). This metric provides supplementary information on directional agreement relative to the epidemic threshold ( R t = 1), but was not used as a primary performance criterion because it is sensitive to smoothing choices and uncertainty width. Detailed Analysis of Representative Sites The wastewater-based and case-based R t estimates were analysed across five representative sites with total case incidence greater than 1,000 cases during the study period. Each site exhibits unique patterns in transmission dynamics, as captured by the two surveillance methods. Sites were selected to represent higher-incidence sewersheds where case-based R t estimates showed sufficient variability to support meaningful temporal comparisons. The sites are presented in the order of decreasing case burden. Two levels of uncertainty around median estimates (50% and 95% Cis) are used to represent two levels of potential risk-tolerance of public health practitioners in making decisions based on uncertain data. Discussion Our analyses indicate that wastewater-based R t estimates exhibited broadly similar temporal patterns to case-based estimates across most sites, capturing transmission shifts within approximately two weeks of clinical data. The fundamental purpose of evaluating a clinical comparator is to determine whether pathogen detection in wastewater translates into a tangible public health burden. However, selecting an appropriate clinical comparator requires navigating the inherent limitations of all potential public health signals. Because R t estimation relies on the ratio of successive incidence values rather than absolute counts, it remains mathematically robust to systematic underreporting provided ascertainment does not shift abruptly. Therefore, the optimal choice must be guided by the stability of the signal during the observation window and the specific practical needs of public health authorities. For this study, we utilized reported case incidence by symptom onset or collection date. While such data inherently underestimates true infection burden, as demonstrated by infection incidence being 2.2 to 3.7 times higher than reported cases in the United States during the Omicron wave ( 21 ), reporting requirements during our study period (June– December 2022) were sufficiently stable to establish a reliable baseline. The subsequent expiration of public health mandates and the wider utilization of non-reportable at-home testing rapidly rendered clinical ascertainment lower and highly volatile ( 21 ), necessitating our choice of the study’s end date. Therefore, for this study, reported cases provided the most stable, geospatially appropriate comparator to address the local public health burden at the sewershed level. However, during periods of rapid surveillance infrastructure changes, divergence between wastewater and clinical signals should not be interpreted as a failure of wastewater surveillance, but rather as a complementary reflection of community transmission dynamics essential for comprehensive situational awareness. Several limitations should be acknowledged. A substantial portion of the time series required completion to daily resolution for R t estimation, primarily reflecting routine non-daily sampling rather than prolonged data gaps. Kalman smoothing was used to interpolate missing days and stabilise temporal structure, which may attenuate short-term variability but is necessary for renewal-based estimation frameworks. Additionally, wastewater measurements reflect a convolution of infections over heterogeneous shedding durations and sewer transport processes. As a result, wastewater-derived R t should be interpreted as a smoothed indicator of transmission trends rather than a direct measure of incident infections. This interpretation is subject to uncertainties and heterogeneities in SARS-CoV-2 shedding likelihood, rates, duration, and routes. Furthermore, while we account for the flow differences, variability introduced by site-specific shedding dynamics, viral variants, and in-sewer environmental factors impacts the precision of these estimates. Nevertheless, these uncertainties do not preclude the detection of major transmission shifts as evidenced by the strong concordance observed with case data in higher-burden areas. Finally, assignment of COVID-19 cases to sewersheds relied on residential address geocoding, which may misclassify infections if substantial exposure or shedding occurred outside the residential sewershed. Future studies could enhance geolocation accuracy by incorporating additional data sources or methods, such as improved address resolution or alternative approaches to case-to-sewershed assignment. These limitations highlight areas for methodological improvement but do not alter the central finding that wastewater-based R t estimates captured transmission trends broadly consistent with case-based surveillance. Rather than enabling direct intervention decisions, wastewater-derived R t provides a complementary indicator of changing transmission dynamics that may support situational awareness when clinical surveillance is incomplete or delayed. The weaker correlation observed at WWTP 3 (ρ = 0.39) despite higher total case counts compared with WWTP 5 (ρ = 0.84) likely reflects differences in case variability rather than absolute burden. WWTP 3 exhibited lower day-to-day variance in case incidence during the study period, reducing the discriminatory power of rank-based correlation metrics even when directional trends were broadly consistent. Hill et al. (2025) compared eight WBE-based R t estimation approaches and found that methodological choices substantially influenced estimates. The present study does not seek to advance a competing method but rather to assess whether a relatively simple GLMM framework applied to routine twice-weekly sampling can yield transmission trend indicators concordant with case-based surveillance at the sewershed level. Future research may benefit from evaluating how wastewater-based surveillance scales to larger geographic units, such as counties or clusters of wastewater treatment plants, and whether multiple facilities within a region capture consistent spatiotemporal transmission patterns. Assessing how wastewater-derived indicators can be aggregated without obscuring local dynamics would inform their use in regional surveillance frameworks. As wastewater surveillance continues to be integrated into public health practice, clarifying its role next to the traditional epidemiologic data will be essential for understanding how population-level signals can complement, rather than replace, case-based reporting systems. Data Availability Data is available upon request from Georgia Department of Public Health https://dph.georgia.gov/phip-data-request Data Availability Code used for this analysis is available at: https://github.com/sethmund/wastewater_glmm . Wastewater and case surveillance data are available upon request from the Georgia Department of Public Health subject to data use agreements. Acknowledgments We thank the Georgia Department of Public Health for providing access to sewershed-level COVID-19 case data, and the participating wastewater treatment plant operators and university laboratory partners for sample collection and analysis. Appendix Footnotes Updated various tables and figures, adjusted language, corrected errors. References 1. ↵ Silk BJ . COVID-19 Surveillance After Expiration of the Public Health Emergency Declaration—United States, May 11, 2023 . Morbidity and Mortality Weekly Report . 2023 ; 72 : e1 . OpenUrl 2. ↵ Huisman JS , et al. Wastewater-Based Estimation of the Effective Reproductive Number of SARS-CoV-2 . Environmental Health Perspectives . 2022 ; 130 ( 5 ): 057011 . OpenUrl CrossRef PubMed 3. ↵ Zheng X , et al. Wastewater Surveillance Provides Spatiotemporal SARS-CoV-2 Infection Dynamics . Engineering . 2024 ; 40 ( 9 ) pages 70 – 77 , OpenUrl 4. ↵ Safford H , et al. Wastewater-Based Epidemiology for COVID-19: Handling qPCR Nondetects and Comparing Spatially Granular Wastewater and Clinical Data Trends . ACS ES&T Water . 2022 ; 2 ( 11 ): 2114 – 24 . OpenUrl 5. Nourbakhsh S , et al. A Wastewater-Based Epidemic Model for SARS-CoV-2 with Application to Three Canadian Cities . Epidemics . 2022 ; 39 : 100560 . OpenUrl PubMed 6. ↵ Hill A , et al. Comparison of methods for estimating the effective reproduction number from wastewater data . Epidemics . 2025 ; 52 : 100839 . OpenUrl PubMed 7. ↵ Ravuri S , et al. Estimating effective reproduction numbers using wastewater data from multiple sewersheds for SARS-CoV-2 in California counties . Epidemics . 2025 ; 50 : 100803 . OpenUrl PubMed 8. ↵ Ungar L. Pandemic Gets Tougher to Track as COVID Testing Plunges . Associated Press . 2022 . 9. Lott MEJ , et al. Direct Wastewater Extraction as a Simple and Effective Method for SARS-CoV-2 Surveillance and COVID-19 Community-Level Monitoring . FEMS Microbes . 2023 ; 4 : xtad004 . OpenUrl 10. Sablon O , et al. Nanotrap® KingFisher Concentration/Extraction & MagMAX KingFisher Extraction . protocols.io . 2022 . 11. ↵ Antkiewicz DS , et al. Wastewater-Based Protocols for SARS-CoV-2: Insights into Virus Concentration, Extraction, and Quantitation Methods from Two Years of Public Health Surveillance . Environmental Science: Water Research & Technology . 2024 ; 10 ( 8 ): 1766 – 84 . OpenUrl CrossRef 12. Miyazawa S , et al. Wastewater-Based Reproduction Numbers and Projections of COVID-19 Cases in Three Areas in Japan, November 2021 to December 2022 . Eurosurveillance . 2024 ; 29 ( 8 ): 2300277 . OpenUrl PubMed 13. Narci R , et al. Inference for Partially Observed Epidemic Dynamics Guided by Kalman Filtering Techniques . Computational Statistics & Data Analysis . 2021 ; 164 : 107319 . OpenUrl 14. ↵ Daza-Torres ML , et al. A Mixed-Effects Model to Predict COVID-19 Hospitalizations Using Wastewater Surveillance . Journal of Environmental Chemical Engineering . 2024 ; 12 ( 2 ): 112485 . OpenUrl 15. ↵ de Graaf M , et al. Capturing the SARS-CoV-2 Infection Pyramid Within the Municipality of Rotterdam Using Longitudinal Sewage Surveillance . The Science of the Total Environment . 2023 ; 883 : 163599 . OpenUrl CrossRef PubMed 16. ↵ Cori A , et al. A New Framework and Software to Estimate Time-Varying Reproduction Numbers During Epidemics . American Journal of Epidemiology . 2013 ; 178 ( 9 ): 1505 – 12 . OpenUrl CrossRef PubMed 17. ↵ Nash RK , et al. Estimating the Epidemic Reproduction Number from Temporally Aggregated Incidence Data: A Statistical Modelling Approach and Software Tool . PLOS Computational Biology . 2023 ; 19 ( 8 ): e1011439 . OpenUrl 18. Kremer C , et al. Serial Intervals for SARS-CoV-2 Omicron and Delta Variants, Belgium, November 19-December 31, 2021 . Emerging Infectious Diseases . 2022 ; 28 ( 8 ): 1699 – 1702 . OpenUrl CrossRef PubMed 19. ↵ Wannigama DL , et al. COVID-19 monitoring with sparse sampling of sewered and non-sewered wastewater in urban and rural communities . iScience . 2023 ; 26 ( 7 ): 107019 . OpenUrl PubMed 20. ↵ Rezaeitavabe F , et al. Beyond Linear Regression: Modelling COVID-19 Clinical Cases with Wastewater Surveillance of SARS-CoV-2 for the City of Athens and Ohio University Campus . Science of The Total Environment . 2024 ; 912 : 169028 . OpenUrl CrossRef PubMed 21. ↵ Deng Y , et al. Ratio of Infections to COVID-19 Cases and Hospitalizations in the United States based on SARS-CoV-2 Seroprevalence Data, September 2021-February 2022 . Open Forum Infectious Diseases . 2025 ; 12 ( 1 ): ofae719 . OpenUrl PubMed View the discussion thread. Back to top Previous Next Posted April 11, 2026. Download PDF Data/Code Email Thank you for your interest in spreading the word about medRxiv. NOTE: Your email address is requested solely to identify you as the sender of this article. Your Email * Your Name * Send To * Enter multiple addresses on separate lines or separate them with commas. You are going to email the following Comparing Wastewater-Based and Case-Based Rt Estimates of SARS-CoV-2 Transmission in Georgia, USA Using Generalised Linear Mixed Models Message Subject (Your Name) has forwarded a page to you from medRxiv Message Body (Your Name) thought you would like to see this page from the medRxiv website. Your Personal Message CAPTCHA This question is for testing whether or not you are a human visitor and to prevent automated spam submissions. Share Comparing Wastewater-Based and Case-Based R t Estimates of SARS-CoV-2 Transmission in Georgia, USA Using Generalised Linear Mixed Models Seth Edmunds , Doug Landsittel , Marco Ajelli , Maria Litvinova medRxiv 2025.10.24.25338734; doi: https://doi.org/10.1101/2025.10.24.25338734 Share This Article: Copy Citation Tools Comparing Wastewater-Based and Case-Based R t Estimates of SARS-CoV-2 Transmission in Georgia, USA Using Generalised Linear Mixed Models Seth Edmunds , Doug Landsittel , Marco Ajelli , Maria Litvinova medRxiv 2025.10.24.25338734; doi: https://doi.org/10.1101/2025.10.24.25338734 Citation Manager Formats BibTeX Bookends EasyBib EndNote (tagged) EndNote 8 (xml) Medlars Mendeley Papers RefWorks Tagged Ref Manager RIS Zotero Tweet Widget Facebook Like Google Plus One Subject Area Epidemiology Subject Areas All Articles Addiction Medicine (568) Allergy and Immunology (863) Anesthesia (299) Cardiovascular Medicine (4428) Dentistry and Oral Medicine (444) Dermatology (382) Emergency Medicine (608) Endocrinology (including Diabetes Mellitus and Metabolic Disease) (1508) Epidemiology (15225) Forensic Medicine (30) Gastroenterology (1124) Genetic and Genomic Medicine (6592) Geriatric Medicine (667) Health Economics (997) Health Informatics (4530) Health Policy (1368) Health Systems and Quality Improvement (1613) Hematology (540) HIV/AIDS (1264) Infectious Diseases (except HIV/AIDS) (15912) Intensive Care and Critical Care Medicine (1103) Medical Education (623) Medical Ethics (145) Nephrology (667) Neurology (6593) Nursing (346) Nutrition (998) Obstetrics and Gynecology (1143) Occupational and Environmental Health (957) Oncology (3332) Ophthalmology (971) Orthopedics (369) Otolaryngology (420) Pain Medicine (436) Palliative Medicine (129) Pathology (663) Pediatrics (1691) Pharmacology and Therapeutics (691) Primary Care Research (710) Psychiatry and Clinical Psychology (5441) Public and Global Health (9223) Radiology and Imaging (2197) Rehabilitation Medicine and Physical Therapy (1370) Respiratory Medicine (1196) Rheumatology (593) Sexual and Reproductive Health (712) Sports Medicine (530) Surgery (712) Toxicology (99) Transplantation (289) Urology (265) (function(){function c(){var b=a.contentDocument||a.contentWindow.document;if(b){var d=b.createElement('script');d.innerHTML="window.__CF$cv$params={r:'9fffd450ca2d4807',t:'MTc3OTQ5NDk0MA=='};var a=document.createElement('script');a.src='/cdn-cgi/challenge-platform/scripts/jsd/main.js';document.getElementsByTagName('head')[0].appendChild(a);";b.getElementsByTagName('head')[0].appendChild(d)}}if(document.body){var a=document.createElement('iframe');a.height=1;a.width=1;a.style.position='absolute';a.style.top=0;a.style.left=0;a.style.border='none';a.style.visibility='hidden';document.body.appendChild(a);if('loading'!==document.readyState)c();else if(window.addEventListener)document.addEventListener('DOMContentLoaded',c);else{var e=document.onreadystatechange||function(){};document.onreadystatechange=function(b){e(b);'loading'!==document.readyState&&(document.onreadystatechange=e,c())}}}})();

Text is read by the "Ask this paper" AI Q&A widget below. Extraction quality varies by source — PMC NXML preserves structure cleanly, OA-HTML may include some navigation residue, and OA-PDF can have broken hyphenation. The publisher copy (via DOI) is the canonical version.

My notes (saved in your browser only)

Ask this paper AI returns verbatim quotes from the full text · source: preprint-html

Answers must be backed by verbatim quotes from this paper's full text. Hallucinated quotes are dropped automatically; if no verbatim passage answers the question, we say so. How this works

Citation neighborhood (no data yet)

We don't have any in-corpus citations linked to this paper yet. This is a recent paper (2025) — citers typically take a year or two to land, and the OpenAlex reference graph may still be filling in.

Source provenance

europepmc
last seen: 2026-05-20T01:45:00.602351+00:00