Generalizing population RT-qPCR cycle threshold values-informed estimation of epidemiological dynamics: Impact of surveillance practices and pathogen variability

preprint OA: closed
📄 Open PDF Full text JSON View at publisher
Full text 52,750 characters · extracted from preprint-html · click to expand
Generalizing population RT-qPCR cycle threshold values-informed estimation of epidemiological dynamics: Impact of surveillance practices and pathogen variability | medRxiv /* */ /* */ <!-- <!-- /*! * yepnope1.5.4 * (c) WTFPL, GPLv2 */ (function(a,b,c){function d(a){return"[object Function]"==o.call(a)}function e(a){return"string"==typeof a}function f(){}function g(a){return!a||"loaded"==a||"complete"==a||"uninitialized"==a}function h(){var a=p.shift();q=1,a?a.t?m(function(){("c"==a.t?B.injectCss:B.injectJs)(a.s,0,a.a,a.x,a.e,1)},0):(a(),h()):q=0}function i(a,c,d,e,f,i,j){function k(b){if(!o&&g(l.readyState)&&(u.r=o=1,!q&&h(),l.onload=l.onreadystatechange=null,b)){"img"!=a&&m(function(){t.removeChild(l)},50);for(var d in y[c])y[c].hasOwnProperty(d)&&y[c][d].onload()}}var j=j||B.errorTimeout,l=b.createElement(a),o=0,r=0,u={t:d,s:c,e:f,a:i,x:j};1===y[c]&&(r=1,y[c]=[]),"object"==a?l.data=c:(l.src=c,l.type=a),l.width=l.height="0",l.onerror=l.onload=l.onreadystatechange=function(){k.call(this,r)},p.splice(e,0,u),"img"!=a&&(r||2===y[c]?(t.insertBefore(l,s?null:n),m(k,j)):y[c].push(l))}function j(a,b,c,d,f){return q=0,b=b||"j",e(a)?i("c"==b?v:u,a,b,this.i++,c,d,f):(p.splice(this.i++,0,a),1==p.length&&h()),this}function k(){var a=B;return a.loader={load:j,i:0},a}var l=b.documentElement,m=a.setTimeout,n=b.getElementsByTagName("script")[0],o={}.toString,p=[],q=0,r="MozAppearance"in l.style,s=r&&!!b.createRange().compareNode,t=s?l:n.parentNode,l=a.opera&&"[object Opera]"==o.call(a.opera),l=!!b.attachEvent&&!l,u=r?"object":l?"script":"img",v=l?"script":u,w=Array.isArray||function(a){return"[object Array]"==o.call(a)},x=[],y={},z={timeout:function(a,b){return b.length&&(a.timeout=b[0]),a}},A,B;B=function(a){function b(a){var a=a.split("!"),b=x.length,c=a.pop(),d=a.length,c={url:c,origUrl:c,prefixes:a},e,f,g;for(f=0;f<d;f++)g=a[f].split("="),(e=z[g.shift()])&&(c=e(c,g));for(f=0;f<b;f++)c=x[f](c);return c}function g(a,e,f,g,h){var i=b(a),j=i.autoCallback;i.url.split(".").pop().split("?").shift(),i.bypass||(e&&(e=d(e)?e:e[a]||e[g]||e[a.split("/").pop().split("?")[0]]),i.instead?i.instead(a,e,f,g,h):(y[i.url]?i.noexec=!0:y[i.url]=1,f.load(i.url,i.forceCSS||!i.forceJS&&"css"==i.url.split(".").pop().split("?").shift()?"c":c,i.noexec,i.attrs,i.timeout),(d(e)||d(j))&&f.load(function(){k(),e&&e(i.origUrl,h,g),j&&j(i.origUrl,h,g),y[i.url]=2})))}function h(a,b){function c(a,c){if(a){if(e(a))c||(j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}),g(a,j,b,0,h);else if(Object(a)===a)for(n in m=function(){var b=0,c;for(c in a)a.hasOwnProperty(c)&&b++;return b}(),a)a.hasOwnProperty(n)&&(!c&&!--m&&(d(j)?j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}:j[n]=function(a){return function(){var b=[].slice.call(arguments);a&&a.apply(this,b),l()}}(k[n])),g(a[n],j,b,n,h))}else!c&&l()}var h=!!a.test,i=a.load||a.both,j=a.callback||f,k=j,l=a.complete||f,m,n;c(h?a.yep:a.nope,!!i),i&&c(i)}var i,j,l=this.yepnope.loader;if(e(a))g(a,0,l,0);else if(w(a))for(i=0;i (function(w,d,s,l,i){w[l]=w[l]||[];w[l].push({'gtm.start':new Date().getTime(),event:'gtm.js'});var f=d.getElementsByTagName(s)[0];var j=d.createElement(s);var dl=l!='dataLayer'?'&l='+l:'';j.src='//www.googletagmanager.com/gtm.js?id='+i+dl;j.type='text/javascript';j.async=true;f.parentNode.insertBefore(j,f);})(window,document,'script','dataLayer','GTM-P4HH5NV'); Skip to main content Home About Submit ALERTS / RSS Search for this keyword Advanced Search Generalizing population RT-qPCR cycle threshold values-informed estimation of epidemiological dynamics: Impact of surveillance practices and pathogen variability Yun Lin , View ORCID Profile James A. Hay , Yu Meng , View ORCID Profile Benjamin J Cowling , Bingyi Yang doi: https://doi.org/10.1101/2025.05.22.25328079 Yun Lin 1 WHO Collaborating Centre for Infectious Disease Epidemiology and Control, School of Public Health, Li Ka Shing Faculty of Medicine, The University of Hong Kong , Hong Kong Special Administrative Region, China Find this author on Google Scholar Find this author on PubMed Search for this author on this site James A. Hay 2 Pandemic Sciences Institute, Nuffield Department of Medicine, University of Oxford , Oxford, United Kingdom Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for James A. Hay Yu Meng 1 WHO Collaborating Centre for Infectious Disease Epidemiology and Control, School of Public Health, Li Ka Shing Faculty of Medicine, The University of Hong Kong , Hong Kong Special Administrative Region, China Find this author on Google Scholar Find this author on PubMed Search for this author on this site Benjamin J Cowling 1 WHO Collaborating Centre for Infectious Disease Epidemiology and Control, School of Public Health, Li Ka Shing Faculty of Medicine, The University of Hong Kong , Hong Kong Special Administrative Region, China 3 Laboratory of Data Discovery for Health Limited , Hong Kong Science and Technology Park, New Territories, Hong Kong Special Administrative Region, China Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Benjamin J Cowling Bingyi Yang 1 WHO Collaborating Centre for Infectious Disease Epidemiology and Control, School of Public Health, Li Ka Shing Faculty of Medicine, The University of Hong Kong , Hong Kong Special Administrative Region, China Find this author on Google Scholar Find this author on PubMed Search for this author on this site For correspondence: byyang{at}connect.hku.hk Abstract Full Text Info/History Metrics Supplementary material Data/Code Preview PDF Abstract Population-level viral load distributions, measured by RT-qPCR or qPCR cycle threshold (Ct) values from surveillance testing, can be used to estimate the time-varying reproductive number ( R t ) in real-time during COVID-19 outbreaks. However, it remains unclear whether this approach can be broadly applied to other pathogens, sources of virologic test data, or surveillance strategies beyond those used during the pandemic, such as in Hong Kong. We systematically evaluated the accuracy of Ct-based R t estimates using simulated epidemics under different surveillance testing systems and pathogen viral kinetics. Using area under the ROC curve (AUC) to assess accuracy in detecting epidemic growth or decline, we found that case ascertainment rates minimally impacted estimation accuracy, except when detection was heavily biased towards severe patients (AUC: 0.64, 95% CIs: 0.59 - 0.71) or during prolonged waves with stable R t near one (AUC: 0.54, 0.48 - 0.64), compared to stable detection patterns over time (AUC 0.76, 0.66 - 0.82). We further examined the impact of pathogen viral kinetics by comparing model accuracies across four hypothesized temporal relations between viral peak and onset by parameterizing our model using data from six respiratory pathogens, including SARS-CoV-2 variants, SARS-CoV-1, and influenza A. We found that accurate model performance largely depends on a monotonic viral shedding trajectory following case detection. A pathogen that lacks such shedding pattern – for example, those with a viral peak after onset – exhibited lower accuracy (AUC: 0.58, 0.49 - 0.65). Our findings suggest that the Ct-based R t estimation method is resilient to various surveillance and pathogen-related factors, provided there are temporal variations in both epidemic and population viral distributions, making it a useful tool for timely transmission monitoring and future disease control efforts. Author summary Population viral load distributions, often approximated by cycle threshold (Ct) values from RT-qPCR testing, have proven valuable for real-time estimation of transmission rates, enhancing situational awareness during the COVID-19 pandemic. However, a comprehensive framework for applying Ct-based methods in other epidemiological contexts, such as varying levels of surveillance coverage or different circulating pathogens/variants, has yet to be developed. In this study, we evaluated the strengths and limitations of Ct-based epidemic surveillance approaches by simulating a range of scenarios with diverse surveillance coverage reflecting real-life outbreaks and carefully calibrating pathogen viral kinetics using real-world parameters. Our findings underscore the critical surveillance and pathogen characteristics that should be considered in future implementations of the method. Introduction Monitoring infectious disease transmission is important for implementing effective public health measures and timely assessment of the effectiveness of interventions. The time-varying effective reproductive number ( R t ), defined as the expected number of secondary infections per infectious individual, has been widely used to monitor community transmission, especially during the COVID-19 pandemic( 1 - 3 ). Conventionally, R t estimates rely on statistical models applied to time series of reported case counts (i.e., the incidence-based method), which suffers unavoidable delays due to the time between infection, symptom development, diagnosis and reporting( 4 , 5 ). To provide an alternative method for real-time R t estimation, inference models have integrated population-level viral load data measured through cycle threshold (Ct) values from reverse-transcription quantitative polymerase chain reaction (RT-qPCR)( 6 , 7 ). This approach, validated in simulations using random Ct samples( 6 ) and applied in Hong Kong’s epidemic waves with symptom and contact-tracing-based surveillance( 7 ), leverages Ct value data to provide insights into transmission dynamics. However, factors such as changes in surveillance practices, including the proportion of detected cases, and testing capacity, reasons for selecting individuals for testing, and variation in viral kinetics across different pathogens and variants can impact the distribution of viral loads measured in the population, limiting the method’s generalizability. Recent research highlights the value of Ct-based methods in nowcasting and forecasting transmission across regions and SARS-CoV-2 variants including Alpha, Delta and Omicron( 8 - 10 ). Evidence from Hong Kong also demonstrated the method’s accuracy during Omicron waves while emphasizing the impact of significant detection delays on method performance( 11 ). While these findings support the method’s application during epidemic waves with diverse variants and changing population immunity, a systematic evaluation of the method in the context of varying surveillance efforts, or its adaptability to other viruses, remains limited. Considering the potential future risks of outbreaks posed by emerging or re-emerging pathogens( 12 ), it is crucial to examine and refine new surveillance metrics, including Ct-based methods, for future applications. Here, we compared the performance of Ct-based R t estimation methods in simulated scenarios featuring different detection and testing coverage, epidemic characteristics, and pathogen outbreaks with varied viral kinetics, aiming to build a generic framework for incorporating population viral load into R t nowcasting for future application. Results Overview of scenarios and procedures for comparative analysis The Ct-based method estimates R t by training a statistical model to find the relationship between incidence-based R t and Ct value statistics (i.e., mean and skewness). This model is then applied to estimate R t continuously based on measured Ct values each day to achieve real-time estimation of R t ( Fig 1A ). Surveillance coverage, including the proportion of all cases detected and the number of detected cases tested by RT-qPCR, could influence the number of Ct values recorded each day. Meanwhile, variation in viral shedding kinetics of different pathogens and variants could impact individual viral loads at the time of testing. Both surveillance coverage and viral shedding kinetics could potentially affect the population viral load and measured Ct value distributions over time ( Fig 1A ). Download figure Open in new tab Fig 1. Overview of data flows used to generate Ct-based Rt and factors potentially affecting distributions of population Ct values. (A) the mechanism of Ct-based Rt illustrated by the relation between transmission dynamics (epidemic trajectory; top left panel) and population viral load distributions (bottom left panels). Correlations between population Ct distributions as indicated by daily mean and skewness are shown in middle panels, with boxes representing the estimated median and interquartile range (IQR) of daily Ct distributions under each interval of the simulation truth Rt , the lower and upper whiskers representing the minimum and maximum estimates and dots for outliers. Temporal transmission dynamics as indicated by Rt estimated using different data are shown in the right panel. Black line and gray shaded area indicate median and 95% credible intervals for incidence-based Rt , pink line and shaded area indicate median and 95% confidence intervals for Ct-based, while red line indicate simulation truth (i.e., the real transmission rates under simulation). Area under the receiver operator characteristics curve (AUC) is used to evaluate estimation accuracy, with the AUC for Ct-based Rt compared to the simulation truth over training and testing periods denoted in top-right of the right panel. (B) epidemic trajectories under different detection modes, as examples of varying surveillance sensitivity. Bars show the number of cases, with different colors indicating different case types as denoted in corresponding panels. Red line indicates the trend for simulation truth. (C) viral shedding trajectories for four pathogens (pathogen 1-4) with varying timings of viral peak in relation to illness onset, as the other affecting factor (i.e., pathogen viral kinetics) for model performance. In each panel, 200 infected individuals are randomly selected to demonstrate the shedding trajectory for each pathogen, and each gray line indicates the shedding trajectory of an infected individual. Green and blue vertical dashed lines indicate the median time of onset and viral peak among the 200 selected individuals infected with each of the four pathogens. We simulated two consecutive epidemic waves (Table S1; see Methods ) to evaluate the Ct-based method under different scenarios. Data from the first wave (training period) were used to train the model, which then predicted estimates for the second wave (testing period). We compared testing-period estimation accuracies to access the impact of surveillance coverage and pathogen shedding characteristics on performance ( Fig 1 ). In the first set of simulations, we simulated epidemics of a SARS-CoV-2 ancestral strain-like pathogen while varying surveillance practices, such as the proportion of cases detected and proportion of detected cases who were tested ( Fig 1B ). In the second set, we kept case detection and virologic sampling constant but introduced pathogens or variants with different viral shedding kinetics ( Fig 1C ). Under symptom-based surveillance, only symptomatic individuals are typically detected, and most of these cases undergo RT-qPCR testing with reported Ct values ( Fig 1B ). To explore the impact of surveillance practices, we constructed scenarios with varying virologic testing capacities by adjusting the fraction of detected cases tested from 100% to 30% (scenarios 1-4). We also compared scenarios where the epidemic curve plateaued either due to detection capacity limits (i.e., only able to detect a limited number of cases per day; scenario 5) or because R t remained stable around one due to genuine epidemic dynamics (scenario 6). Additionally, we investigated the impact of detection bias by varying the proportion of detected severe cases relative to non-severe cases, and severe cases typically have longer shedding durations and lower detected Ct values( 13 ). We considered scenarios with and without additional detection delays for these cases (scenarios 7-14) ( Fig 1B ; Table S2). We also examined the impact of viral shedding kinetics by compiling four parameter sets with distinct timings of peak viral load relative to illness onset ( Fig 1C ; see Methods ). Viral shedding parameters for six real-world pathogens, including different variants of SARS-CoV-2 (ancestral strain, Alpha, Delta and Omicron variants), SARS-CoV-1 and influenza A (Table S3; see Methods ), were applied to further elucidate the key pathogen characteristics necessary for accurate estimation. We simulated transmission rates using a susceptible-exposed-infectious-recovered (SEIR) model as the simulation truth, applying varied surveillance and pathogen parameters to generate daily case numbers and associated Ct values for each scenario. Detected cases were used to estimate incidence-based R t , while population-level Ct distributions (summarized by mean and skewness by sampling dates) were used to estimate R t following our previous method( 7 ) (see Methods ). We defined the training period as three weeks before and after the peak case date during the first epidemic wave (day 0-109 after the initial outbreak; see Supplementary Methods ), during which the model was built to estimate Ct-based R t for the testing period (110 days after initial outbreak). We primarily compared Ct-based R t estimates with the simulation truth using the area under the receiver operator characteristic curve (AUC; see Methods ), which evaluates the model’s ability to distinguish between high ( R t ≥1) and low ( R t <1) transmission rates. Additional evaluation metrics, including Spearman’s correlation coefficient ρ and mean absolute percentage error (MAPE), were also used (see Supplementary Methods ). Impact of varying surveillance coverage The Ct-based R t estimation achieved an AUC of 0.76 (95% confidence intervals (CIs): 0.66 - 0.82) during the testing period in scenario 1, which modelled epidemics caused by a SARS-CoV-2 ancestral strain-like pathogen with stable detection and 100% of cases tested with RT-qPCR. Estimation accuracy remained moderate to high even when only 30% of detected cases reported Ct values (scenario 4; AUC = 0.66, 95% CIs: 0.58 – 0.75), or when daily case detection was limited (scenario 5; AUC = 0.74, 95 CIs: 0.65 – 0.81) ( Fig 2 ; Fig S2). Moderate detection bias towards severe cases did not significantly affect accuracy (scenarios 7-9; AUC ranging from 0.75 to 0.76), but delayed detection of severe cases reduced performance (scenarios 12-14 vs. scenarios 8-10) ( Fig 2 ; Fig S2). With strong detection bias (i.e., testing only severe cases), accuracy dropped to an AUC of 0.62 – 0.64 (scenarios 10 and 14), though it remained moderately accurate ( Fig 2 ; Fig S2). Download figure Open in new tab Fig 2. Estimation accuracy for Ct-based Rt during the testing period in different scenarios of surveillance sensitivity. (A) estimation accuracy for Ct-based Rt as compared to the simulation truth and evaluated by AUC over the testing period in each scenario. Points and vertical lines show median and interval estimates of the AUC over 100 times of bootstrapping (see Methods), with the interval estimates taken as the 2.5 and 97.5 percentiles of all 100 estimated AUC values during bootstrapping. (B) brief summary of each scenario in terms of surveillance-related factors that can affect model performance, as illustrated in Fig 1A . More detailed description of each scenario can be found in Table S2. Estimation accuracy varied according to the underlying cause of an observed flattened epidemic curve. When the plateau resulted from limited detection (scenario 5), the Ct-based R t estimate accuracy remained high (AUC = 0.74, 95% CIs: 0.60 – 0.82). In contrast, during a genuine low transmission period (scenario 6), accuracy declined significantly (AUC = 0.54, 95% CI: 0.48 – 0.64) ( Fig 2 ). This decrease was supported by lower Spearman’s correlation and higher MAPE (scenario 6 in Fig S3; see Supplementary Methods ). Lower estimation accuracy was typically associated with less variable population Ct values over time, such as observed in low transmission (Fig S4B) and heavily biased scenarios (Fig S4D). Overall, the method performed best during epidemic growth, with both stable (scenario 1) and limited detection (scenario 5) conditions outperforming low transmission scenario (scenario 6) (Fig S5). Although performance improved with increased Ct sample sizes, benefits became marginal beyond 100 samples (Fig S6; see Supplementary Methods ). Impact of distinct viral shedding kinetics We compared the estimation accuracies of four viral shedding kinetics models that differ solely in the timing of their viral load peak relative to illness onset, while keeping peak viral loads and shedding durations similar. The model with an earlier peak than illness onset (pathogen 2) achieved high accuracy (AUC = 0.85, 95% CIs: 0.78 – 0.90), whereas the model with a delayed viral peak than illness onset (pathogen 4) showed much lower accuracy (AUC = 0.58, 95% CIs: 0.49 – 0.65; Fig 3B ). The performance differences are consistent with the relationship between population Ct values and epidemic progression, as pathogens with greater variations in population Ct values during epidemic growth and declines and therefore a clear and linear relationship between population Ct values and epidemic progression tend to yield higher model accuracy ( Fig 3 ; Fig S7). Download figure Open in new tab Fig 3. Impact of pathogen shedding characteristics on estimation accuracy. (A) Summary of epidemic waves in the scenario of stable detection. Black solid line and gray shaded area represents the median and 95% credible intervals of incidence-based Rt , orange bars show daily number of detected cases, and shaded areas with different colors indicate different epidemic periods (increasing epidemic as blue-shaded period 1, epidemic peak as red-shaded period 2, and decreasing epidemic as purple-shaded period 3). (B) estimation accuracies of Ct-based Rt over testing periods for pathogen 1-4 corresponding to examples shown in Fig 1C . Dots and horizontal lines represent median and interval estimates of the AUC over 100 bootstrapped samples(see Methods), with the interval estimates taken as the 2.5 and 97.5 percentiles of all 100 estimated AUC values during bootstrapping. Gray dashed lines in the background mark the minimum and maximum median AUC across the four pathogen scenarios serving as visual reference points for easier comparison. (C-F) trajectories of viral shedding until the time of detection for 200 randomly selected individuals infected with pathogen 1-4 corresponding to examples shown in Fig 1C , and in different epidemic periods as indicated in panel A (left panels: increasing epidemic, period 1; middle panels: epidemic peak, period 2; right panels: decreasing epidemic, period 3). Each line represents the viral shedding trajectory for each individual, and a gray line indicates the trajectory for an individual that is detected after viral peak, while a pink line indicates that for an individual detected before viral peak. The violin plot represents the distribution of the detected Ct values for the 200 randomly selected individuals in each trajectory panel, and the horizontal dashed line represents the median Ct value at detection for individuals infected with each pathogen during the increasing epidemic as a reference for comparing the Ct distributions for each pathogen during different epidemic periods. (C) Shedding trajectories until detection for individuals infected with pathogen 1 whose viral loads peak at day 5 after infection (irrelevant to the timing of symptom onset). (D) Shedding trajectories until detection for individuals infected with pathogen 2 whose viral loads peak 2 days before symptom onset. (E) Shedding trajectories until detection for individuals infected with pathogen 3 whose viral loads peak at symptom onset. (F) Shedding trajectories until detection for individuals infected with pathogen 3 whose viral loads peak 3 days after symptom onset. The varying performance across viral shedding kinetics can be attributed to how well exposure time can be inferred from viral loads. With fixed shedding durations, an earlier viral peak allows a monotonic shedding trajectory for detection under symptom-based surveillance, resulting in a clear relationship between time-since-infection and viral loads that helps distinguish recent versus older infections. Consequently, population Ct values differ significantly between epidemic growth and decline phases, with mean Ct values ranging from 26.1 to 28.7 and skewness ranging from 0.5 to 0.3 at the epidemic peak versus the decreasing phase ( Fig 3D ). Conversely, a delayed viral peak leads to non-monotonic trajectories, increasing the likelihood that recent infections are detected before reaching peak viral load. Consequently, mean Ct values remained around 26 and skewness at 0.5 across epidemic phases, thereby diminishing the signal of transmission dynamics ( Fig 3F ). Application potential for real-world pathogens We further demonstrated the method’s potential across various real-world pathogens and variants. For SARS-CoV-2, the Alpha (AUC = 0.81, 95% CIs: 0.76 – 0.88) and Delta (AUC = 0.82, 95% CIs: 0.76 – 0.90) variants showed higher accuracy than the ancestral strain, likely due to their relatively earlier and higher viral peaks at or before symptom onset. In contrast, Omicron infections initially yielded less favorable performance (AUC = 0.75, 95% CIs: 0.65 – 0.82), likely due to a later viral peak and non-monotonic shedding trajectories post-detection ( Fig 4 ; Fig S8). However, delaying Ct testing by 2-4 days to capture the monotonic phase improved the performance (AUC = 0.84, 95% CIs: 0.78 – 0.89) (Fig S9; see Supplementary Methods ). Download figure Open in new tab Fig 4. Viral shedding trajectories for six real-world pathogens and estimation accuracies of Ct-based Rt over testing periods for these pathogens. (A) viral shedding trajectories of 100 randomly selected individuals infected with each of the six real-world pathogens. Each gray line indicates the shedding trajectory of an infected individual. The dashed vertical line indicates the median time of viral peak for the 100 individuals. Orange dots and horizontal lines represent the median and IQR of the onset time for these individuals (Table S3), while blue dots and lines represent the median and IQR of their detection time (Table S1) (see Methods). (B) estimation accuracies of Ct-based Rt during the testing period for six real-world pathogens. Dots and vertical lines show median and interval estimates of the AUC over 100 times of bootstrapping (see Methods), with the interval estimates taken as the 2.5 and 97.5 percentiles of all 100 estimated AUC values during bootstrapping. For SARS-CoV-1, a reversed relationship between Ct and R t was observed due to distinct shedding dynamics, yet high accuracy was achieved (AUC = 0.88, 95% CIs: 0.82 – 0.92), possibly due to a later viral peak that provided a stable time-dependent signal for inferring exposure ( Fig 4B ; Fig S8). Conversely, influenza A exhibited reduced performance (AUC = 0.61, 95% CIs: 0.53 – 0.69) because its very short shedding duration resulted in consistently low population viral load ( Fig 4 ; Fig S8). Discussion In this study we examined the potential of Ct-based R t estimation methods across different surveillance practices and viral shedding kinetics. Our findings indicate that larger temporal variations in population Ct values yield clearer epidemic signals and more accurate Ct-based R t estimates. These variations are driven more by pathogen shedding kinetics than by surveillance practices, except in cases of heavily detection biased or stagnant epidemics conditions. A monotonic shedding trajectory is crucial for effectively distinguishing recent from older infections, thereby enhancing the model’s ability to capture epidemic phases. By leveraging routinely collected RT-qPCR Ct data, often discarded in surveillance, our framework could offer timely insights into epidemic trends, which can be particularly useful for early outbreak surveillance in the future. Our evaluation across varying surveillance practices identified key factors affecting model performance. As the method relies on the distribution of Ct values rather than absolute case counts, even limited or moderately biased detection can provide informative signals of epidemic changes, as observed during the Omicron waves in Hong Kong( 11 ). However, dramatic shifts, such as a sudden bias in detecting only severe cases, which typically have longer shedding durations and lower Ct values, or delays in detecting these cases, can distort the learned Ct- R t relationship and reduce estimation accuracy( 11 ). Our simulations provide possible explanations in relation to these problems, helping to understand the strengths and caveats of the method for application. We demonstrated that the relationship between population Ct values and R t estimates remain robust when average exposure time can be accurately inferred from viral load data. Pathogens with earlier and higher viral peaks, coupled with moderate shedding durations, exhibit greater temporal variability in Ct values from recent and older infections, thereby enhancing the model performance. In contrast, extremely short shedding duration (as seen in our influenza A example( 14 )) or non-monotonic shedding trajectories (as with the Omicron example( 15 )) limit the ability to estimate time-since-infection, potentially compromising accuracy. Notably, our findings suggested that adjusting the Ct testing window to capture the Omicron’s monotonic shedding phase could improve the performance. While our study focused on applying this methods to human respiratory viruses, the framework could be extended to other pathogens where viral loads correlate with exposure time. For instance, mpox has an incubation period of around 5 days( 16 ), with viral shedding peaking within a week after symptom onset and PCR positivity lasting up to 3 weeks( 17 , 18 ). Since detection typically occurs 3-5 days after onset( 17 ) during the viral proliferation phase, Ct-based estimates may be as accurate as for SARS-CoV-1. In H5N1 outbreaks, prolonged viral shedding in birds( 19 ) could enable reliable R t estimation using Ct values, despite challenges such as species-specific variability and asymptomatic shedding( 19 - 21 ). Although we did not explore these pathogens due to differences in transmission routes and surveillance strategies, our findings imply promising directions for enhancing future surveillance. Although we have analyzed various surveillance practices and circulating pathogens, real-world complexities arise from individuals infected with different virus subtypes or varying immune backgrounds, which influence the viral load distribution. Additionally, shifts in dominant variants across epidemic waves, such as Omicron in Hong Kong( 22 ), may further complicate predictions. Reported viral shedding parameters also differ between studies; for instance, one study( 23 ) found longer influenza A shedding durations than those used in our analysis( 14 , 24 ). However, we believe such heterogeneity has minimal impact on the method’s applicability, as our simulations and observations from epidemic waves in Hong Kong( 11 ) demonstrate that the method remains accurate even under varying severity profiles, viral variants, population immunity, and surveillance intensities. While the method shows suboptimal performance for pathogens with non-monotonic shedding, incorporating a generative or more complex model may help to improve performance by accounting for such shedding characteristics, making the method more applicable in these scenarios. To summarize, our modelling study extends the use of Ct-based R t estimation methods in symptom-based surveillance settings to scenarios with different surveillance practices (e.g., variations in case ascertainment, virologic testing and severity biases), as well as different pathogen viral kinetics. This generic framework identifies key factors affecting the model performance and highlights the value of incorporating viral load data to monitor transmission dynamics and enhance preparedness and response strategies against various infectious threats. Methods Simulation of epidemic waves, detected individuals, and viral loads We used an SEIR model to simulate two consecutive epidemic waves (see Supplementary Methods ). Two consecutive epidemic waves with clear increasing and decreasing phases were simulated, while another scenario (scenario 6) featured a typical first wave and a second wave with R t stable around one using a different set of parameters (Table S1). We focused on symptom-based surveillance, where individuals are detected only if they develop symptoms after infection. Therefore, detection dates occur on or after symptom onset with a detection delay modelled by a gamma distribution (mean: 4.20, SD: 3.14), and these detection dates are used as testing dates for Ct values unless otherwise specified. For the typical scenario of stable case detection similar to the first four COVID-19 waves in Hong Kong( 25 ) (i.e., scenario 1), symptomatic cases were detected at a fixed probability of 25%, with small daily variation introduced as noise (e.g., ±0.5% around the 25% detection probability). Similarly, we synthesized different series of detection and testing probabilities to represent various surveillance modes that may occur in reality, including limited viral testing as well as biased case detection( 26 , 27 ). We explored the impact of testing only small fractions of detected cases (i.e., limited testing capacity) by varying the proportion of detected cases that were tested for Ct values from 100% to 80%, 50% and 30% respectively (scenarios 1-4; Table S2). To recover plateaued epidemic waves caused by different reasons, we constructed a scenario of a second wave plateaued due to limited detection capacity (scenario 5) by restricting the number of detected cases at around 100 during the wave, while we also simulated the other possible scenario with genuinely low transmission (scenario 6) by updating the R t to be stably around one (Table S1-2). During the Omicron waves in Hong Kong, the health system was challenged by the massive number of infected individuals, and severe patients were more likely to be captured and included in the hospital systems, causing certain biases in the surveillance( 22 ). To explore the impact of biased detection similar to this, we considered different case severity profiles and assigned corresponding detection probabilities. Specifically, we assumed 15%, 3% and 2% of cases would develop severe, critical or fatal illness respectively( 28 ), which would lengthen their shedding durations (see Supplementary Methods ) and increase detection probabilities. While symptomatic cases generally have a 25% detection possibility, severe cases would have a 37.5% detection probability (1.5 times the baseline) and mild cases a 20% detection probability (80% of the baseline) in scenarios of biased detection. By varying detection rates for severe cases, the observed severity profile among detected cases would change over time, independent of any actual changes in the pathogen’s genuine severity profile. We constructed scenarios with varying intensities and durations of biased detection (scenarios 7-10), and included scenarios with further delayed detection for severe cases (gamma distribution of mean=6.95, SD=4.12 compared to the original mean of 4.20) in scenarios 11-14 for comparison (Table S1-2). For individual viral loads, we simulated viral load trajectories accounting for variation in observed Ct values each day since infection for infected symptomatic cases using previous method( 7 , 29 ) (see Supplementary Methods ; Table S1). Each infected individual had their Ct values per day since infection and, if detected, would have their corresponding sampled Ct values as the Ct value falling on day k post infection based on their individual Ct trajectories, with k being the time interval between their dates of infection and detection/sampling. Viral shedding parameters for different pathogens To explore the impact of pathogen properties, we compiled four sets of viral shedding kinetics with different timings of viral peak relative to illness onset. Pathogen 1 has a viral peak at day 5 after infection (irrespective of onset), while pathogens 2, 3, and 4 have viral peaks 2 days before, at and 3 days after symptom onset, respectively ( Fig 1C ). We updated the distribution of viral shedding durations to align with the time of infection rather than illness onset to allow more flexible comparisons (see Supplementary Methods ). In symptom-based surveillance settings where individuals are detected and tested only after developing symptoms, this adjustment enabled us to explore variations in the magnitude of detectable viral loads from different pathogens. We used the detection probability (25%) and detection delay distribution (gamma distribution with shape of 1.83 and rate of 0.43) from scenario 1 to generate the daily number of infected and detected cases, applying this to all four pathogens. Consequently, only the Ct values of detected cases and thus the population Ct values would vary across pathogen scenarios. In addition to the four hypothesized time relations between viral peak and illness onset, we also used shedding parameters from the literature for variants of SARS-CoV-2, SARS-CoV-1 and influenza A as real-world examples to demonstrate the applicability of the Ct-based method (see Supplementary Methods ). Similarly, we used the detection probability (25%) and detection delay distribution (gamma distribution with shape of 1.83 and rate of 0.43) from scenario 1 to get daily number of infected and detected cases; however, due to differences in incubation periods and viral shedding parameters, both daily case counts and population Ct values will vary per pathogen scenario. We additionally explored different Ct testing windows for the Omicron scenario by extending Ct testing 2-4 days after case detection (see Supplementary Methods ). Incidence-based and Ct-based R t Incidence-based R t was estimated using the R package EpiNow2( 30 ) (see Supplementary Methods ), while daily distribution of population Ct (by sampling date t) estimated by mean and skewness ( b t ) was used to generate Ct-based R t following our previous method( 7 ): Where ln ( R t ) refers to natural log-transformed incidence-based R t . We first fitted models over different time periods during the first simulated wave as the training period and selected the best-performing period by comparing the adjusted R squared of all options within each scenario (see Supplementary Methods ). The generic characteristics of the best-performing training periods were summarized and such training periods were applied across all scenarios to estimate the Ct-based R t . The predicted Ct-based R t from days 110 onward (i.e., the testing period) were compared with R t from the SEIR model (i.e., simulation truth). The area under the receiver operator characteristic curve (AUC) was used as the primary metric for assessing estimation accuracy, measuring the possibility that the Ct-estimated R t values correctly align with the simulation truth (i.e., both below or above 1). To investigate the uncertainty in sampling Ct values and consequently the accuracy of Ct-based R t estimates, we repeated each scenario 100 times using bootstrapping and calculated the AUC between the estimated Ct-based R t and the simulation truth in each iteration (see Supplementary Methods ). The estimation accuracy for each scenario was summarized by the median, 2.5% and 97.5% quantiles of the AUC across the 100 bootstrapping iterations. All statistical analyses were conducted in R version 4.3.2 (R Development Core Team, 2023). Data availability Parameters for simulations can be found in Methods and Supplementary Materials. All simulation data generated in this study and all codes for analyses will be made available at the GitHub repository ( https://github.com/vanialin/Ct_Rt_generic ). Competing interests BJC consults for AstraZeneca, Fosun Pharma, GSK, Haleon, Moderna, Novavax, Pfizer, Roche, and Sanofi Pasteur. The authors report no other potential conflicts of interest. Acknowledgements This study was supported by the Health and Medical Research Fund from the Health Bureau of the Government of the Hong Kong Special Administrative Region (grant no. 22210552, B.Y.) and by a grant from the Research Grants Council of the Hong Kong Special Administrative Region, China (Project No. T11-705/21-N, B.J.C.) References 1. ↵ Tsang TK , Wu P , Lau EHY , Cowling BJ . Accounting for Imported Cases in Estimating the Time-Varying Reproductive Number of Coronavirus Disease 2019 in Hong Kong . J Infect Dis . 2021 ; 224 ( 5 ): 783 – 7 . OpenUrl PubMed 2. Gostic KM , McGough L , Baskerville EB , Abbott S , Joshi K , Tedijanto C , et al. Practical considerations for measuring the effective reproductive number, Rt . PLoS Comput Biol . 2020 ; 16 ( 12 ): e1008409 . OpenUrl CrossRef PubMed 3. ↵ Cori A , Ferguson NM , Fraser C , Cauchemez S. A new framework and software to estimate time-varying reproduction numbers during epidemics . Am J Epidemiol . 2013 ; 178 ( 9 ): 1505 – 12 . OpenUrl CrossRef PubMed 4. ↵ Kucirka LM , Lauer SA , Laeyendecker O , Boon D , Lessler J. Variation in False-Negative Rate of Reverse Transcriptase Polymerase Chain Reaction–Based SARS-CoV-2 Tests by Time Since Exposure . Annals of Internal Medicine . 2020 ; 173 ( 4 ): 262 – 7 . OpenUrl CrossRef PubMed 5. ↵ Li Q , Guan X , Wu P , Wang X , Zhou L , Tong Y , et al. Early Transmission Dynamics in Wuhan, China, of Novel Coronavirus–Infected Pneumonia . New England Journal of Medicine . 2020 ; 382 ( 13 ): 1199 – 207 . OpenUrl CrossRef PubMed 6. ↵ Hay JA , Kennedy-Shaffer L , Kanjilal S , Lennon NJ , Gabriel SB , Lipsitch M , et al. Estimating epidemiologic dynamics from cross-sectional viral load distributions . Science . 2021 ; 373 ( 6552 ). 7. ↵ Lin Y , Yang B , Cobey S , Lau EHY , Adam DC , Wong JY , et al. Incorporating temporal distribution of population-level viral load enables real-time estimation of COVID-19 transmission . Nat Commun . 2022 ; 13 ( 1 ): 1155 . OpenUrl CrossRef PubMed 8. ↵ Musalkova D , Piherova L , Kwasny O , Dindova Z , Stancik L , Hartmannova H , et al. Trends in SARS-CoV-2 cycle threshold values in the Czech Republic from April 2020 to April 2022 . Sci Rep . 2023 ; 13 ( 1 ): 6156 . OpenUrl PubMed 9. Sharmin M , Manivannan M , Woo D , Sorel O , Auclair JR , Gandhi M , et al. Cross-sectional Ct distributions from qPCR tests can provide an early warning signal for the spread of COVID-19 in communities . Front Public Health . 2023 ; 11 : 1185720 . OpenUrl PubMed 10. ↵ Ahuja V , Bowe T , Warnock G , Pitman C , Dwyer DE . Trends in SARS-CoV-2 cycle threshold (Ct) values from nucleic acid testing predict the trajectory of COVID-19 waves . Pathology . 2024 . 11. ↵ Meng Y , Lin Y , Xiong W , Lau EHY , Ho F , Wong JY , et al. Effective Real-time Transmission Estimations Incorporating Population Viral Load Distributions Amid SARS-CoV-2 Variants and Preexisting Immunity . J Infect Dis . 2025 ; 231 ( 3 ): 684 – 91 . OpenUrl PubMed 12. ↵ Subissi L , Otieno JR , Worp N , Attar Cohen H , Oude Munnink BB , Abu-Raddad LJ , et al. An updated framework for SARS-CoV-2 variants reflects the unpredictability of viral evolution . Nat Med . 2024 ; 30 ( 9 ): 2400 – 3 . OpenUrl CrossRef PubMed 13. ↵ Lin Y , Wu P , Tsang TK , Wong JY , Lau EHY , Yang B , et al. Viral kinetics of SARS-CoV-2 following onset of COVID-19 in symptomatic patients infected with the ancestral strain and omicron BA.2 in Hong Kong: a retrospective observational study . Lancet Microbe . 2023 ; 4 ( 9 ): e722 – e31 . OpenUrl 14. ↵ Carrat F , Vergu E , Ferguson NM , Lemaitre M , Cauchemez S , Leach S , et al. Time lines of infection and disease in human influenza: a review of volunteer challenge studies . Am J Epidemiol . 2008 ; 167 ( 7 ): 775 – 85 . OpenUrl CrossRef PubMed Web of Science 15. ↵ Zhou K , Hu B , Zhao X , Chi H , Pan J , Zheng Y , et al. Longitudinal observation of viral load in patients infected with Omicron variant and its relationship with clinical symptoms . Front Microbiol . 2022 ; 13 : 1037733 . OpenUrl PubMed 16. ↵ Madewell ZJ , Charniga K , Masters NB , Asher J , Fahrenwald L , Still W , et al. Serial Interval and Incubation Period Estimates of Monkeypox Virus Infection in 12 Jurisdictions, United States, May-August 2022 . Emerg Infect Dis . 2023 ; 29 ( 4 ): 818 – 21 . OpenUrl CrossRef PubMed 17. ↵ Adler H , Gould S , Hine P , Snell LB , Wong W , Houlihan CF , et al. Clinical features and management of human monkeypox: a retrospective observational study in the UK . Lancet Infect Dis . 2022 ; 22 ( 8 ): 1153 – 62 . OpenUrl CrossRef PubMed 18. ↵ Kim H , Kwon R , Lee H , Lee SW , Rahmati M , Koyanagi A , et al. Viral load dynamics and shedding kinetics of mpox infection: a systematic review and meta-analysis . J Travel Med . 2023 ; 30 ( 5 ). 19. ↵ Beerens N , Germeraad EA , Venema S , Verheij E , Pritz-Verschuren SBE , Gonzales JL . Comparative pathogenicity and environmental transmission of recent highly pathogenic avian influenza H5 viruses . Emerg Microbes Infect . 2021 ; 10 ( 1 ): 97 – 108 . OpenUrl PubMed 20. Ellis TM , Bousfield RB , Bissett LA , Dyrting KC , Luk GS , Tsim ST , et al. Investigation of outbreaks of highly pathogenic H5N1 avian influenza in waterfowl and wild birds in Hong Kong in late 2002 . Avian Pathol . 2004 ; 33 ( 5 ): 492 – 505 . OpenUrl CrossRef PubMed Web of Science 21. ↵ Moreno A , Bonfante F , Bortolami A , Cassaniti I , Caruana A , Cottini V , et al. Asymptomatic infection with clade 2.3.4.4b highly pathogenic avian influenza A(H5N1) in carnivore pets, Italy, April 2023 . Euro Surveill . 2023 ; 28 ( 35 ). 22. ↵ Wong JY , Cheung JK , Lin Y , Bond HS , Lau EHY , Ip DKM , et al. Intrinsic and Effective Severity of Coronavirus Disease 2019 Cases Infected With the Ancestral Strain and Omicron BA.2 Variant in Hong Kong . J Infect Dis . 2023 ; 228 ( 9 ): 1231 – 9 . OpenUrl PubMed 23. ↵ Ip DK , Lau LL , Leung NH , Fang VJ , Chan KH , Chu DK , et al. Viral Shedding and Transmission Potential of Asymptomatic and Paucisymptomatic Influenza Virus Infections in the Community . Clin Infect Dis . 2017 ; 64 ( 6 ): 736 – 42 . OpenUrl CrossRef PubMed 24. ↵ Ng S , Lopez R , Kuan G , Gresh L , Balmaseda A , Harris E , et al. The Timeline of Influenza Virus Shedding in Children and Adults in a Household Transmission Study of Influenza in Managua, Nicaragua . Pediatr Infect Dis J . 2016 ; 35 ( 5 ): 583 – 6 . OpenUrl CrossRef PubMed 25. ↵ Yang B , Tsang TK , Gao H , Lau EHY , Lin Y , Ho F , et al. Universal Community Nucleic Acid Testing for Coronavirus Disease 2019 (COVID-19) in Hong Kong Reveals Insights Into Transmission Dynamics: A Cross-Sectional and Modeling Study . Clin Infect Dis . 2022 ; 75 ( 1 ): e216 – e23 . OpenUrl PubMed 26. ↵ Bosonkie M , Egbende L , Namale A , Fawole OI , Seck I , Kizito S , et al. Improving testing capacity for COVID-19: experiences and lessons from Senegal, Uganda, Nigeria, and the Democratic Republic of Congo . Front Public Health . 2023 ; 11 : 1202966 . OpenUrl PubMed 27. ↵ Seidu AA , Hagan JE , Jr. , Ameyaw EK , Ahinkorah BO , Schack T. The role of testing in the fight against COVID-19: Current happenings in Africa and the way forward . Int J Infect Dis . 2020 ; 98 : 237 – 40 . OpenUrl PubMed 28. ↵ Wu Z , McGoogan JM . Characteristics of and Important Lessons From the Coronavirus Disease 2019 (COVID-19) Outbreak in China: Summary of a Report of 721Z314 Cases From the Chinese Center for Disease Control and Prevention . Jama . 2020 ; 323 ( 13 ): 1239 – 42 . OpenUrl CrossRef PubMed 29. ↵ Quilty BJ , Clifford S , Hellewell J , Russell TW , Kucharski AJ , Flasche S , et al. Quarantine and testing strategies in contact tracing for SARS-CoV-2: a modelling study . Lancet Public Health . 2021 ; 6 ( 3 ): e175 – e83 . OpenUrl 30. ↵ Abbott S , Hellewell J , Thompson R , Sherratt K , Gibbs H , Bosse N , et al. Estimating the time-varying reproduction number of SARS-CoV-2 using national and subnational case counts [version 2; peer review: 1 approved with reservations] . Wellcome Open Research . 2020 ; 5 ( 112 ). View the discussion thread. Back to top Previous Next Posted May 22, 2025. Download PDF Supplementary Material Data/Code Email Thank you for your interest in spreading the word about medRxiv. NOTE: Your email address is requested solely to identify you as the sender of this article. Your Email * Your Name * Send To * Enter multiple addresses on separate lines or separate them with commas. You are going to email the following Generalizing population RT-qPCR cycle threshold values-informed estimation of epidemiological dynamics: Impact of surveillance practices and pathogen variability Message Subject (Your Name) has forwarded a page to you from medRxiv Message Body (Your Name) thought you would like to see this page from the medRxiv website. Your Personal Message CAPTCHA This question is for testing whether or not you are a human visitor and to prevent automated spam submissions. Share Generalizing population RT-qPCR cycle threshold values-informed estimation of epidemiological dynamics: Impact of surveillance practices and pathogen variability Yun Lin , James A. Hay , Yu Meng , Benjamin J Cowling , Bingyi Yang medRxiv 2025.05.22.25328079; doi: https://doi.org/10.1101/2025.05.22.25328079 Share This Article: Copy Citation Tools Generalizing population RT-qPCR cycle threshold values-informed estimation of epidemiological dynamics: Impact of surveillance practices and pathogen variability Yun Lin , James A. Hay , Yu Meng , Benjamin J Cowling , Bingyi Yang medRxiv 2025.05.22.25328079; doi: https://doi.org/10.1101/2025.05.22.25328079 Citation Manager Formats BibTeX Bookends EasyBib EndNote (tagged) EndNote 8 (xml) Medlars Mendeley Papers RefWorks Tagged Ref Manager RIS Zotero Tweet Widget Facebook Like Google Plus One Subject Area Infectious Diseases (except HIV/AIDS) Subject Areas All Articles Addiction Medicine (569) Allergy and Immunology (863) Anesthesia (300) Cardiovascular Medicine (4442) Dentistry and Oral Medicine (444) Dermatology (383) Emergency Medicine (609) Endocrinology (including Diabetes Mellitus and Metabolic Disease) (1510) Epidemiology (15230) Forensic Medicine (30) Gastroenterology (1126) Genetic and Genomic Medicine (6609) Geriatric Medicine (668) Health Economics (998) Health Informatics (4542) Health Policy (1370) Health Systems and Quality Improvement (1613) Hematology (543) HIV/AIDS (1266) Infectious Diseases (except HIV/AIDS) (15923) Intensive Care and Critical Care Medicine (1103) Medical Education (623) Medical Ethics (147) Nephrology (668) Neurology (6607) Nursing (346) Nutrition (999) Obstetrics and Gynecology (1146) Occupational and Environmental Health (957) Oncology (3337) Ophthalmology (974) Orthopedics (369) Otolaryngology (420) Pain Medicine (436) Palliative Medicine (130) Pathology (664) Pediatrics (1693) Pharmacology and Therapeutics (692) Primary Care Research (712) Psychiatry and Clinical Psychology (5448) Public and Global Health (9237) Radiology and Imaging (2202) Rehabilitation Medicine and Physical Therapy (1370) Respiratory Medicine (1196) Rheumatology (596) Sexual and Reproductive Health (714) Sports Medicine (530) Surgery (712) Toxicology (99) Transplantation (289) Urology (265) (function(){function c(){var b=a.contentDocument||a.contentWindow.document;if(b){var d=b.createElement('script');d.innerHTML="window.__CF$cv$params={r:'a019507639e9aa64',t:'MTc3OTc2MjE2OQ=='};var a=document.createElement('script');a.src='/cdn-cgi/challenge-platform/scripts/jsd/main.js';document.getElementsByTagName('head')[0].appendChild(a);";b.getElementsByTagName('head')[0].appendChild(d)}}if(document.body){var a=document.createElement('iframe');a.height=1;a.width=1;a.style.position='absolute';a.style.top=0;a.style.left=0;a.style.border='none';a.style.visibility='hidden';document.body.appendChild(a);if('loading'!==document.readyState)c();else if(window.addEventListener)document.addEventListener('DOMContentLoaded',c);else{var e=document.onreadystatechange||function(){};document.onreadystatechange=function(b){e(b);'loading'!==document.readyState&&(document.onreadystatechange=e,c())}}}})();

Text is read by the "Ask this paper" AI Q&A widget below. Extraction quality varies by source — PMC NXML preserves structure cleanly, OA-HTML may include some navigation residue, and OA-PDF can have broken hyphenation. The publisher copy (via DOI) is the canonical version.

My notes (saved in your browser only)

Ask this paper AI returns verbatim quotes from the full text · source: preprint-html

Answers must be backed by verbatim quotes from this paper's full text. Hallucinated quotes are dropped automatically; if no verbatim passage answers the question, we say so. How this works

Citation neighborhood (no data yet)

We don't have any in-corpus citations linked to this paper yet. This is a recent paper (2025) — citers typically take a year or two to land, and the OpenAlex reference graph may still be filling in.

Source provenance

europepmc
last seen: 2026-05-20T01:45:00.602351+00:00