A Tale of Two Models: Linear Regression and Poisson GLM Yield Identical Trends for COVID-19 Mortality in Italy

preprint OA: closed CC-BY-NC-ND-4.0
📄 Open PDF Full text JSON View at publisher
Full text 66,159 characters · extracted from preprint-html · click to expand
A Tale of Two Models: Linear Regression and Poisson GLM Yield Identical Trends for COVID-19 Mortality in Italy | medRxiv /* */ /* */ <!-- <!-- /*! * yepnope1.5.4 * (c) WTFPL, GPLv2 */ (function(a,b,c){function d(a){return"[object Function]"==o.call(a)}function e(a){return"string"==typeof a}function f(){}function g(a){return!a||"loaded"==a||"complete"==a||"uninitialized"==a}function h(){var a=p.shift();q=1,a?a.t?m(function(){("c"==a.t?B.injectCss:B.injectJs)(a.s,0,a.a,a.x,a.e,1)},0):(a(),h()):q=0}function i(a,c,d,e,f,i,j){function k(b){if(!o&&g(l.readyState)&&(u.r=o=1,!q&&h(),l.onload=l.onreadystatechange=null,b)){"img"!=a&&m(function(){t.removeChild(l)},50);for(var d in y[c])y[c].hasOwnProperty(d)&&y[c][d].onload()}}var j=j||B.errorTimeout,l=b.createElement(a),o=0,r=0,u={t:d,s:c,e:f,a:i,x:j};1===y[c]&&(r=1,y[c]=[]),"object"==a?l.data=c:(l.src=c,l.type=a),l.width=l.height="0",l.onerror=l.onload=l.onreadystatechange=function(){k.call(this,r)},p.splice(e,0,u),"img"!=a&&(r||2===y[c]?(t.insertBefore(l,s?null:n),m(k,j)):y[c].push(l))}function j(a,b,c,d,f){return q=0,b=b||"j",e(a)?i("c"==b?v:u,a,b,this.i++,c,d,f):(p.splice(this.i++,0,a),1==p.length&&h()),this}function k(){var a=B;return a.loader={load:j,i:0},a}var l=b.documentElement,m=a.setTimeout,n=b.getElementsByTagName("script")[0],o={}.toString,p=[],q=0,r="MozAppearance"in l.style,s=r&&!!b.createRange().compareNode,t=s?l:n.parentNode,l=a.opera&&"[object Opera]"==o.call(a.opera),l=!!b.attachEvent&&!l,u=r?"object":l?"script":"img",v=l?"script":u,w=Array.isArray||function(a){return"[object Array]"==o.call(a)},x=[],y={},z={timeout:function(a,b){return b.length&&(a.timeout=b[0]),a}},A,B;B=function(a){function b(a){var a=a.split("!"),b=x.length,c=a.pop(),d=a.length,c={url:c,origUrl:c,prefixes:a},e,f,g;for(f=0;f<d;f++)g=a[f].split("="),(e=z[g.shift()])&&(c=e(c,g));for(f=0;f<b;f++)c=x[f](c);return c}function g(a,e,f,g,h){var i=b(a),j=i.autoCallback;i.url.split(".").pop().split("?").shift(),i.bypass||(e&&(e=d(e)?e:e[a]||e[g]||e[a.split("/").pop().split("?")[0]]),i.instead?i.instead(a,e,f,g,h):(y[i.url]?i.noexec=!0:y[i.url]=1,f.load(i.url,i.forceCSS||!i.forceJS&&"css"==i.url.split(".").pop().split("?").shift()?"c":c,i.noexec,i.attrs,i.timeout),(d(e)||d(j))&&f.load(function(){k(),e&&e(i.origUrl,h,g),j&&j(i.origUrl,h,g),y[i.url]=2})))}function h(a,b){function c(a,c){if(a){if(e(a))c||(j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}),g(a,j,b,0,h);else if(Object(a)===a)for(n in m=function(){var b=0,c;for(c in a)a.hasOwnProperty(c)&&b++;return b}(),a)a.hasOwnProperty(n)&&(!c&&!--m&&(d(j)?j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}:j[n]=function(a){return function(){var b=[].slice.call(arguments);a&&a.apply(this,b),l()}}(k[n])),g(a[n],j,b,n,h))}else!c&&l()}var h=!!a.test,i=a.load||a.both,j=a.callback||f,k=j,l=a.complete||f,m,n;c(h?a.yep:a.nope,!!i),i&&c(i)}var i,j,l=this.yepnope.loader;if(e(a))g(a,0,l,0);else if(w(a))for(i=0;i (function(w,d,s,l,i){w[l]=w[l]||[];w[l].push({'gtm.start':new Date().getTime(),event:'gtm.js'});var f=d.getElementsByTagName(s)[0];var j=d.createElement(s);var dl=l!='dataLayer'?'&l='+l:'';j.src='//www.googletagmanager.com/gtm.js?id='+i+dl;j.type='text/javascript';j.async=true;f.parentNode.insertBefore(j,f);})(window,document,'script','dataLayer','GTM-P4HH5NV'); Skip to main content Home About Submit ALERTS / RSS Search for this keyword Advanced Search A Tale of Two Models: Linear Regression and Poisson GLM Yield Identical Trends for COVID-19 Mortality in Italy Marco Roccetti , Giuseppe Cacciapuoti doi: https://doi.org/10.1101/2025.09.11.25335570 Marco Roccetti 1 Department of Computer Science and Engineering, University of Bologna , Bologna, Italy Find this author on Google Scholar Find this author on PubMed Search for this author on this site For correspondence: marco.roccetti{at}unibo.it Giuseppe Cacciapuoti 2 Department of Computer Science and Engineering, University of Bologna , Bologna, Italy Find this author on Google Scholar Find this author on PubMed Search for this author on this site Abstract Full Text Info/History Metrics Data/Code Preview PDF Abstract While it is undisputed that Poisson GLM models represent the gold standard for counting COVID-19 deaths, recent studies have analyzed the seasonal growth and decline trends of these deaths in Italy using a simple segmented linear regression. They found that, despite an overall decreasing trend throughout the entire period analyzed (2021-2025), rising mortality trends from COVID-19 emerged in all summers and winters of the period, though they were more pronounced in winter. The technical reasons for the general unsuitability of using linear regression for the precise counting of deaths are well-known. Nevertheless, the question remains whether, under certain circumstances, the use of linear regression can provide a valid and useful tool in a specific context, for example, to highlight the slopes of seasonal growth/decline in deaths more quickly and clearly. Given this background, this paper presents a comparison between the use of linear regression and a Poisson GLM model with the aforementioned death data, leading to the following conclusions. Appropriate statistical hypothesis testing procedures have demonstrated that the conditions of a normal distribution of residuals, their homoscedasticity, and the lack of autocorrelation were essentially guaranteed in this particular Italian case (weekly COVID-19 deaths in Italy, from 2021 to 2025) with very rare exceptions, thus ensuring an acceptable performance of linear regression. This was further confirmed by the development of a Poisson GLM model, which showed: a) a 100% correspondence with the linear regression model in identifying the growth or decline trend across all 11 seasonal periods considered; b) that both the simple linear and Poisson models demonstrated a comparable great accuracy in counting COVID-19 deaths, with mean MAE values, per period, respectively of 88.60 and 62.76. Based on an average of approximately 6,630 deaths per period, the Poisson model showed a percentage error of 1.15%, while the linear regression model’s error was just 1.48%. 1. Introduction In the field of statistical modeling, the fundamental premise of a rigorous analysis is the selection of a regression technique that aligns with the inherent characteristics of the data [ 1 ]. This is particularly critical when dealing with count data, which represent discrete, non-negative numbers, such as the number of events occurring over a fixed period. Unlike continuous variables that can take any value, count data are governed by distinct statistical properties. The widely adopted linear regression model, which operates under the assumption that the response variable is normally distributed, is fundamentally illsuited for this type of data. The use of a linear model on count data can lead to serious statistical violations, including heteroscedasticity (non-constant variance) and the potential for predicting nonsensical, negative values, which are anathema to the very nature of counting [ 2 ]. For these reasons, the statistical community has long embraced Generalized Linear Models (GLMs), with Poisson regression standing as the undisputed gold standard for analyzing count data. Poisson GLMs are meticulously designed to accommodate the unique properties of discrete counts by employing a logarithmic link function that connects the linear predictor to the expected value of the counts [ 3 , 4 ]. This ensures that all predictions remain non-negative which is a core reason for the model reliability. The Poisson model’s foundational assumption of equal dispersion (where the mean and variance are equal) makes it the most theoretically sound and widely accepted approach for count-based analysis in fields ranging from epidemiology to economics [ 5 - 7 ]. Despite this established statistical orthodoxy, recent research has explored an unconventional, yet compelling, application of a simpler technique. A recent study broke from convention by applying a segmented linear regression to analyze weekly COVID-19 death counts in Italy [ 8 ]. While statistically unorthodox, this methodology yielded powerful and highly interpretable results. The study, which investigated nine distinct seasonal periods (three winters, three summers, and three intermediate periods between winter and subsequent summer), revealed a clear and consistent pattern: all summers and winters within the analyzed period showed rising mortality trends, with the winter surges being consistently more pronounced, while the intermediate periods exhibited strong downward trends. The true strength of this segmented linear approach laid in its ability to provide a visually impactful and intuitive representation of the mortality dynamics. By fitting straight lines to each seasonal segment, the model offered a clear and easily understandable visualization of the growth and decline rates through the slopes of the lines. This visual simplicity is a significant advantage, as it is often more accessible to a broader audience than the abstract logarithmic or exponential curves inherent in Poisson models. The compelling findings of the initial research prompted a subsequent, confirmatory study to validate the discovered pattern over a (partially) new, extended period [ 9 ]. This work specifically extended the analysis to an entire, continuous year from May 2024 to May 2025 and was specifically designed to verify if the observed seasonal rhythm of growth during summer and winter, followed by a decline in the period from late winter to the end of the subsequent spring, would persist over a completely new 12-month span. This additional analysis, which built upon the techniques developed to analyze the original nine seasonal segments of [ 8 ], provided a more robust and comprehensive view of the phenomenon, demonstrating the durability of the observed COVID-19 mortality cycle and solidifying the linear model potential as a reliable tool for trend identification. Given this background, a critical question comes now to the fore in all its significance: can the use of linear regression, despite its theoretical limitations, be considered an acceptable and even valuable tool in the unique context of seasonal COVID-19 mortality analysis, where its primary goal is to provide a quick and visually impactful representation of seasonal trends? This present paper aims to address this question by presenting a detailed, head-to-head comparison between a linear regression model and a Poisson GLM, using the same comprehensive dataset of Italian COVID-19 deaths from September 2021 to May 2025. The core of our investigation is not to dismiss the statistical rigor of GLMs, but rather to assess whether, under specific empirical conditions, a simpler model can provide comparable predictive power while offering superior interpretability and visual clarity. Our methodology involved two key steps. First, we conducted a series of rigorous statistical hypothesis tests on the linear regression model of [ 8 , 9 ] to ensure its underlying assumptions were met. These tests assessed for the normal distribution of residuals, homoscedasticity (constant variance), and the absence of autocorrelation. Our findings reveal that, with very rare exceptions, these conditions were largely satisfied in this particular dataset, suggesting that the use of linear regression was indeed statistically tenable. Second, we developed a Poisson GLM on the same data to directly compare its performance against the linear model. The results were remarkable: a) the Poisson model showed a 100% correspondence with the linear regression model in identifying the growth or decline trend across all eleven sub-periods (the nine from the original study plus the two additional seasons from the 2024/2025 period). Furthermore, both models demonstrated a comparable high level of accuracy in predicting death counts. The mean absolute error (MAE) for the linear model was 88.60, while the Poisson model MAE was 62.76. Based on an average of approximately 6,300 deaths per period, this translates to a relative error of only 1.48% for the linear model and 1.15% for the Poisson model. These results have suggested that, in the context of analyzing Italian COVID-19 mortality data over this long period, the two models produced nearly identical outcomes. This finding highlights the practical utility of linear regression for this specific application, particularly for its ability to provide a clear and intuitive visual representation of seasonal trends through the slopes of its fitted lines, which are arguably more effective for communicating the phenomenon than the logarithmic/exponential curves inherent in Poisson models. The remainder of this paper details the statistical procedures, models, and comparisons that led to these conclusions. In particular, in the next Section 2 , we describe the source of the data used in this study and provide a comprehensive summary of all that data presented in tabular format. Furthermore, in the same Section, we provide the foundational information needed to discuss linear and Poisson regression, as well as the necessary background to understand the scope of the statistical tests conducted to verify the normality, homoscedasticity, and non-autocorrelation of residuals. In Section 3 , we present the results obtained, both from the statistical tests and from the Poisson regression. Section 4 , discusses a comparison between the outcomes of the linear and Poisson models, while Section 5 provides the conclusion of the work. 2. Materials and Methods In this Section, we provide all the necessary details on the data and methods used in this study, allowing readers to easily replicate our results. We focused on the time series of Italian COVID-19 death data, which were subjected to various transformations, as described below. 2.1. Sources of COVID-19 Deaths Data For the study of weekly COVID-19 deaths in Italy, all data were sourced from the two certified and currently available repositories within the country. These official sources are: i) the repository maintained by the Italian Civil Protection Department under the Italian Presidency of the Council of Ministers ( https://github.com/pcm-dpc/COVID-19/blob/master/dati-andamento-nazionale ), and ii) the repository maintained by the Italian Ministry of Health ( https://www.salute.gov.it/new/it/tema/covid-19/report-set-timanali-covid-19/ ). These same data were used in our previous studies [ 8 , 9 ] and cover a total of weeks of weekly COVID-19 deaths, spanning from September 23, 2021, to May 21, 2025. While the aforementioned are the primary sources, to make this study independently comprehensible, the time series of these weekly deaths, along with other relevant information, is also presented in a tabular format in the following Sections. 2.2. Linear Regression Fit to COVID-19 Deaths Data We here summarize the results of fitting a linear regression model to the 210 weeks of COVID-19 death data from September 2021 to May 2025 mentioned above. The detailed findings were previously described in papers [ 8 , 9 ], nonetheless the general principle behind this fitting procedure was to follow the trends of growth and decline in the historical time series of weekly deaths by dividing the entire period into seasonal segments. For each segment, the linear regression model identified the corresponding growth or decline trend, which is best expressed by the slope of the corresponding segment. This slope is captured by the well-known parameter β 1 in the classic linear regression equation [ 10 ]: It is important to note that the definition of these seasonal segments was not strictly based on astronomical seasons. The segments were slightly adjusted, either lengthened or shortened, to better fit the regression lines, with the goal of keeping the goodness-of-fit, measured by the R 2 parameter, around a 70% threshold on average. This approach allowed us to more accurately model the specific growth and decline phases of the pandemic throughout the analyzed period, yielding a total of nine seasonal segments. To briefly summarize the main findings obtained by applying this procedure in [ 8 ], it should be recalled that the linear regression model has demonstrated that, throughout the examined three-year period (late 2021 to late 2024) dominated by the Omicron and post-Omicron variants: i) the overall trend of weekly COVID-19 mortality was in decline, yet ii) there were notable increases in deaths during all winters and summers. These rising mortality variations were more pronounced in winter than in summer. Conversely, deaths were less frequent in the intermediate periods between winter and summer. This study, therefore, concluded that essentially, although the general downward trend of COVID-19 mortality in Italy was favorable, transient rises in mortality occurred in both winter and summer but were largely offset by the consistent downward drifts during the intermediate seasons. To further confirm these, in some respects, surprising results, particularly the ascending mortality trends in summer in addition to winter, a subsequent study was conducted to examine an entire year, from May 2024 to May 2025, using the same segmented linear regression model of [ 8 ]. This later study [ 9 ] also confirmed the ascending mortality trend, which began in summer, or late spring, and connected with the upward trend of autumn and the following winter. The trend then started to decline substantially from mid-winter all the way through spring. This descending period was precisely what had been identified as the intermediate period in the previously mentioned work [ 8 ]. Specifically, these two additional seasonal segments began and ended on dates May 16, 2024 and November 14, 2024, and November 21, 2024 and May 21, 2025, respectively, for a total duration of 53 weeks, thus constituting two new seasonal segments for study to be added to the previous 9, for a total of 11. Table 1 summarizes these 11 periods, showing their duration in weeks, start and end dates, and season type. View this table: View inline View popup Download powerpoint Table 1. The 11 segments identified in Italy in the period from September 2021 to May 2025 with their seasonal connotation provided by the linear regression model of [ 8 , 9 ]. The following four Tables (2-5) provide a concise yet comprehensive overview of the data and results from the two previous studies [ 8 , 9 ] over more than 210 weeks. The extensive time frame, spanning from September 2021 to May 2025, has been divided into four consecutive macro-periods (macro-periods 1, 2 3 and 4). Each macro-period 1-3 encompasses an autumn-winter phase (Winter), an intermediate phase (Intermediate), and the subsequent summer (Summer). For each macro-period, we presents in the second column of each Table the raw weekly COVID-19 death data. The subsequent columns of each Table provide the corresponding regression results, including the type of season, the ascending or descending trend identified by the regression, along with the β 1 coefficient, the point-estimate prediction (in terms of weekly deaths) provided by the linear regression model, and the residual, that is the difference between the actual and estimated death values. The residual’s sign is positive for overestimation and negative for underestimation. In summary, macro-period 1 ( Table 2 ): from September 23, 2021, to August 18, 2022, 48 weeks; macro-period 2 ( Table 3 ): from August 26, 2022, to September 7, 2023, 55 weeks; macro-period 3 ( Table 4 ): from September 14, 2023, to September 19, 2024, 54 weeks. View this table: View inline View popup Table 2. Macro-period 1 (September 23, 2021, to August 18, 2022). 48 consecutive weeks of COVID-19 deaths in Italy plus segmented linear regression results, including: Season type, Identified seasonal trend of growth (>) or decline (<) and segment slope β 1 , Predictions, Residuals. View this table: View inline View popup Table 3. Macro-period 2 (August 26, 2022, to September 7, 2023). 55 consecutive weeks of COVID-19 deaths in Italy plus segmented linear regression results, including: Season type, Identified seasonal trend of growth (>) or decline (<) and segment slope β 1 , Predictions, Residuals. View this table: View inline View popup Table 4. Macro-period 3 (from September 14, 2023, to September 19, 2024). 54 consecutive weeks of COVID-19 deaths in Italy plus segmented linear regression results, including: Season type, Identified seasonal trend of growth (>) or decline (<) and segment slope β 1 , Predictions, Residuals. The final Table 5 details the one-year period from May 2024 to May 2025, as studied in [ 9 ]. This study, also conducted using our linear regression model, aimed to confirm the ascending summer-autumn-winter COVID-19 mortality trend and the subsequent post-winter decline over an annual timeframe. It should be noted that the first 35 weeks of this final macro-period (the fourth) overlap with the third macro-period. For this macro-period 4 as well, the second column of Table 5 reports the weekly COVID-19 deaths, while the subsequent columns of Table 5 presents the linear regression model results: the season type, the growth or decline trend of mortality, with the corresponding β 1 values, the prediction values, and the residuals. Hence, the macro-period 4 ( Table 5 ), from May 16, 2024, to May 21, 2025, for a duration of 53 weeks. View this table: View inline View popup Table 5. Macro-period 4 (from May 16, 2024 to May 21, 2025). A full year of COVID-19 deaths in Italy (53 weeks) plus segmented linear regression results, including: Season type, Identified seasonal trend of growth (>) or decline (<), segment slope β 1 , Predictions, Residuals. In the end, not counting the 35-week overlap between macro-periods 3 and 4, the total number of weeks on which the linear regression model was fitted is 210. Of these, 157 were studied in [ 8 ] and 53 in [ 9 ]. 2.3. Statistical Tests for Linear Regression on COVID-19 Mortality Data With the linear regression model applied to the COVID-19 death data series reported in Tables 1 - 4 , and the consequent values of the predictions and residuals, we can now perform a series of statistical tests. These tests, primarily applied to the residuals, that is the difference between predicted values and actually COVID-19 observed deaths, are essential for verifying whether the key conditions for a reliable applicability of a linear regression model have been met. Specifically, these tests check for the normality of the residual distribution, their homoscedasticity and the absence of autocorrelation. The rationale is that we use the following statistical tests to check if the residuals satisfy these conditions, allowing for a safe and valid use of the regression model used in [ 8 , 9 ]. In particular, to test residuals for normality, we used both the Shapiro-Wilk test and the QQ plot procedure. The Shapiro-Wilk test is the principal method used to formally assess whether the residuals of a linear regression model are normally distributed [ 11 ]. The assumption of normality of residuals is crucial for the validity of hypothesis tests and the construction of confidence intervals for the linear model coefficients. This test calculates a statistic W which quantifies how well the sample data aligns with a normal distribution. The null hypothesis of the test is that the residuals are drawn from a normal distribution. A p-value from the test that is greater than a chosen significance level (we have chosen 0.05) indicates that the null hypothesis cannot be rejected, suggesting that the residuals are likely normally distributed. To strengthen the verification of residual normality, a more empirical approach is usually employed, based on the visual inspection of a plot. We are talking about a Q-Q Plot [ 12 ]. A Quantile-Quantile (Q-Q) plot, in fact, provides a visual method for checking the normality of a model’s residuals, serving as an important complement to formal numerical statistical tests. The plot compares the ordered values of the residuals against the theoretical quantiles of a normal distribution. If the residuals are approximately normally distributed, the points on the plot will closely follow a straight diagonal line. Any significant deviation from this straight line or points that fall away from the line suggests that the residuals are not normally distributed, indicating a violation of the assumption. One common convention when using Q-Q plots is also to include a 95% confidence band around the diagonal line. The idea is that if the residuals are indeed normally distributed, the vast majority of the plot’s points should fall within this band. A second fundamental condition for the reliable application of a linear regression model is the homoscedasticity of its residuals. This term refers to the property when the variance of the residuals is constant and uniform across all values of the independent variables. In other words, the spread of the data points around the regression line remains consistent throughout the entire range of predicted values. The violation of this condition, known as heteroscedasticity, renders the standard errors and significance tests unreliable, compromising the model’s conclusions. The Breusch-Pagan test is the specific statistical tool used to verify this condition, detecting whether the variance of the residuals is related to the independent variables [ 13 ]. In particular, the test works calculating an LM statistic which measures if the variance of a linear model’s residuals is constant. It is computed by running an auxiliary regression of the squared residuals on the original independent variables. The statistic is derived from this auxiliary regression’s R 2 and follows a chi-squared distribution. A low p-value (typically < 0.05) for the LM statistic indicates heteroscedasticity, meaning the variance of the residuals is not constant which is exactly the situation we would want to avoid. In the end, for a proper application of linear regression to counting problems, it is also essential to verify that the residuals are not autocorrelated. This serial correlation, where the error term of one observation is related to the next, is a common issue with time-series data, like weekly death counts. Its presence violates a core assumption of linear regression, leading to biased standard errors and unreliable hypothesis tests. This can cause to incorrectly conclude that a predictor is significant. Therefore, checking for auto-correlation is a crucial step to ensure the model’s findings are trustworthy. This verification can be done using ACF and PACF diagrams for autocorrelation. In simple terms, ACF (Autocorrelation Function) and PACF (Partial Autocorrelation Function) correlograms are powerful tools for detecting autocorrelation in the residuals of a regression model, particularly with time-series data [ 14 ]. Autocorrelation occurs when the residuals are not independent of each other. The ACF plot shows the correlation between a time series and its lagged values, helping to identify how long a residual’s effect persists. The PACF plot shows the direct correlation between a residual and its lagged values, after accounting for the influence of intermediate lags. Significant spikes on these plots (both ACF and PACF), extending beyond the confidence bands, are clear indicators of autocorrelation, suggesting the need for a different model or a transformation of the data. 2.4. Developing a Poisson GLM Model for COVID-19 Deaths Data When analyzing weekly COVID-19 death counts, the Poisson Generalized Linear Model (GLM) is often a more suitable choice than linear regression. While linear regression assumes residuals are normally distributed, the Poisson GLM is specifically designed for discrete, non-negative count variables, assuming a Poisson distribution [ 15 - 19 ]. The model uses a link function (the natural logarithm) to transform the nonlinear relationship into a linear form. The model formula, applied to our case with a single time variable, is: Here, Y represents the expected (or predicted) count of deaths, while β 1 is the regression coefficient. This approach produces an exponential curve that better reflects the natural growth and decline phases of COVID-19 deaths. To compare the two models (Poisson vs. Linear), it is then crucial to understand the meaning of β 1 in each. In linear regression, β 1 indicates a constant, additive change in the number of deaths for each new week. For example, a β 1 of K would mean an increase of K deaths every week. In the Poisson model, instead, β 1 represents a change in the logarithm of the expected count. To interpret this in terms of deaths, we need to calculate e β 1 . The result is a multiplicative factor: for instance, an e β 1 of 1.05 indicates a 5% increase in deaths per week. This interpretation naturally aligns very well with the exponential growth and decay rates that characterize pandemics. In closing, to determine which model provides a better seasonal profile, or whether they are ultimately comparable under the specific circumstances of our case, we have taken two approaches. In the first, we checked for any deviations in the seasonal predictions of COVID-19 mortality growth or decline, and their respective β 1 values (of course, after applying the link function in the case of Poisson). As a second check, we directly compared the predictions of the two models using the Mean Absolute Error (MAE). As is well known, MAE measures a model’s predictive accuracy by calculating the average of the absolute differences between predicted Y and observed Ŷ values with the formula: where Y is the actual number of weekly deaths and Ŷ is the predicted count. A lower MAE signifies a more accurate model. By calculating the MAE for both models for each season, we can see which model provides the better fit for the data during that specific seasonal period. 3. Results This Results Section presents two types of achievements from the current study. First, the results related to the application of the various statistical tests mentioned previously to verify if the linear regression model developed in [ 8 , 9 ] could be conducted with the assurance that the statistical assumptions of residual normality, their homoscedasticity, and the absence of autocorrelation were respected. Then, the second part of the results, shows the product of the Poisson regression, showing, for each of the 11 previously identified seasonal segments, the corresponding curves that identify the trend of COVID-19 mortality, along with the corresponding predictions in terms of COVID-19 deaths. 3.1. Results from the Statistical Validation of the Linear Regression Model for COVID-19 Mortality Data in Italy (2021-2025) This part is divided into three types of results from corresponding checks that answer to the three subsequent questions: were the residuals of the linear model applied to the data of interest normally distributed across all 11 seasonal segments considered in the period 2021-2025? Were these residuals homoscedastic? Lastly, were they autocorrelated? First, we provide results of the statical test conducted for checking the residuals normality. The following Table 7 provides the results of the Shapiro-Wilk test on the 11 seasonal segments of interest, listing the W statistic (where it is recalled that the closer it is to 1, the more the hypothesis of residual normality holds), the p-value, and the outcome of the test. View this table: View inline View popup Download powerpoint Table 7. Shapiro-Wilk test results for the normality of residuals of the linear regression model for the seasonal segments in the period 2021 – 2025 ( α = 0.05). What is noteworthy about these results is that either the test confirms the normality of the residuals (7 out of 11 cases), or the p-value, while below the significance threshold, is very close to it, always with W statistic values very near to 1. The four cases of failure of the normality test, due to their configuration, convinced us to plot the corresponding Q-Q plots for all 11 seasonal segments to get a better visual of this situation. The following are therefore four Figures ( Figures 1 to 4 ) that provide the Q-Q plots for all the winter segments of the investigated period ( Figure 1 ), for all the summer segments ( Figure 2 ), and for all the segments of the intermediate periods ( Figure 3 ). Finally, Figure 4 provides the Q-Q plots for the two seasonal segments related to [ 9 ]. Download figure Open in new tab Figure 1. Q-Q Plots with a confidence intervals band of 95% for Winter 2021 (Top), Winter 2022 (Middle), Winter 2023 (Bottom). Download figure Open in new tab Figure 2. Q-Q Plots with a confidence intervals band of 95% for Summer 2022 (Top), Summer 2023 (Middle), Winter 2024 (Bottom). Download figure Open in new tab Figure 3. Q-Q Plots with a confidence intervals band of 95% for Intermediate 2022 (Top), Intermediate 2023 (Middle), Intermediate 2024 (Bottom). Download figure Open in new tab Figure 4. Q-Q Plots with a confidence intervals band of 95% for Summer-Winter 2024/25 (Left) and Extended Spring 2025 (Right). As is easy to infer from a visual analysis of all the 11 Q-Q plots, the plot’s line aligns very well with the graph bisector. Most importantly, apart from three single points respectively in the plots for Winter 21, Intermediate 23 and Intermediate 24, the vast majority of points fall within the 95% confidence interval bands. This demonstrates that, in addition to the decent normality results achieved with the more formal Shapiro-Wilk tests, from a practical numerical standpoint, all 11 seasonal segments exhibit a residual behavior that is almost entirely comparable to normality, with rare exceptions that deviate only slightly, and can therefore be defined as quasi-normal. In conclusion, with 7 cases of normality and 4 very borderline, even if the entire spectrum of the 11 segments cannot be defined as perfectly normal, a situation largely close to normality can be deduced. Therefore, this certainly does not constitute one of the reasons for an unreliable application of the linear regression model. Now it is time to check the homoscedasticity of the residuals produced by the linear regression model applied in [ 8 , 9 ]. For this purpose, we show the results of the Breusch-Pagan tests for all 11 seasonal segments in the following Table 8 , remembering that heter-oscedasticity is the opposite of homoscedasticity. View this table: View inline View popup Download powerpoint Table 8. Breusch-Pagan test results for the heteroscedasticity of residuals of the seasonal segments in the period 2021 – 2025 ( α = 0.05). A quick look at this Table confirms that in 9 out of 11 cases, the residuals of the seasonal segments do not show heteroscedasticity, thus being homoscedastic. For the Intermediate 2024 segment, an additional analysis of the residuals vs. fitted values plot (not reported here for the sake of conciseness) suggests the result is more due to a lack of linearity, rather than true heteroscedasticity. Hence in that case, the outcome is very borderline, almost pointing to quasi-homoscedasticity. The only clear case of heteroscedasticity among the 11 is Winter 2021. Therefore, in the end, one must be very cautious about doubting that the residuals considered constitute a clear situation of heteroscedasticity; rather, the opposite is true. Now let us move on to autocorrelation Figures 5 - 8 display the ACF and PCF correlograms used to test for autocorrelation. The confidence bands, calculated using the Bartlett formula, are at a 95% confidence level. Significant autocorrelation is indicated when multiple points fall outside these bands. Our results show that in all diagrams, the points remain within the confidence bands, suggesting a general absence of autocorrelation. The few exceptions are the first points of each seasonal segment. This is not a sign of a larger issue; it is simply because these initial points serve as the starting point for subsequent trends and are therefore inherently correlated with the following data. Download figure Open in new tab Figure 5. Correlograms for autocorrelation: Winter 2021 (Top-left ACF – Top-right PCF), Winter 2022 (Middle-left ACF – Middle-right PCF), Winter 2023 (Bottom-left ACF – Bottom-right PCF). Download figure Open in new tab Figure 6. Correlograms for autocorrelation: Summer 2022 (Top-left ACF – Top-right PCF), Summer 2023 (Middle-left ACF – Middle-right PCF), Summer 2024 (Bottom-left ACF – Bottom-right PCF). Download figure Open in new tab Figure 7. Correlograms for autocorrelation: Intermediate 2022 (Top-left ACF – Top-right PCF), Intermediate 2023 (Middle-left ACF – Middle-right PCF), Intermediate 2024 (Bottom-left ACF – Bottom-right PCF). Download figure Open in new tab Figure 8. Correlograms for autocorrelation: Summer-Winter 2024-25 (Top-left ACF – Top-right PCF), Extended Spring 2025 (Bottom-left ACF – Bottom-right PCF). We believe it is helpful to the reader to conclude this Section on the results of statistical tests for the correct applicability of a linear regression model for COVID-19 mortality (2021-2025) by providing a summary Table 9 with the outcomes of the tests for all 11 periods studied with respect to the three dimensions of interest (normality, homoscedasticity and absence of autocorrelation). View this table: View inline View popup Download powerpoint Table 9. Summary of testing results for normality, homoscedasticity and absence of autocorrelation of linear regression residuals relative to the 11 seasonal segments of the period 2021 – 2025. 3.2. Results from the GLM Poisson Model for COVID-19 Mortality Data in Italy (2021-2025) We here provide the results of the Poisson GLM model fit to the weekly COVID-19 mortality data for all 11 seasonal segments identified in Section 2 . The results are presented in the form of four Figures (9-12) where: Figure 9 shows the Poisson regression curves for all winter seasonal segments, Figure 10 for all summer seasonal segments, Figure 11 for all intermediate seasonal segments, and finally Figure 12 for the two seasonal segments of the period from May 2024 to May 2025. Download figure Open in new tab Figure 9. GLM Poisson regression curves for Winter segments. Top: Winter 2021, ( Ŷ × (exp( β 1 ) – 1)) = 157.30, Pseudo R 2 = 0.93. Middle: Winter 2022, ( Ŷ × (exp( β 1 ) – 1)) = 23.79, Pseudo R 2 = 0.55. Bottom: Winter 2023, ( Ŷ × (exp( β 1 ) – 1)) = 18.81, Pseudo R 2 = 0.70. Download figure Open in new tab Figure 10. GLM Poisson regression curves for Summer segments. Top: Summer 2022, ( Ŷ × (exp( β 1 ) – 1)) = 57.38, Pseudo R 2 = 0.32. Middle: Summer 2023, ( Ŷ × (exp( β 1 ) – 1)) = 7.33, Pseudo R 2 = 0.45. Bottom: Summer 2024, ( Ŷ × (exp( β 1 ) – 1)) = 8.21, Pseudo R 2 = 064. Download figure Open in new tab Figure 11. GLM Poisson regression curves for Intermediate segments. Top: Intermediate 2022, ( Ŷ × (exp( β 1 ) – 1)) = -84.23, Pseudo R 2 = 0.84. Middle: Intermediate 2023, ( Ŷ × (exp( β 1 ) – 1)) = -18.42, Pseudo R 2 = 0.82. Bottom: Intermediate 2024, ( Ŷ × (exp( β 1 ) – 1)) = -14.35, Pseudo R 2 = 0.90. Download figure Open in new tab Figure 12. GLM Poisson regression curves for the period May 2024 – May 2025. Left: Summer-Winter 2024/25, ( Ŷ × (exp( β 1 ) – 1)) = 4.41, Pseudo R 2 = 0.49. Right: Extended Spring 2025, ( Ŷ × (exp( β 1 ) – 1)) = -1.85, Pseudo R 2 = 0.45. Each Poisson regression curve in the Figures is accompanied by its corresponding ( Ŷ × (exp( β 1 ) – 1)) value which, starting from the β 1 value of the Poisson regression, and applying the transformation with the link function and the average number of deaths for that segment, yields a parameter comparable to the β 1 produced by the linear regression model. Also included in the caption of each Figure is the Pseudo R 2 value which represents the goodness of fit of the model. After showing the Poisson regression curves in the aforementioned Figures, we present in Table 10 the corresponding values of the weekly COVID-19 death forecasts calculated according to the Poisson model. We defer to the Discussion Section a precise comparison between the results of the linear regression and Poisson models. This comprehensive analysis will be based on: a) a comparison of the growth/decline trends of the profiles identified by lines in one model and curves in the other, b) a comparison based on their respective β 1 values, and finally, a numerical comparison of the death forecasts from the two models versus the observed deaths. View this table: View inline View popup Table 10. GLM Poisson regression. Predicted weekly deaths from COVID-19: 2021-2025 (210 weeks/W). Before providing, after the 11 Poisson regression curves, the predicted values of weekly COVID-19 deaths from the Poisson model for all the 11 seasonal segments above, it is impossible not to anticipate, at this point in the treatment, that even with the Poisson model, all three winter curves show an increasing mortality trend, as do the summer curves, albeit less pronounced, while the intermediate periods show a decreasing trend. This is exactly the same type of result provided by the linear regression model in [ 8 ]. Similarly, the growth and decline segments observed in the two periods that make up the timeframe studied in [ 9 ] from May 2024 to May 2025, show the same trends as the Poisson model curves in Figure 12 . Identical statements could be made about the β 1 values of the linear model and the linearized Poisson ones, which show a high degree of coincidence. Now, however, we provide in the Table 10 all the COVID-19 death predictions from the Poisson model for each of the 210 weeks studied. To close this section, which has first shown the results of the statistical validation tests for the applicability of the linear regression model to COVID-19 mortality data in the extensive time segment from September 2021 to May 2025, and then the results of a similar development exercise on the same mortality data for a Poisson GLM model, we reiterate that the first set of results (statistical tests) has substantially confirmed the possibility of applying a linear model to that data without excessive errors. Meanwhile, the results from the Poisson model show a remarkable alignment with the analogous results of the linear model presented in [ 8 , 9 ] from every conceivable angle: in the slopes of the curves for all seasonal segments, in the corresponding β 1 parameters and in the over 200 forecasts. However, we believe it is useful to dedicate an entire Section, the next one, to discussing this comparison, performing it with the precision and accuracy that the topic deserves. 4. Discussion The true core of this present work was to find a confirmation, peacefully accepted by experts, for the somewhat surprising results published in [ 8 , 9 ]. Those results showed that in Italy, during the period 2021-2025, the seasonal profiles of COVID-19 mortality had a growing trend in both winter and summer, with greater emphasis on winter, and then descending profiles in the intermediate period that follows the most central part of winter until late spring. The problem, however, was that those results were obtained by fitting a linear regression model, while it is undeniable that death count problems should be modeled with Poisson or Negative Binomial GLMs. Although there was a rationale behind the use of the linear model, namely, to express the growth and decline trends in a visually clear and unmistakable way, as only straight lines and their slopes can do, those results needed a confirmation that could be fully convincing. This confirmation has been partially obtained with the results of the statistical tests presented in first part of the previous Section 2 , which confirmed that a linear regression model could be applied to that particular time series without committing excessive errors. However, this was not enough, and we developed a more canonical and commonly accepted Poisson GLM model on the same mortality data. The results shown in the second part of Section 2 were confirmatory and surprising afresh. To discuss them better, we first present the summary Table 11 . It takes the 210 observations of COVID-19 deaths in Italy (see columns termed Weekly Deaths of Tables 2 - 5 ), grouped into the 11 seasonal segments subject to the model fitting, and numerically compares them with: i) the predictions of the linear model (see columns termed Prediction of Tables 2 - 5 ) and ii) with the predictions of the Poisson model (shown in Table 10 ), calculating the relative MAE and percentage error, for each comparison. View this table: View inline View popup Download powerpoint Table 11. Comparison between COVID-19 deaths and predictions from linear regression and Poisson regression, with corresponding MAE and percentage errors. Table 11 clearly shows that the MAE of the Poisson regression is only slightly better than that of the linear regression, 62.76 versus 88.60 (the lower the MAE, the more accurate the prediction). If we then look at the percentage errors, we see that the quantity of errors on this huge number of predictions (averaged over the number of deaths per period) is indeed lower with the Poisson model, at exactly 1.15%. However, moving to the linear regression model results in a shift to 1.48%, which is frankly negligible. It is still important to remember, though, that out of the 210 predictions, the linear regression model provided 7 negative values, which, although very few, are obviously forbidden as they are meaningless. An even more interesting comparison is to look at the slopes of the Poisson curves versus the lines of the linear regression model. We have already documented that the trends match 100% across all 11 periods, that is when the linear model shows an ascending trend, so does the Poisson model, and similarly for descending trends. However, a more compelling comparison is between the slopes of the Poisson curves and the lines for each seasonal segment. Table 13 shows the β 1 values of the linear model (second column) for each period and the corresponding linearized β 1 values of the Poisson model (fourth column). It is possible to see that the two series of values are practically identical, with such minimal differences that they do not even warrant being counted. View this table: View inline View popup Download powerpoint Table 12. Comparison between the slopes of the linear model and the Poisson model, with the linearized Poisson β 1 . Ultimately, this is the truly surprising and, we believe, innovative aspect of this study: it has shown that, at least in the limited, yet temporally extended, circumstances analyzed, a simpler and easier-to-understand linear model provides the same results as a Poisson model, especially concerning the seasonal growth and decline trends of the COVID-19 mortality subject of our interest. To conclude, we present Figure 13 which displays the COVID-19 mortality data from 2021 to 2025 with superimposed curves from the Poisson model for each seasonal segment (each distinguished by a different color), along with an inset box showing the linear model lines from study [ 8 ]. This last Figure perfectly exemplifies the overlap of the two models’ results, effectively summarizing the most significant data that has emerged from the current study. Download figure Open in new tab Figure 13. In the big picture, the COVID-19 death data for the entire 2021-2025 period with the Poisson model curves superimposed, with each distinct seasonal segment represented by a different color. In the small inset, an analogous plot with the linear model lines, inspired by [ 8 ]. Of course, we do not forget the limitations of the current study. The first of these, we must remember, is the clear preference for regression models based on Poisson or negative binomial distributions when dealing with count data, given that the case examined here is only a single event, however significant it has been. We also cannot avoid concisely listing a summary of the limitations that concern not so much the modeling discussions conducted so far but those related to the content, namely the observation of COVID-19 mortality during the period of interest. First, this study’s findings are limited to the specific epidemiological context of Italy between September 2021 and May 2025, a period dominated by Omicron and post-Omicron SARS-CoV-2 variants. The results might differ in other periods or geographic locations with different circulating lineages [ 20 ]. Another key limitation with this kind of studies, already discussed at length in [ 8 ], is they deliberately avoid identifying the causes behind the observed seasonal mortality trends. While these trends could be influenced by various factors like climate, social behaviors, immunity levels, and public health measures, the decision was made to focus purely on observing and quantifying the trends themselves [ 21 - 26 ]. This observational approach was chosen due to the unreliability of relevant data during this period, such as vaccination rates and recorded infections. Discussing the causes without reliable data would have been just speculative. Finally, the use of Italian government data presents its own set of limitations. The data, provided as aggregated measures from two different sources, has been subject to corrections and adjustments over time, only recently achieving relative stability. Nevertheless, public thanks must be given to the Italian institutions, because they have still guaranteed, and continue to do so, a constant flow of data that allows independent researchers to continue studying the phenomenon of COVID spread, even in the current times. 5. Conclusions In the field of epidemiological modeling, Poisson GLM models are considered the standard for analyzing count data, such as deaths, and are extensively used in epidemiology and beyond [ 27 - 36 ]. However, our research [ 8 , 9 ] explored the use of a simple linear regression on weekly COVID-19 mortality data in Italy (2021-2025). The results revealed a significant finding: despite a general downward trend, we consistently observed an increase in mortality during both winter and summer. The question we asked in the present paper was whether linear regression could still be a valid tool for highlighting the slopes of these seasonal trends. Our direct comparison with a Poisson GLM model provided convincing answers. The key findings of this current analysis, in fact, have been: As to statistical validity, hypothesis tests confirmed that linear regression was applicable to this specific time series, as its conditions for normality of residuals, homoscedasticity, and lack of autocorrelation were substantially met. As to trend correspondence, there was a 100% alignment between the two models in identifying growth or decline trends across all 11 seasonal periods. Finally, as to accuracy, both models showed exceptional precision in forecasting deaths. The Poisson model had a slightly lower MAE (62.76) compared to the linear one (88.60). In percentage terms, the Poisson model’s error was 1.15%, while the linear regression’s error was just 1.48%, a negligible difference. In conclusion, our current study has shown that in this specific context, a simpler and more visually intuitive linear regression model provided the same results and nearly identical accuracy as the more complex Poisson model. This suggests that, under certain circumstances, linear regression can be an effective tool for understanding mortality trends. Supplementary Materials No further supporting information. Author Contributions Conceptualization, M.R.; methodology, M.R.; software, G.D.; validation, M.R. and G.C.; formal analysis, G.C.; investigation, M.R.; resources, M.R.; data curation, M.R. and G.C.; writing—original draft preparation, M.R.; writing—review and editing, M.R. and E.D.; visualization, G.C.; supervision, M.R.; project administration, M.R.. All authors have read and agreed to the published version of the manuscript. Both authors have contributed substantially to the work reported. Funding This research received no external funding. Institutional Review Board Statement This study uses publicly available, aggregated data that contains no private information. Therefore, ethical approval is not required. Informed Consent Statement Not applicable: Neither humans nor animals nor personal data are involved in this study. Data Availability Statement All the initial COVID-19 deaths data are downloadable from two public, open access repositories, specifically: i) the repository maintained by the Italian Civil Protection Department, under the Italian Presidency of the Council of Ministers ( https://github.com/pcm-dpc/COVID-19/blob/master/dati-andamento-nazionale ), and ii) the repository maintained by the Italian Ministry of Health, ( https://www.salute.gov.it/new/it/tema/covid-19/report-settimanali-covid-19/ ). Moreover, all the data on which both the statistical hypothesis tests and the Poisson regression model are based have been made fully available in Section 2 under a tabular format. All the results of this study are fully reproducible by using the methods described in this paper and the data made available above. Further reasonable requests relative to data and code can be also addressed to the corresponding author (email: marco.roccetti{at}unibo.it ). Conflicts of Interest The authors declare no conflict of interest. Footnotes giuseppe.cacciapuoti{at}studio.unibo.it References 1. ↵ Cameron , A. C. ; Trivedi , P. K . Regression Analysis of Count Data . Cambridge University Press . 1998 , doi: 10.1017/CBO9781139013567 OpenUrl CrossRef 2. ↵ Hilbe , J. M. Modeling Count Data . Cambridge University Press . 2014 , doi: 10.1017/CBO9781139236065 OpenUrl CrossRef 3. ↵ Gardner , W. ; Mulvey , E. P. ; Shaw , E. C . Regression Analyses of Counts and Rates: Poisson, Overdispersed Poisson, and Negative Binomial Models . Psychological Bulletin . 1995 , 118 ( 3 ) , doi: 10.1037/0033-2909.118.3.392 OpenUrl CrossRef PubMed Web of Science 4. ↵ Chan , S. ; Chu , J. ; Zhang , Y. ; Nadarajah , S ., Count regression models for COVID-19 . Physica A: Statistical Mechanics and its Applications . 2021 , 563 : 125460 , doi: 10.1016/j.physa.2020.125460 OpenUrl CrossRef 5. ↵ Schober , P. ; Vetter T.R . Count Data in Medical Research: Poisson Regression and Negative Binomial Regression . Anest Analg . 2021 , 132 ( 5 ) , doi: 10.1213/ANE.0000000000005398 OpenUrl CrossRef PubMed 6. Casini , L. ; Roccetti , M . Reopening Italy’s schools in September 2020: A Bayesian estimation of the change in the growth rate of new SARS-CoV-2 cases . BMJ Open . 2021 , 11 : e051458 , doi: 10.1136/bmjopen-2021-051458 OpenUrl Abstract / FREE Full Text 7. ↵ Cappi , R. ; Casini , L. ; Tosi , D. ; Roccetti , M . Questioning the seasonality of SARS-CoV-2: A Fourier spectral analysis . BMJ Open . 2022 , 12 : e061602 , doi: 10.1136/bmjopen-2022-061602 OpenUrl Abstract / FREE Full Text 8. ↵ Roccetti , M. ; De Rosa , E.M . A Segmented Linear Regression Study of Seasonal Profiles of COVID-19 Deaths in Italy: September 2021–September 2024 . Computation . 2025 , 13 : 165 , doi: 10.3390/computation13070165 OpenUrl CrossRef 9. ↵ Roccetti , M . Seasonal Trends of COVID-19 Deaths in Italy: A Confirmatory Linear Regression Study with Time Series Data from 2024/2025 . MedRxiv . 2025 , doi: 10.1101/2025.05.30.25328619 OpenUrl Abstract / FREE Full Text 10. ↵ Altman , N. ; Krzywinski , M. Simple Linear Regression . Nature Methods . 2015 , 12 , doi: 10.1038/nmeth.3627 OpenUrl CrossRef PubMed 11. ↵ Shapiro , S. S. ; Wilk , M. B . An Analysis of Variance Test for Normality (complete samples) . Biometrika . 1965 , 52 :( 3/4 ) , doi: 10.2307/2333709 OpenUrl CrossRef 12. ↵ Montgomery , D. C. ; Peck , E. A. ; Vining , G. G . Introduction to Linear Regression Analysis (6th ed.) , 2021 . John Wiley & Sons , ISBN: 978-1-119-57872-7 13. ↵ Breusch , T. S. ; Pagan , A. R . A Simple Test for Heteroscedasticity and Random Coefficient Variation . Econometrica . 1979 , 47 ( 5 ) , doi: 10.2307/1911963 OpenUrl CrossRef Web of Science 14. ↵ Hyndman , R. J. ; Athanasopoulos , G . Forecasting: Principles and Practice (3rd ed.) , 2021 . OTexts , ISBN: 978-0987507136 . 15. ↵ Bhaskaran , K. ; Gasparrini , A. ; Hajat , S. ; Smeeth , L. ; Armstrong , B . Time Series Regression Studies in Environmental Epidemiology . International Journal of Epidemiology . 2013 , 42 ( 4 ) , doi: 10.1093/ije/dyt092 OpenUrl CrossRef PubMed Web of Science 16. Casini , L. ; Roccetti , M . A Cross-regional Analysis of the COVID-19 Spread during the 2020 Italian Vacation Period: Results from three Computational Mmodels are Compared . Sensors . 2020 , 20 ( 24 ) , doi: 10.3390/s20247319 BMJ Open, 2021, 11: e051458 , doi: 10.1136/bmjopen-2021-051458 OpenUrl CrossRef 17. Roccetti , M . Drawing a parallel between the trend of confirmed COVID-19 deaths in the winters of 2022/2023 and 2023/2024 in Italy, with a prediction . Mathematical Biosciences and Engineering . 2023 , 21 ( 3 ) , doi: 10.3934/mbe.2024165 OpenUrl CrossRef 18. Tosi , D. ; Campi A , How Data Analytics and Big Data Can Help Scientists in Managing COVID-19 Diffusion: Modeling Study to Predict the COVID-19 Diffusion in Italy and the Lombardy Region . Journal of Medical Internet Research . 2020 , 22 ( 10 ) , doi: 10.2196/21081 OpenUrl CrossRef PubMed 19. ↵ Roccetti , M . Excess mortality and COVID-19 deaths in Italy: A peak comparison study . Mathematical Biosciences and Engineering . 2023 , 20 ( 4 ) , doi: 10.3934/mbe.2023304 OpenUrl CrossRef 20. ↵ D’Amico , F. ; Marmiere , M. ; Righetti , B. ; Scquizzato , T. ; Zangrillo , A. et al. COVID-19 seasonality in temperate countries , Environmental Research , 2022 , 206 ( 15 ) , doi: 10.1016/j.envres.2021.112614 OpenUrl CrossRef 21. ↵ Venturelli , F. ; Mancuso , P. ; Vicentini , M. : Ottone , M. ; Storchi , C. , et al. , High temperature, COVID-19, and mortality excess in the 2022 summer: a cohort study on data from Italian surveillances . Science of The Total Environment , 2023 , Volume 887 , doi: 10.1016/j.scitotenv.2023.164104 OpenUrl CrossRef 22. Chirumbolo , S. ; Pandolfi , S. ; Valdenassi , L . Seasonality of COVID-19 deaths. Did social restrictions and vaccination actually impact the official reported dynamic of COVID-19 pandemic in Italy? Environmental Research . 2022 , Volume 212 , doi: 10.1016/j.envres.2022.11322 OpenUrl CrossRef 23. Fontal , A. ; Bouma , M.J. ; San-José , A. ; Lopez , L. ; Pascual , M. et al. , Climatic signatures in the different COVID-19 pandemic waves across both hemispheres , Nature Computational Science , 2021 , Volume 1 , doi: 10.1038/s43588-021-00136-6 OpenUrl CrossRef PubMed 24. Sera , F. ; Armstrong , B. ; Abbott , S. ; Meakin , S. ; O’Reilly , K. et al. , A cross-sectional analysis of meteorological factors and SARS-CoV-2 transmission in 409 cities across 26 countries . Nature Communications . 2021 , 12 ( 1 ) , doi: 10.1038/s41467-021-25914-8 OpenUrl CrossRef PubMed 25. Wong , C . Why do covid cases rise in summer? New Scientist . 2024 , Volume 263 , doi: 10.1016/S0262-4079(24)01548-3 OpenUrl CrossRef 26. ↵ De Meijere , G. ; Valdano , G. ; Castellano , C. ; Debin , M. ; Kengne-Kuetche , C. et al. , Attitudes towards booster, testing and isolation, and their impact on COVID-19 response in winter 2022/2023 in France, Belgium, and Italy: a cross-sectional survey and modelling study . The Lancet Regional Health – Europe , 2023 , 28 , doi: 10.1016/j.lanepe.2023.100614 OpenUrl CrossRef PubMed 27. ↵ Khajanchi S , Sarkar K , Mondal J , Nisar , K.S. ; Abdelwahab , S.F . Mathematical modeling of the COVID-19 pandemic with intervention strategies . Results in Physics . 2021 , Volume 25 , doi: 10.1016/j.rinp.2021.104285 OpenUrl CrossRef 28. Roccetti , M. ; Marfia , G . TCP at last: reconsidering TCP’s role for wireless entertainment centers at home . IEEE Transactions on Consumer Electronics . 2010 , 56 ( 4 ) , doi: 10.1109/TCE.2010.5681095 OpenUrl CrossRef 29. Roccetti , M. ; Ferretti , S. ; Palazzi , C.E. The brave new world of multiplayer online games: Synchronization issues with smart solutions . 2008 11th IEEE International Symposium on Object and Component-Oriented Real-Time Distributed Computing (ISORC) . 2008 , doi: 10.1109/ISORC.2008.17 OpenUrl CrossRef 30. Ghini , V. ; Panzieri , F. ; Roccetti , M . Client-centered load distribution: A mechanism for constructing responsive web services . Proceedings of the 34th Annual Hawaii International Conference on System Sciences . 2001 , doi: 10.1109/HICSS.2001.927214 OpenUrl CrossRef 31. Morotti , E. ; Stacchio , L. ; Donatiello , L. ; Roccetti , M. ; Tarabelli , J. et al. Exploiting fashion x-commerce through the empowerment of voice in the fashion virtual reality arena . Virtual Reality . 2022 , Volume 26 , doi: 10.1007/s10055-021-00602-6 OpenUrl CrossRef 32. Yang , H. ; Lin , X. ; Li , J. ; Zhai , Y. ; Wu , J ., A Review of Mathematical Models of COVID-19 Transmission . Contemporary Mathematics , 2023 , 4 ( 1 ) , doi: 10.37256/cm.4120232080 OpenUrl CrossRef 33. Hao , B. ; Liu , C. ; Wang , Y. ; Zhu , N. ; Ding , Y. et al. , A mathematical-adapted model to analyze the characteristics for the mortality of COVID-19 . Scientific Reports , 2022 , Volume 12 , doi: 10.1038/s41598-022-09442-z OpenUrl CrossRef 34. James , G. ; Witten , D. ; Hastie , T. ; Tibshirani , R. An Introduction to Statistical learning, with Applications in Python , 2023 , Springer Nature , ISBN: 9783031387470 35. Taljaard , M. ; McKenzie , J.E. ; Ramsay , C.R. ; Grimshaw , J.M . The use of segmented regression in analysing interrupted time series studies: an example in pre-hospital ambulance care . Implementation Science . 2014 , 9 ( 77 ) , doi: 10.1186/1748-5908-9-77 OpenUrl CrossRef PubMed 36. ↵ Ozili , P.K . The acceptable R-square in empirical modelling for social science research . Social Research Methodology and Publishing Results . 2022 , doi: 10.2139/ssrn.4128165 OpenUrl CrossRef View the discussion thread. Back to top Previous Next Posted September 12, 2025. Download PDF Data/Code Email Thank you for your interest in spreading the word about medRxiv. NOTE: Your email address is requested solely to identify you as the sender of this article. Your Email * Your Name * Send To * Enter multiple addresses on separate lines or separate them with commas. You are going to email the following A Tale of Two Models: Linear Regression and Poisson GLM Yield Identical Trends for COVID-19 Mortality in Italy Message Subject (Your Name) has forwarded a page to you from medRxiv Message Body (Your Name) thought you would like to see this page from the medRxiv website. Your Personal Message CAPTCHA This question is for testing whether or not you are a human visitor and to prevent automated spam submissions. Share A Tale of Two Models: Linear Regression and Poisson GLM Yield Identical Trends for COVID-19 Mortality in Italy Marco Roccetti , Giuseppe Cacciapuoti medRxiv 2025.09.11.25335570; doi: https://doi.org/10.1101/2025.09.11.25335570 Share This Article: Copy Citation Tools A Tale of Two Models: Linear Regression and Poisson GLM Yield Identical Trends for COVID-19 Mortality in Italy Marco Roccetti , Giuseppe Cacciapuoti medRxiv 2025.09.11.25335570; doi: https://doi.org/10.1101/2025.09.11.25335570 Citation Manager Formats BibTeX Bookends EasyBib EndNote (tagged) EndNote 8 (xml) Medlars Mendeley Papers RefWorks Tagged Ref Manager RIS Zotero Tweet Widget Facebook Like Google Plus One Subject Area Epidemiology Subject Areas All Articles Addiction Medicine (567) Allergy and Immunology (863) Anesthesia (297) Cardiovascular Medicine (4411) Dentistry and Oral Medicine (443) Dermatology (380) Emergency Medicine (606) Endocrinology (including Diabetes Mellitus and Metabolic Disease) (1505) Epidemiology (15205) Forensic Medicine (30) Gastroenterology (1119) Genetic and Genomic Medicine (6574) Geriatric Medicine (666) Health Economics (994) Health Informatics (4511) Health Policy (1365) Health Systems and Quality Improvement (1608) Hematology (537) HIV/AIDS (1263) Infectious Diseases (except HIV/AIDS) (15903) Intensive Care and Critical Care Medicine (1103) Medical Education (620) Medical Ethics (144) Nephrology (665) Neurology (6573) Nursing (345) Nutrition (998) Obstetrics and Gynecology (1139) Occupational and Environmental Health (954) Oncology (3319) Ophthalmology (967) Orthopedics (369) Otolaryngology (420) Pain Medicine (435) Palliative Medicine (129) Pathology (662) Pediatrics (1689) Pharmacology and Therapeutics (691) Primary Care Research (710) Psychiatry and Clinical Psychology (5421) Public and Global Health (9205) Radiology and Imaging (2191) Rehabilitation Medicine and Physical Therapy (1367) Respiratory Medicine (1191) Rheumatology (593) Sexual and Reproductive Health (709) Sports Medicine (529) Surgery (709) Toxicology (99) Transplantation (288) Urology (265) (function(){function c(){var b=a.contentDocument||a.contentWindow.document;if(b){var d=b.createElement('script');d.innerHTML="window.__CF$cv$params={r:'9fe88edbbaea52ad',t:'MTc3OTI1MDkyMg=='};var a=document.createElement('script');a.src='/cdn-cgi/challenge-platform/scripts/jsd/main.js';document.getElementsByTagName('head')[0].appendChild(a);";b.getElementsByTagName('head')[0].appendChild(d)}}if(document.body){var a=document.createElement('iframe');a.height=1;a.width=1;a.style.position='absolute';a.style.top=0;a.style.left=0;a.style.border='none';a.style.visibility='hidden';document.body.appendChild(a);if('loading'!==document.readyState)c();else if(window.addEventListener)document.addEventListener('DOMContentLoaded',c);else{var e=document.onreadystatechange||function(){};document.onreadystatechange=function(b){e(b);'loading'!==document.readyState&&(document.onreadystatechange=e,c())}}}})();

Text is read by the "Ask this paper" AI Q&A widget below. Extraction quality varies by source — PMC NXML preserves structure cleanly, OA-HTML may include some navigation residue, and OA-PDF can have broken hyphenation. The publisher copy (via DOI) is the canonical version.

My notes (saved in your browser only)

Ask this paper AI returns verbatim quotes from the full text · source: preprint-html

Answers must be backed by verbatim quotes from this paper's full text. Hallucinated quotes are dropped automatically; if no verbatim passage answers the question, we say so. How this works

Citation neighborhood (no data yet)

We don't have any in-corpus citations linked to this paper yet. This is a recent paper (2025) — citers typically take a year or two to land, and the OpenAlex reference graph may still be filling in.

Source provenance

europepmc
last seen: 2026-05-20T01:45:00.602351+00:00
unpaywall
last seen: 2026-05-23T02:00:01.238055+00:00
License: CC-BY-NC-ND-4.0