Municipal Wealth and Spatial Clustering of Leprosy Incidence in São Paulo, Brazil (2017-2020): Evidence from BYM2 Modeling

preprint OA: closed CC-BY-4.0
📄 Open PDF Full text JSON View at publisher
Full text 46,388 characters · extracted from preprint-html · click to expand
Socioeconomic determinants and spatial distribution of leprosy in São Paulo State, Brazil (2017–2020): a municipal-level analysis | medRxiv /* */ /* */ <!-- <!-- /*! * yepnope1.5.4 * (c) WTFPL, GPLv2 */ (function(a,b,c){function d(a){return"[object Function]"==o.call(a)}function e(a){return"string"==typeof a}function f(){}function g(a){return!a||"loaded"==a||"complete"==a||"uninitialized"==a}function h(){var a=p.shift();q=1,a?a.t?m(function(){("c"==a.t?B.injectCss:B.injectJs)(a.s,0,a.a,a.x,a.e,1)},0):(a(),h()):q=0}function i(a,c,d,e,f,i,j){function k(b){if(!o&&g(l.readyState)&&(u.r=o=1,!q&&h(),l.onload=l.onreadystatechange=null,b)){"img"!=a&&m(function(){t.removeChild(l)},50);for(var d in y[c])y[c].hasOwnProperty(d)&&y[c][d].onload()}}var j=j||B.errorTimeout,l=b.createElement(a),o=0,r=0,u={t:d,s:c,e:f,a:i,x:j};1===y[c]&&(r=1,y[c]=[]),"object"==a?l.data=c:(l.src=c,l.type=a),l.width=l.height="0",l.onerror=l.onload=l.onreadystatechange=function(){k.call(this,r)},p.splice(e,0,u),"img"!=a&&(r||2===y[c]?(t.insertBefore(l,s?null:n),m(k,j)):y[c].push(l))}function j(a,b,c,d,f){return q=0,b=b||"j",e(a)?i("c"==b?v:u,a,b,this.i++,c,d,f):(p.splice(this.i++,0,a),1==p.length&&h()),this}function k(){var a=B;return a.loader={load:j,i:0},a}var l=b.documentElement,m=a.setTimeout,n=b.getElementsByTagName("script")[0],o={}.toString,p=[],q=0,r="MozAppearance"in l.style,s=r&&!!b.createRange().compareNode,t=s?l:n.parentNode,l=a.opera&&"[object Opera]"==o.call(a.opera),l=!!b.attachEvent&&!l,u=r?"object":l?"script":"img",v=l?"script":u,w=Array.isArray||function(a){return"[object Array]"==o.call(a)},x=[],y={},z={timeout:function(a,b){return b.length&&(a.timeout=b[0]),a}},A,B;B=function(a){function b(a){var a=a.split("!"),b=x.length,c=a.pop(),d=a.length,c={url:c,origUrl:c,prefixes:a},e,f,g;for(f=0;f<d;f++)g=a[f].split("="),(e=z[g.shift()])&&(c=e(c,g));for(f=0;f<b;f++)c=x[f](c);return c}function g(a,e,f,g,h){var i=b(a),j=i.autoCallback;i.url.split(".").pop().split("?").shift(),i.bypass||(e&&(e=d(e)?e:e[a]||e[g]||e[a.split("/").pop().split("?")[0]]),i.instead?i.instead(a,e,f,g,h):(y[i.url]?i.noexec=!0:y[i.url]=1,f.load(i.url,i.forceCSS||!i.forceJS&&"css"==i.url.split(".").pop().split("?").shift()?"c":c,i.noexec,i.attrs,i.timeout),(d(e)||d(j))&&f.load(function(){k(),e&&e(i.origUrl,h,g),j&&j(i.origUrl,h,g),y[i.url]=2})))}function h(a,b){function c(a,c){if(a){if(e(a))c||(j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}),g(a,j,b,0,h);else if(Object(a)===a)for(n in m=function(){var b=0,c;for(c in a)a.hasOwnProperty(c)&&b++;return b}(),a)a.hasOwnProperty(n)&&(!c&&!--m&&(d(j)?j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}:j[n]=function(a){return function(){var b=[].slice.call(arguments);a&&a.apply(this,b),l()}}(k[n])),g(a[n],j,b,n,h))}else!c&&l()}var h=!!a.test,i=a.load||a.both,j=a.callback||f,k=j,l=a.complete||f,m,n;c(h?a.yep:a.nope,!!i),i&&c(i)}var i,j,l=this.yepnope.loader;if(e(a))g(a,0,l,0);else if(w(a))for(i=0;i (function(w,d,s,l,i){w[l]=w[l]||[];w[l].push({'gtm.start':new Date().getTime(),event:'gtm.js'});var f=d.getElementsByTagName(s)[0];var j=d.createElement(s);var dl=l!='dataLayer'?'&l='+l:'';j.src='//www.googletagmanager.com/gtm.js?id='+i+dl;j.type='text/javascript';j.async=true;f.parentNode.insertBefore(j,f);})(window,document,'script','dataLayer','GTM-P4HH5NV'); Skip to main content Home About Submit ALERTS / RSS Search for this keyword Advanced Search Socioeconomic determinants and spatial distribution of leprosy in São Paulo State, Brazil (2017–2020): a municipal-level analysis View ORCID Profile Carlos Souto dos Santos Filho , View ORCID Profile Ana Júlia Alves Câmara , View ORCID Profile Guilherme Aparecido Santos Aguilar doi: https://doi.org/10.1101/2025.09.16.25335912 Carlos Souto dos Santos Filho a Graduate Program in Statistics, Institute of Mathematics, Statistics and Scientific Computing, State University of Campinas—UNICAMP , Rua Sérgio Buarque de Holanda, 651, Campinas - 13083-859, SP, Brazil Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Carlos Souto dos Santos Filho For correspondence: c300761{at}dac.unicamp.br Ana Júlia Alves Câmara b Federal University of Espírito Santo - UFES, Avenida Fernando Ferrari , 514, Goiabeiras, Vitória, ES, 29075-910, Brazil Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Ana Júlia Alves Câmara Guilherme Aparecido Santos Aguilar c Faculty of Science and Technology, Department of Statistics, São Paulo State University – UNESP , Rua Roberto Símonsen, 305 – Educational Center, Pres. Prudente – SP, 19060-900, Brazil Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Guilherme Aparecido Santos Aguilar Abstract Full Text Info/History Metrics Data/Code Preview PDF Summary Objectives Leprosy remains a significant public health challenge in Brazil, with distinct spatial and temporal patterns reflecting underlying socioeconomic inequalities. This study investigated the association between municipal socio-territorial indicators and the geographic distribution of leprosy in São Paulo State. Methods A total of 4562 new leprosy cases reported across 645 municipalities from 2017 to 2020 were analysed using Bayesian spatial modelling. The Besag–York–Mollié 2 (BYM2) model was implemented to estimate relative risk while accounting for spatial dependence, incorporating municipal wealth as a covariate. Expected case counts were calculated based on overall state incidence rates and local population sizes. Exceedance probabilities were computed to identify high-risk clusters using a threshold of relative risk >2.0. Results Local relative risk estimates ranged from 0.06 to 31.52 (median: 0.96), with substantial spatial heterogeneity across municipalities. Municipal wealth demonstrated a significant protective effect (posterior mean: −0.059, 95% CrI: −0.081 to −0.037), indicating lower leprosy incidence in economically advantaged areas. The mixing parameter ( φ = 0.517) revealed approximately equal contributions of structured spatial and unstructured random effects. High-risk clusters were predominantly concentrated in western and northern regions of the state. Conclusions Leprosy distribution in São Paulo State exhibits significant spatial clustering associated with municipal wealth disparities. The persistent geographic patterns suggest that socioeconomic conditions are associated with variations in local leprosy risk across municipalities. These findings support targeted public health interventions in identified high-risk areas and highlight the importance of addressing underlying sociodemographic inequalities that may influence the local effectiveness of leprosy control strategies. Introduction Hansen’s disease, caused by Mycobacterium leprae and Mycobacterium lepromatosis , is a chronic infectious disease ranking as the second most common mycobacterial infection world-wide after tuberculosis. 1 The bacteria target Schwann cells and dermal macrophages, causing peripheral neuropathy, cutaneous manifestations, and mucosal lesions that may progress to motor and sensory impairments, deformities, and stigmatising wounds. In addition to its clinical impact, historically, the disease carries profound social implications due to historical discrimination and exclusion. Key scientific milestones include Hansen’s discovery of M. leprae in 1873; Shepard’s successful bacterial cultivation in mouse footpads at the U.S. Centers for Disease Control in 1959; and Kirchheimer and Storrs’ development of the nine-banded armadillo model in 1968, which enabled disseminated infection studies. These advances significantly enhanced understanding of the disease’s pathogenesis and treatment approaches. 2 Despite decades of public health initiatives, leprosy continues to affect populations disproportionately in low- and middle-income countries (LMICs), where poverty, poor housing conditions, and limited access to health care persist. Globally, from 1990 to 2021, the age-standardised incidence rate (ASIR) for leprosy declined by 64.79%, reaching 0.58 per 100,000 population in 2021. 3 The global burden, as measured by disability-adjusted life years (DALYs), also followed a downward trajectory, yet leprosy remains endemic in more than 120 countries. Notably, Brazil, India, and Indonesia together account for approximately 79.3% of new annual cases, with the disease particularly concentrated in tropical and subtropical regions. 1 In these contexts, the persistence of leprosy reflects not only biological transmission mechanisms but also structural and societal inequities that facilitate the disease ’ s spread and hinder timely diagnosis and treatment. In Brazil, leprosy continues to represent a complex public health issue, with distinct spatial and temporal patterns. Recent investigations have documented heterogeneous relapse rates and disease clustering across the national territory. Using space–time scan statistics, Boigny and colleagues identified high-risk clusters of leprosy relapse in the North, Northeast, and Central-West regions, characterised by relative risks (RR) ranging from 1.78 to 3.97. 4 These clusters were frequently found in socioeconomically disadvantaged municipalities with barriers to health service access. According to the authors, these patterns are associated with both structural vulnerabilities and higher baseline infection rates, which contribute to continued transmission and recurrence of the disease. In a complementary analysis, Sczmanski et al . 5 assessed clinical and epidemiological data from 215,155 newly reported leprosy cases between 2014 and 2019. Their findings revealed that the disease remains stable in most Brazilian regions, with the highest detection rates in the Midwest and lowest in the South. The most affected individuals were predominantly male, literate, and of black or brown ethnicity, aged between 60 and 79 years. Multibacillary forms and borderline clinical presentations predominated, suggesting late detection and heightened transmission potential. The study emphasised that leprosy persists as a public health concern, closely linked to social inequalities and requiring spatially informed public health responses. For a long time, the importance of epidemiology related to leprosy was neglected in spatial studies. Guided by these findings, the present study adopts a spatial epidemiology approach to investigate the association between municipal-level socio-territorial indicators and the geographic distribution of leprosy in the state of São Paulo from 2017 to 2020. By incorporating spatial statistical modelling and disease mapping techniques, this analysis aims to uncover hidden patterns of risk and support the strategic allocation of public health resources in line with the WHO’s “Towards Zero Leprosy” roadmap. The main objective of this study was to evaluate the association between municipality-level socio-territorial indicators—namely wealth, longevity, and education—and the spatial distri-bution of leprosy cases in the State of São Paulo from 2017 to 2020. Additionally, the study aimed to identify clusters of municipalities where the incidence of leprosy was significantly higher than expected based on available covariates, suggesting the presence of underlying social or environmental determinants not captured by standard indicators. Furthermore, the study sought to compare patterns of leprosy incidence across pre-defined socio-territorial groups of municipalities, with a particular focus on assessing whether combinations of low wealth were consistently associated with increased leprosy risk. Materials and methods STUDY AREA: STATE OF SÃO PAULO Demographic data from the 2022 Brazilian Census indicate that the state of São Paulo reached a total population of 44.4 million, reflecting an increase of 3.2 million residents over the previous twelve years, corresponding to an average annual growth of 263,200 individuals. Since 1940, the population has expanded by a factor of 6.2. 6 However, recent decades have witnessed a deceleration in growth rates due to declining fertility and a reduction in net migration. Between 2010 and 2022, the capital’s annual growth rate was 0.15%, significantly lower than the rates observed in the interior (0.79%) and the state as a whole (0.62%). The most recent census confirmed a reduction in the state’s overall population growth rate, which fell from 1.09% in the 2000–2010 period to 0.62% in the subsequent intercensal period. This shift was accompanied by a rise in the number of municipalities experiencing population decline, increasing from 102 to 197, while the number of municipalities with positive growth declined from 543 to 448. 6 In addition to demographic indicators, the São Paulo Index of Social Responsibility (IPRS), which evaluates municipalities based on wealth, longevity, and educational attainment, revealed notable changes between 2014 and 2018. The number of municipalities classified as vulnerable, characterised by low levels in all three dimensions, decreased from 77 to 61, with a corresponding reduction in the affected population from 2.35 million (5.5%) to 2.02 million (4.6%). 7 The number of dynamic municipalities, defined by their economic vitality and medium to high performance in education and longevity indicators, increased from 104 to 112, expanding the share of the population in this category from 32.1% (13.7 million) to 34.0% (15 million). Although the number of unequal municipalities, which generate wealth but exhibit low performance in either education or longevity, rose from 71 to 75, the associated population declined slightly from 45.3% (19.33 million) to 43.6% (19.18 million). Lastly, the group of equitable municipalities, which present low levels of wealth but relatively favourable outcomes in education and longevity, increased from 212 to 218 municipalities, encompassing 9.8% (4.31 million) of the state ’ s population in 2018, compared to 9.7% (4.14 million) in 2014. 7 DATA EXTRACTION The health and socioeconomic information used in this study was obtained from digitised and anonymised data provided by official state agencies. The dependent variable (DV) corresponds to the number of incident cases of leprosy reported in the state of São Paulo during the period from 2017 to 2020. These data were obtained from the Technical Division of Epidemiological Surveillance of Leprosy, part of the Centre for Epidemiological Surveillance of the São Paulo State Health Department. The independent variables include socioeconomic indicators derived from the São Paulo IPRS, which encompasses municipal-level measures of wealth, longevity, and education. These indicators were obtained from the State Data Analysis System (SEADE Foundation), an agency under the Government of the State of São Paulo. All IPRS data refer to the year 2018 and are publicly available for the state ’ s 645 municipalities. COVARIATE SELECTION: MUNICIPAL WEALTH INDICATOR Among the variables considered in the statistical modelling, the municipal wealth indicator (2018), derived from the IPRS, was selected as a covariate in the Poisson regression model. The choice of this variable was based on both theoretical relevance and empirical significance. The wealth indicator captures the economic profile of each municipality by integrating multiple components. These include electricity consumption in agriculture, commerce, and services; per capita value added; residential electricity consumption; and the average income of formally employed individuals in both the private and public sectors. These data are sourced from administrative records provided by the State Secretariats of Finance and Energy of São Paulo as well as the Ministry of Labour and Employment. The indicator is scaled from 0 to 100 and can be reproduced annually, ensuring its applicability in longitudinal studies. In the Poisson regression model, Wealth (2018) demonstrated a statistically significant and inverse association with the outcome variable (estimate = –0.03878; p < 0.001). This finding suggests that municipalities with higher levels of economic wealth tend to present lower expected counts of incident leprosy cases. This relationship is consistent with prior literature linking socioeconomic development to improved public health and environmental outcomes, reinforcing the theoretical justification for its inclusion in the model. The other covariates, longevity and education, were also evaluated; however, only education showed a statistically significant positive association in the model (estimate = 0.03811; p < 0.001), while longevity was not statistically significant ( p = 0.83). These results inform the understanding of how multidimensional socioeconomic factors influence the phenomenon under study. SPATIAL MODELLING: BYM2 MODEL In this study, we applied the BYM2 model to estimate the spatial distribution of leprosy incidence across municipalities in the state of São Paulo. Although standardised incidence ratios (SIRs) are commonly used in spatial epidemiology, they can be unstable and misleading, particularly in areas with small populations or where the disease is rare. In such cases, the expected number of cases may be very low, leading to high variance and potential misinterpretation of risk patterns. To address this limitation, hierarchical Bayesian models such as the BYM2 offer a more robust alternative by borrowing information from neighbouring regions and integrating relevant covariates. This enables the smoothing of extreme values and enhances the stability of risk estimates. 8 , 9 Simpson et al . 10 proposed the BYM2 model as an updated and reparameterised version of the traditional Besag–York–Mollié (BYM) model. 11 It enables the specification of interpretable and computationally efficient penalised complexity (PC) priors. In this model, the relative risk for area iii, denoted as ‘λi’, is modeled as: where E i is the expected number of cases in area i, X i β represents the fixed effects of covariates (e.g., municipal wealth), and U i is a spatially structured random effect combining W i , an intrinsic conditional autoregressive (CAR) term, and V i , an unstructured independent noise term. In the BYM2 formulation, these components are scaled and combined into a single expression to balance structured and unstructured effects via a mixing parameter ϕ , as follows: where τ b is the overall precision (inverse variance) of the combined spatial effect, and ϕ ∈ [0,1] controls the proportion of total variance attributed to the structured spatial component u * . When ϕ = 1, the model behaves as a fully structured spatial model, whereas ϕ = 0 corresponds to a model driven entirely by unstructured noise. This reparameterisation simplifies model interpretation and facilitates prior specification in the Bayesian framework. In particular, PC priors can be applied to penalise model complexity, thereby shrinking the structured spatial component toward a base model of spatially unstructured random variation, unless the data strongly support it. The model was implemented using the INLA (Integrated Nested Laplace Approximation) approach in R-INLA. The use of the BYM2 model in this context ensures statistically stable and spatially coherent estimates of leprosy risk, accommodating the heterogeneity in population size and enabling robust inference across small areas. The marginal precision of the spatially structured random effect ( τ b ) was assigned a penalized complexity (PC) prior defined as . Following the rule of thumb by Simpson et al ., 10 a marginal standard deviation of approximately 0.5 was assumed as a reasonable upper bound and thus set U = 0.5/0.31 and a = 0.01, yielding the prior . For the mixing parameter φ , which balances spatially structured and unstructured effects, we specified the prior P ( φ < 0.5) = 2/3 reflecting a conservative assumption that the unstructured component accounts for more of the variability. Given the presence of 191 zeros in the dataset, we also investigated the potential for zero inflation and selected model configurations accordingly to improve computational efficiency. For transparency and reproducibility, the final model expression below is presented using the syntax implemented in the INLA syntax rather than traditional mathematical notation: COMPUTATIONAL STATISTICAL ANALYSIS Exploratory data analysis was initially performed to detect outliers, missing values and assess zero inflation in the response variable. A spatial neighbourhood map was constructed to identify adjacent municipalities within São Paulo State, defining the neighbourhood structure required for spatial modelling ( Figure 1 ). This adjacency matrix was built using geographic boundary data to determine which municipalities share common borders, establishing the spatial relationships necessary for incorporating spatial dependence in the analysis. One isolated polygon was identified during this process. Spatial neighborhood structures were then defined based on this adjacency information to support spatial modeling, and expected counts were computed for each area i using the formula E i = r ( s ) × n ( i ), where r ( s ) is the overall disease rate (total number of cases divided by the total population across all areas), and n ( i ) is the population of area i . Download figure Open in new tab Figure 1. Neighbors of municipalities of São Paulo State. These expected counts were used to calculate the standardised incidence ratio (SIR) for preliminary spatial risk assessment. Based on exploratory patterns and covariate distributions, final model covariates were selected. The statistical analysis was conducted using R version 4.4.0, with the support of the following packages: terra, geodata, geostatsp, mapmisc, diseasemapping, INLA , and tmap . Results and discussions To examine the association between socio-territorial indicators and the spatial distribution of leprosy, we analysed municipality-level data for the period 2017–2020 across the 645 municipalities of São Paulo. The analysis combined descriptive epidemiological measures with spatial modelling to identify patterns of risk and their relationship with socioeconomic conditions. During the study period, 4562 new leprosy cases were reported, corresponding to a mean of 7.07 cases per municipality (range: 0–461) and a median of 2 (IQR: 0–5). Expected counts, calculated using the overall state detection rate and municipal population, also averaged 7.07 but ranged widely (0.084–1220.76), reflecting the large variation in population size across municipalities. The SIR ranged from 0.00 to 32.81 (median 0.82; mean 1.72), indicating that while most municipalities experienced incidence close to or below the expected level, a smaller subset exhibited markedly elevated risk relative to the state average. The municipal wealth index (2018) showed moderate socioeconomic variability across municipalities (mean 34.6; range 15–62). To facilitate interpretation of spatial patterns, three complementary maps were generated ( Figure 2 ): observed case counts, expected counts, and SIRs. For interpretation, Panel A illustrates the absolute burden of reported cases across municipalities, whereas Panel B adjusts for population size by presenting the number of cases expected if the state detection rate were uniformly applied throughout the study area. Panel C displays the SIR, enabling identification of municipalities where the observed incidence is higher or lower than expected relative to the state average. Geographically, the highest absolute numbers of reported cases in Panel A are concentrated in the more densely populated metropolitan and urbanised areas, particularly in the eastern portion of the state, including the metropolitan region of São Paulo, which largely reflects population concentration. Elevated case counts are also observed in the northern region (Fernandópolis municipality) and in the northwestern region around São José do Rio Preto and Ribeirão Preto, where case counts range from approximately 100 to 461. These municipalities are generally characterised by larger populations, which partly explains the higher number of reported cases, although Fernandópolis represents a notable exception, with relatively elevated case counts despite its smaller population size. Similarly, Panel B shows a spatial pattern driven by demographic distribution, with larger expected counts occurring in municipalities with greater population size across the eastern and central regions of São Paulo. However, Panel C reveals a different pattern when incidence is standardised: several municipalities in the western and northwestern regions exhibit SIR values above the state average, indicating higher-than-expected incidence relative to population size. These areas, therefore, represent atypical patterns in which the disease burden cannot be explained solely by population density and may reflect localised epidemiological or socio-territorial determinants of transmission. This comparison helps distinguish areas with truly elevated risk from those where high case numbers simply reflect larger population size. Download figure Open in new tab Figure 2. Spatial distribution of observed cases (A), Expected cases (B), and SIRs (C) for Leprosy (2017–2020) in São Paulo State. While these descriptive maps provide an overview of spatial variation, model-based estimates are necessary to account for spatial dependence and stabilise estimates in municipalities with small populations. To quantify the association between municipal socioeconomic conditions and leprosy incidence, a spatial Bayesian model using the BYM2 specification was fitted ( Table 1 ). View this table: View inline View popup Download powerpoint Table 1. Posterior means and 95% credible intervals for model parameters obtained from fitting the São Paulo leprosy data with the BYM2 model Correspondence to: Carlos Souto dos Santos Filho (e-mail: c300761{at}dac.unicamp.br )© The author(s). This article is Open Access under CC BY 4.0 1 The estimated intercept (log-risk) was 1.138 (95% CrI: 0.362–1.915). Municipal wealth showed a statistically significant negative association with leprosy incidence (β = − 0.059; 95% CrI − 0.081 to − 0.037), indicating that municipalities with higher socioeconomic status tended to have lower relative risk. The precision parameter ( τ = 0.430; 95% CrI 0.350–0.522) and the mixing parameter ( φ = 0.517; 95% CrI 0.349–0.684) suggest that both structured spatial dependence and local unstructured heterogeneity contribute to the observed variation in risk. The posterior distribution of the wealth coefficient is illustrated in Figure 3 . The entire 95% credible interval lies below zero, providing strong evidence for a negative association between wealth and leprosy risk. Download figure Open in new tab Figure 3. Posterior distribution of the coefficient of covariate wealth. Posterior municipal relative risks (RR) had a median of 0.96 and a mean of 1.75, with values ranging from 0.06 to 31.52 ( Table 2 ). Figure 4 presents the spatial distribution of the posterior mean RR and its uncertainty. Municipalities with darker shading in Panel A represent areas with higher estimated risk, while Panels B and C show the lower and upper limits of the 95% credible interval, highlighting areas where uncertainty is greater. In the colour scale used in the maps, darker purple tones represent lower RR values, while progressively lighter colours correspond to higher values, allowing areas with elevated estimated risk to be visually distinguished from municipalities with lower risk. The lower limit (LL) of the 95% credible interval varied from 0.0009 to 21.92, while the upper limit (UL) ranged from 0.35 to 53.10. These values indicate that although the majority of municipalities had low or average risk, there were high-risk clusters with substantially elevated relative risk, suggesting spatial heterogeneity in the distribution of leprosy that may be associated with underlying socio-environmental determinants. View this table: View inline View popup Download powerpoint Table 2. Summary statistics for RR, LL, and UL variables Download figure Open in new tab Figure 4. Mean (A) and lower (B) and upper (C) limits of 95% credible intervals of leprosy RR in São Paulo municipalities. To further understand the spatial heterogeneity of leprosy risk beyond observed covariates, we examined the posterior mean of the spatial random effect b from the BYM2 model. This parameter captures unmeasured spatial variation by combining both structured (spatially correlated) and unstructured (random noise) components. Figure 5 presents the posterior mean estimates of b across all municipalities in São Paulo. Positive values of b indicate areas with higher-than-expected leprosy risk not explained by the included covariate (wealth), while negative values suggest reduced risk or potential underreporting. This spatial residual helps identify hidden patterns of disease transmission and suggests municipalities where additional epidemiological investigation may be warranted. Importantly, this interpretation is strengthened when the spatial random effects are considered together with other model outputs, such as the estimated association with wealth and the predicted municipal relative risks, since the combined set of results provides a more comprehensive picture of spatial risk patterns than observed data or latent effects alone. Download figure Open in new tab Figure 5. Posterior mean of the BYM2 random effect b . To identify areas with significantly elevated leprosy risk, exceedance probabilities were calculated using a threshold of RR > 2, a criterion commonly adopted in public health to flag high-priority regions. This threshold reflects municipalities where the relative risk is at least double the state average, indicating potential hotspots of concern. Figure 6 displays the spatial distribution of exceedance probabilities across São Paulo municipalities. The colour scale aids interpretation: light yellow areas represent low probabilities (low-risk), orange to red areas indicate moderate evidence of elevated risk, and dark red to purple areas signal high probabilities (close to 1), reflecting strong statistical evidence that RR exceeds 2. Download figure Open in new tab Figure 6. Exceedance probabilities for leprosy relative risk greater than 2 across municipalities in São Paulo (2017–2020). The map reveals distinct spatial patterns. Clusters of high exceedance probabilities are concentrated in the western and northern regions of the state, while southeastern coastal areas also show some persistent high-risk zones. In contrast, central and southern interior municipalities generally display low probabilities, suggesting a lower likelihood of elevated leprosy risk. To assess the quality of the fitted BYM2 spatial model, posterior samples and densities were extracted using INLA’s internal sampling functions ( n = 1000). This approach enables visualisation of marginal posterior distributions and contributes to evaluating model fit beyond summary statistics ( Figure 7 ). The extracted densities help identify the distributional behaviour of key parameters and verify whether the posterior estimates are consistent with prior assumptions and data structure. It is worth noting that the R package used for model fitting and visualisation does not natively support the simultaneous plotting of prior and posterior distributions. Therefore, a direct visual comparison of how the data updates the prior distribution for each parameter could not be incorporated into Figure 7 . Download figure Open in new tab Figure 7. Histograms of posterior samples (black bars) obtained from fitting the BYM2 model using INLA ( n = 1000), along with posterior densities derived from the marginal distributions (blue lines). Model fit was further assessed using the Deviance Information Criterion (DIC). The DIC value of 2526.27 reflects the balance between model fit and complexity; although not interpretable in isolation, it serves as a basis for model comparison. The Conditional Predictive Ordinate (CPO) values were also examined to evaluate predictive performance and potential outliers. The distribution of CPO values, where 98% (633 out of 645) of municipalities had CPO < 0.01, suggests low predictive accuracy in many areas. This pattern may indicate overdispersion, zero inflation, or deviation from the assumed Poisson structure in specific municipalities. These findings underscore the need to interpret spatial patterns with caution, particularly in locations with extreme or sparse data. The BYM2 model revealed significant spatial heterogeneity in leprosy risk across the 645 municipalities, with relative risk estimates ranging from 0.06 to 31.52. Municipal wealth emerged as a significant protective factor (posterior mean: –0.059, 95% CrI: –0.081 to –0.037), indicating that economically advantaged areas consistently demonstrated lower leprosy incidence rates. The mixing parameter ( φ = 0.517) suggested approximately equal contributions of structured spatial dependence and unstructured random variation in explaining disease distribution. Exceedance probability analysis identified distinct high-risk clusters primarily concentrated in western and northern regions of the state, where municipalities exhibited probabilities exceeding the threshold of RR greater than 2.0, representing areas with at least double the state average incidence rate. The observed spatial clustering of leprosy cases reflects persistent socioeconomic disparities and suggests the influence of unmeasured environmental or social determinants operating at the municipal level. The concentration of high-risk areas in western and northern São Paulo aligns with historical patterns of regional development inequality, where these areas typically exhibit lower infrastructure investment and reduced access to specialised healthcare services. The stability of these spatial patterns over the four-year study period indicates sustained exposure conditions rather than temporary epidemiological fluctuations, similar to findings in other chronic infectious diseases where poverty-related factors create enduring transmission environments. The negative association between municipal wealth and leprosy incidence supports the well-established relationship between socioeconomic development and infectious disease burden, suggesting that comprehensive poverty reduction strategies may serve as effective primary prevention measures. Additionally, the substantial unexplained spatial variation captured by the random effects component indicates that factors beyond municipal wealth, such as housing quality, population density, healthcare accessibility, or cultural practices, likely contribute to disease transmission dynamics and warrant further epidemiological investigation. This study demonstrates several methodological strengths, including the use of four years of comprehensive surveillance data from São Paulo’s robust epidemiological system, ensuring high case ascertainment and diagnostic reliability. The BYM2 modelling approach effectively addressed the statistical challenges inherent in rare disease mapping by borrowing strength from neighbouring municipalities and incorporating spatial dependence, thereby producing more stable risk estimates than traditional standardised incidence ratios. The integration of penalised complexity priors prevented overfitting while maintaining interpretability, because these priors constrain the spatial random effects toward a simpler base model (i.e., no spatial structure) unless the data provide sufficient evidence for additional complexity. In the context of our municipal data, where several areas report few cases, this approach reduces the risk of spurious spatial patterns while still allowing meaningful spatial variation to be detected. The exceedance probability framework provided a practical tool for public health priority setting. However, important limitations must be acknowledged. The use of municipal-level aggregated data may mask within-municipality heterogeneity and introduce ecological fallacy when inferring individual-level relationships. Residence at diagnosis served as a proxy for exposure location, potentially misclassifying individuals with complex migration histories or long latency periods typical of leprosy. The model’s limited covariate structure, while statistically significant, explained only a portion of the observed spatial variation, suggesting that crucial unmeasured factors, including individual-level sociodemographic characteristics, environmental exposures, and healthcare utilisation patterns, remain unaccounted for. Furthermore, the high proportion of municipalities with low predictive accuracy (CPO < 0.01 in 98% of areas) indicates potential model misspecification or overdispersion that may affect the reliability of risk estimates in specific locations. Conclusions The observed distribution of leprosy incidence in São Paulo State exhibits spatial clustering associated with municipal wealth disparities. The persistent geographic patterns suggest that socioeconomic conditions are associated with variations in local leprosy risk across municipalities. These findings support targeted public health interventions in identified high-risk areas and highlight the importance of addressing underlying sociodemographic inequalities that may influence the local effectiveness of leprosy control strategies. Future research should explore approaches that integrate high-resolution spatial and temporal data with analyses stratified by vulnerable groups through spatio-temporal modelling frameworks to better understand disease dynamics and inform precision public health interventions. Data Availability All data produced in the present study are available upon reasonable request to the authors Ethical considerations Regarding research ethics and risk assessment, it is important to highlight that the study poses no risk to participants, since all data were previously anonymised and only epidemiologic, non-sensitive information was accessed. Therefore, the requirements of the Brazilian General Data Protection Law (LGPD - Law No. 13.853/2019) were fully met, which specifically provides for the possibility of processing data for scientific purposes without the need for the data subject’s consent. Conflict of interests The authors report no conflicts of interest. Funding No funding was paid for this research. Authors’ contributions CSSF conceived the study; CSSF designed the study protocol; CSSF collected data, performed data entry and carried out the data analysis and interpretation; CSSF, AJAC and GASA drafted the manuscript; CSSF, AJAC and GASA critically revised the manuscript for intellectual content; CSSF, AJAC and GASA read and approved the final manuscript. CSSF is guarantor of the paper. Patient consent statement No patient consent was required. Data sharing statement The supporting data for this article can be obtained from the corresponding author on request. Footnotes Title revised to better reflect the epidemiological focus of the study; Results section updated to enhance readability and flow; Interpretation of figures and maps clarified throughout; Methodological explanations refined for greater precision; Technical terminology removed to improve accessibility for a broader audience; Model specification and interpretation of spatial effects addressed and clarified; Wording related to socioeconomic determinants revised for accuracy and consistency. References ↵ Grijsen ML , Nguyen TH , Pinheiro RO , Singh P , Lambert SM , Walker SL , Geluk A. Leprosy . Nat Rev Dis Primers , 2024 ; 10 ( 1 ): 90 . doi: 10.1038/s41572-024-00575-1 . OpenUrl CrossRef PubMed ↵ Santacroce L , Del Prete R , Charitos IA , Bottalico L. Mycobacterium leprae: a historical study on the origins of leprosy and its social stigma . Infez Med , 2021 ; 29 ( 4 ): 623 – 632 . doi: 10.53854/liim-2904-18 . OpenUrl CrossRef PubMed ↵ Chen W , Chen Y , Cheng Z , Chen Y , Lv C , Ma L et al. Global patterns of syphilis, gonococcal infection, typhoid fever, paratyphoid fever, diphtheria, pertussis, tetanus, and leprosy from 1990 to 2021: findings from the Global Burden of Disease Study 2021 . Infect Dis Poverty , 2024 ; 13 ( 1 ): 66 . doi: 10.1186/s40249-024-01231-2 . OpenUrl CrossRef PubMed ↵ Boigny RN , de Sousa Cavalcante KK , Florencio CMGD , Nogueira PSF , Gomes CM , Alencar CH . Temporal trends and space-time distribution of leprosy relapse in Brazil from 2001 to 2021 . Trans R Soc Trop Med Hyg , 2024 ; 118 ( 8 ): 537 – 549 . doi: 10.1093/trstmh/trae021 . OpenUrl CrossRef PubMed ↵ Sczmanski AS , Pazin L , Sakae TM , Mazon J. Analysis of the clinical and epidemiological profile of leprosy in Brazil and major regions . An Bras Dermatol , 2025 ; 100 ( 4 ): 501127 . doi: 10.1016/j.abd.2025.501127 . OpenUrl CrossRef PubMed ↵ Instituto Brasileiro de Geografia e Estatística (IBGE ). Censo Demográfico 2022: Resultados Preliminares – População e Habitantes [Internet] . Rio de Janeiro : IBGE , 2023 . Available from: https://www.ibge.gov.br/en/statistics/social/labor/22836-2022-census-3.html . ↵ Fundação SEADE. índice Paulista de Responsabilidade Social – IPRS 2014-2018 . São Paulo : SEADE , 2019 . Available from: http://www.iprs.seade.gov.br/downloads/pdf/iprs_release_site.pdf . ↵ Gelfand AE , Diggle PJ , Guttorp P , Fuentes M (eds) Handbook of Spatial Statistics . Boca Raton, FL : Chapman & Hall/CRC , 2010 . ISBN: 978-1420072877 . ↵ Lawson AB . Bayesian Disease Mapping: Hierarchical Modeling in Spatial Epidemiology . 2nd edn, Boca Raton, FL : Chapman & Hall/CRC , 2009 . ISBN: 978-1584888406 . ↵ Simpson D , Rue H , Riebler A , Martins TG , Sørbye SH . Penalising model component complexity: a principled, practical approach to constructing priors . Stat Sci , 2017 ; 32 : 1 – 28 . doi: 10.1214/16-STS576 . OpenUrl CrossRef ↵ Besag J , York J , Mollié A. Bayesian image restoration, with two applications in spatial statistics . Ann Inst Statist Math , 1991 ; 43 ( 1 ): 1 – 20 . doi: 10.1007/BF00116466 . OpenUrl CrossRef PubMed View the discussion thread. Back to top Previous Next Posted April 22, 2026. Download PDF Data/Code Email Thank you for your interest in spreading the word about medRxiv. NOTE: Your email address is requested solely to identify you as the sender of this article. Your Email * Your Name * Send To * Enter multiple addresses on separate lines or separate them with commas. You are going to email the following Socioeconomic determinants and spatial distribution of leprosy in São Paulo State, Brazil (2017–2020): a municipal-level analysis Message Subject (Your Name) has forwarded a page to you from medRxiv Message Body (Your Name) thought you would like to see this page from the medRxiv website. Your Personal Message CAPTCHA This question is for testing whether or not you are a human visitor and to prevent automated spam submissions. Share Socioeconomic determinants and spatial distribution of leprosy in São Paulo State, Brazil (2017–2020): a municipal-level analysis Carlos Souto dos Santos Filho , Ana Júlia Alves Câmara , Guilherme Aparecido Santos Aguilar medRxiv 2025.09.16.25335912; doi: https://doi.org/10.1101/2025.09.16.25335912 Share This Article: Copy Citation Tools Socioeconomic determinants and spatial distribution of leprosy in São Paulo State, Brazil (2017–2020): a municipal-level analysis Carlos Souto dos Santos Filho , Ana Júlia Alves Câmara , Guilherme Aparecido Santos Aguilar medRxiv 2025.09.16.25335912; doi: https://doi.org/10.1101/2025.09.16.25335912 Citation Manager Formats BibTeX Bookends EasyBib EndNote (tagged) EndNote 8 (xml) Medlars Mendeley Papers RefWorks Tagged Ref Manager RIS Zotero Tweet Widget Facebook Like Google Plus One Subject Area Epidemiology Subject Areas All Articles Addiction Medicine (568) Allergy and Immunology (863) Anesthesia (299) Cardiovascular Medicine (4426) Dentistry and Oral Medicine (443) Dermatology (382) Emergency Medicine (607) Endocrinology (including Diabetes Mellitus and Metabolic Disease) (1507) Epidemiology (15222) Forensic Medicine (30) Gastroenterology (1123) Genetic and Genomic Medicine (6589) Geriatric Medicine (667) Health Economics (997) Health Informatics (4525) Health Policy (1368) Health Systems and Quality Improvement (1612) Hematology (540) HIV/AIDS (1264) Infectious Diseases (except HIV/AIDS) (15910) Intensive Care and Critical Care Medicine (1103) Medical Education (623) Medical Ethics (145) Nephrology (667) Neurology (6588) Nursing (346) Nutrition (998) Obstetrics and Gynecology (1143) Occupational and Environmental Health (956) Oncology (3331) Ophthalmology (971) Orthopedics (369) Otolaryngology (420) Pain Medicine (435) Palliative Medicine (129) Pathology (663) Pediatrics (1690) Pharmacology and Therapeutics (691) Primary Care Research (710) Psychiatry and Clinical Psychology (5440) Public and Global Health (9221) Radiology and Imaging (2195) Rehabilitation Medicine and Physical Therapy (1369) Respiratory Medicine (1196) Rheumatology (593) Sexual and Reproductive Health (710) Sports Medicine (529) Surgery (711) Toxicology (99) Transplantation (289) Urology (265) (function(){function c(){var b=a.contentDocument||a.contentWindow.document;if(b){var d=b.createElement('script');d.innerHTML="window.__CF$cv$params={r:'9fff245f191f1640',t:'MTc3OTQ4NzczMw=='};var a=document.createElement('script');a.src='/cdn-cgi/challenge-platform/scripts/jsd/main.js';document.getElementsByTagName('head')[0].appendChild(a);";b.getElementsByTagName('head')[0].appendChild(d)}}if(document.body){var a=document.createElement('iframe');a.height=1;a.width=1;a.style.position='absolute';a.style.top=0;a.style.left=0;a.style.border='none';a.style.visibility='hidden';document.body.appendChild(a);if('loading'!==document.readyState)c();else if(window.addEventListener)document.addEventListener('DOMContentLoaded',c);else{var e=document.onreadystatechange||function(){};document.onreadystatechange=function(b){e(b);'loading'!==document.readyState&&(document.onreadystatechange=e,c())}}}})();

Text is read by the "Ask this paper" AI Q&A widget below. Extraction quality varies by source — PMC NXML preserves structure cleanly, OA-HTML may include some navigation residue, and OA-PDF can have broken hyphenation. The publisher copy (via DOI) is the canonical version.

My notes (saved in your browser only)

Ask this paper AI returns verbatim quotes from the full text · source: preprint-html

Answers must be backed by verbatim quotes from this paper's full text. Hallucinated quotes are dropped automatically; if no verbatim passage answers the question, we say so. How this works

Citation neighborhood (no data yet)

We don't have any in-corpus citations linked to this paper yet. This is a recent paper (2025) — citers typically take a year or two to land, and the OpenAlex reference graph may still be filling in.

Source provenance

europepmc
last seen: 2026-05-20T01:45:00.602351+00:00
unpaywall
last seen: 2026-05-23T02:00:01.238055+00:00
License: CC-BY-4.0