Fisher-Rao distance and sex differences in disease prevalence trajectories

preprint OA: closed CC-BY-4.0
📄 Open PDF Full text JSON View at publisher
Full text 39,512 characters · extracted from preprint-html · click to expand
Fisher-Rao distance and sex differences in disease prevalence trajectories | medRxiv /* */ /* */ <!-- <!-- /*! * yepnope1.5.4 * (c) WTFPL, GPLv2 */ (function(a,b,c){function d(a){return"[object Function]"==o.call(a)}function e(a){return"string"==typeof a}function f(){}function g(a){return!a||"loaded"==a||"complete"==a||"uninitialized"==a}function h(){var a=p.shift();q=1,a?a.t?m(function(){("c"==a.t?B.injectCss:B.injectJs)(a.s,0,a.a,a.x,a.e,1)},0):(a(),h()):q=0}function i(a,c,d,e,f,i,j){function k(b){if(!o&&g(l.readyState)&&(u.r=o=1,!q&&h(),l.onload=l.onreadystatechange=null,b)){"img"!=a&&m(function(){t.removeChild(l)},50);for(var d in y[c])y[c].hasOwnProperty(d)&&y[c][d].onload()}}var j=j||B.errorTimeout,l=b.createElement(a),o=0,r=0,u={t:d,s:c,e:f,a:i,x:j};1===y[c]&&(r=1,y[c]=[]),"object"==a?l.data=c:(l.src=c,l.type=a),l.width=l.height="0",l.onerror=l.onload=l.onreadystatechange=function(){k.call(this,r)},p.splice(e,0,u),"img"!=a&&(r||2===y[c]?(t.insertBefore(l,s?null:n),m(k,j)):y[c].push(l))}function j(a,b,c,d,f){return q=0,b=b||"j",e(a)?i("c"==b?v:u,a,b,this.i++,c,d,f):(p.splice(this.i++,0,a),1==p.length&&h()),this}function k(){var a=B;return a.loader={load:j,i:0},a}var l=b.documentElement,m=a.setTimeout,n=b.getElementsByTagName("script")[0],o={}.toString,p=[],q=0,r="MozAppearance"in l.style,s=r&&!!b.createRange().compareNode,t=s?l:n.parentNode,l=a.opera&&"[object Opera]"==o.call(a.opera),l=!!b.attachEvent&&!l,u=r?"object":l?"script":"img",v=l?"script":u,w=Array.isArray||function(a){return"[object Array]"==o.call(a)},x=[],y={},z={timeout:function(a,b){return b.length&&(a.timeout=b[0]),a}},A,B;B=function(a){function b(a){var a=a.split("!"),b=x.length,c=a.pop(),d=a.length,c={url:c,origUrl:c,prefixes:a},e,f,g;for(f=0;f<d;f++)g=a[f].split("="),(e=z[g.shift()])&&(c=e(c,g));for(f=0;f<b;f++)c=x[f](c);return c}function g(a,e,f,g,h){var i=b(a),j=i.autoCallback;i.url.split(".").pop().split("?").shift(),i.bypass||(e&&(e=d(e)?e:e[a]||e[g]||e[a.split("/").pop().split("?")[0]]),i.instead?i.instead(a,e,f,g,h):(y[i.url]?i.noexec=!0:y[i.url]=1,f.load(i.url,i.forceCSS||!i.forceJS&&"css"==i.url.split(".").pop().split("?").shift()?"c":c,i.noexec,i.attrs,i.timeout),(d(e)||d(j))&&f.load(function(){k(),e&&e(i.origUrl,h,g),j&&j(i.origUrl,h,g),y[i.url]=2})))}function h(a,b){function c(a,c){if(a){if(e(a))c||(j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}),g(a,j,b,0,h);else if(Object(a)===a)for(n in m=function(){var b=0,c;for(c in a)a.hasOwnProperty(c)&&b++;return b}(),a)a.hasOwnProperty(n)&&(!c&&!--m&&(d(j)?j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}:j[n]=function(a){return function(){var b=[].slice.call(arguments);a&&a.apply(this,b),l()}}(k[n])),g(a[n],j,b,n,h))}else!c&&l()}var h=!!a.test,i=a.load||a.both,j=a.callback||f,k=j,l=a.complete||f,m,n;c(h?a.yep:a.nope,!!i),i&&c(i)}var i,j,l=this.yepnope.loader;if(e(a))g(a,0,l,0);else if(w(a))for(i=0;i (function(w,d,s,l,i){w[l]=w[l]||[];w[l].push({'gtm.start':new Date().getTime(),event:'gtm.js'});var f=d.getElementsByTagName(s)[0];var j=d.createElement(s);var dl=l!='dataLayer'?'&l='+l:'';j.src='//www.googletagmanager.com/gtm.js?id='+i+dl;j.type='text/javascript';j.async=true;f.parentNode.insertBefore(j,f);})(window,document,'script','dataLayer','GTM-P4HH5NV'); Skip to main content Home About Submit ALERTS / RSS Search for this keyword Advanced Search Fisher-Rao distance and sex differences in disease prevalence trajectories View ORCID Profile José Manuel Rodríguez Caballero doi: https://doi.org/10.1101/2025.11.14.25340249 José Manuel Rodríguez Caballero 1 Département de mathématiques et de statistique, Université Laval Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for José Manuel Rodríguez Caballero For correspondence: jose-manuel.rodriguez-caballero.1{at}ulaval.ca Abstract Full Text Info/History Metrics Supplementary material Data/Code Preview PDF Abstract Objectives We introduce a new application of the Fisher–Rao geodesic distance to quantify sex differences in age-stratified chronic-disease prevalence trajectories, modelling those trajectories as dynami-cal systems on the hyperbolic plane and using GBD 2021 data. Methods We analysed prevalence for 10 major chronic conditions across three regions—US states (50 states + DC), 24 Western European countries, and 47 Japanese prefectures—over 1990–2019. We logit-transformed prevalence and summarised each age-sex cohort by normal-approximation parameters ( µ, σ ), which were then embedded in the hyperbolic plane. Sex differences were quantified as the difference between the total Fisher–Rao trajectory lengths for males and females. We assessed cross-regional consistency using parametric (mean differences) and nonparametric (Cohen’s g) summaries, and compared Fisher–Rao results to KL divergence, absolute mean differences, and absolute SD differences. Study design Cross-sectional analysis of GBD 2021 prevalence data modelled as trajectories in the hyperbolic plane. Results The Fisher–Rao distance showed greater cross-regional consistency than the alternative metrics. Males showed greater trajectory shifts in neoplasms, cardiovascular diseases, chronic respiratory diseases, diabetes/kidney diseases, skin/subcutaneous diseases, and sense organ diseases. Females showed greater shifts in neurological disorders, mental disorders, and substance use disorders. Digestive diseases exhibited mixed patterns. Conclusions This geometry-informed metric outperforms alternatives in assessing sex disparities in disease burdens, enhancing public health surveillance and equity in chronic disease management. Future extensions should incorporate gender dimensions. 1 Introduction The Fisher–Rao metric has its roots in Fisher’s 1922 Fisher information matrix for statistical estimation. [ 1 ]. Rao (1945) formalised this idea as a metric tensor on statistical manifolds and introduced geodesic distances now known as the Rao distance. [ 2 ] This laid the groundwork for information geometry, advanced by Shun-ichi Amari in the 1980s via dual affine connections and applications to machine learning and neural networks [ 3 ]. Recent work applies the Fisher–Rao metric in biological contexts such as generative modelling and optimal transport. The FISHER-FLOW model employs Fisher-Rao reparameterisation for generative modelling over discrete data [ 4 ], evaluated on DNA promoter and enhancer sequences. Related studies optimise cosine schedules in masked diffusion models for biological sequences [ 5 ] and extend to L p -Fisher-Rao metrics with Amari-Čencov α -connections for Finsler geometries [ 6 ]. The Wasserstein-Fisher-Rao metric models optimal transport in leaf venation, blood circulation, and neuronal networks [ 7 ]. In shape analysis, a core area of statistical learning, the Fisher-Rao metric facilitates unsupervised clustering of biological objects by quantifying shape similarities [ 8 ]. In phylogenetics, it arises from character distributions under two-state symmetric Markov models on trees [ 9 ]. It also supports functional data registration for neuroscience spike trains and gene expression [ 10 ]. This paper presents a novel epidemiologic application of the Fisher-Rao geodesic distance to quantify sex-based differences in chronic disease prevalence trajectories across age groups, aligning with multidisciplinary approaches to disease etiology and health equity. We model trajectories as dynamical systems on the hyperbolic plane, representing epidemiological macrostates of population health burdens. Leveraging Global Burden of Disease (GBD) 2021 data for 10 major chronic conditions, we compute a statistic as the difference in total Fisher-Rao distances along male and female trajectories across the US, Western Europe, and Japan (1990–2019). We assess crossregional consistency parametrically and nonparametrically, comparing against Kullback-Leibler divergence, absolute mean differences, and absolute standard deviation differences. This framework addresses novel issues in population-based epidemiology by providing a consistent, geometry-informed metric to characterise sex disparities in disease determinants and outcomes, enhancing public health surveillance and equity in chronic disease management. 2 Materials and Methods 2.1 Model Formulation We developed a model motivated by hyperbolic dynamical systems theory [ 11 , 12 ] to track changes in disease prevalence across five-year age groups stratified by sex. Dynamical systems provide a mathematical framework widely used in biology and medicine [ 13 ] to describe how state variables evolve over time or, as here, across successive age cohorts, analogous to cohort-progression models in epidemiology. To ensure prevalence rates remain realistic and non-negative, we apply a (base 10) logit transformation [ 14 ] and assume a normal distribution for the transformed data. Each epidemiological summary (in logit scale), or macrostate [ 15 ], represents the overall disease burden in a population subset, capturing its average level (mean, denoted µ ) and variability (standard deviation, denoted σ ). These macrostates are positioned on the hyperbolic plane, a curved geometric space suitable for statistical distributions because the metric has an information-theoretic interpretation [ 16 , 17 ]: where ℍ denotes the hyperbolic plane in the Poincaré model, ℝ 2 is two-dimensional real space, and σ > 0 ensures positive variability. In information geometry, the statistical manifold [ 18 ] of the normal distribution is defined as the set ℍ endowed with the Fisher-Rao distance d FR [ 1 , 2 , 3 ], a metric that measures dissimilarity between gaussian random variables and , is given by the formula [ 19 ]: where acosh is the inverse hyperbolic cosine. The general definition of the Fisher-Rao distance [ 20 ], involving differential geometry, will not be used in the present article. Age groups are defined in five-year intervals as 𝒜 = { t k : k ∈ ℕ}, where t k = [5 k , 5 k + 4] and ℕ denotes the natural numbers starting at 0. In practice, we consider k = 0, …, 18, corresponding to the age ranges 0–4 through 90–94 years. Biological sex categories are 𝒮 = {male, female}, consistent with the SAGER guidelines [ 21 ] and restricted to sex because the dataset does not include gender information [ 22 ]. The population space X , containing all possible populations, evolves under a mapping f : X → X , with iterations x n +1 = f ( x n ) representing aging 5 years, and the initial condition x 0 = x ∈ X . The macrostate map p : X → ℍ assigns p ( x ) = ( µ, σ ). Subsets for sex φ and age t evolve as . From Global Burden of Disease (GBD) 2021 data [ 22 ], we derive macrostate sequence p ( x 0 ), p ( x 1 ), …, p ( x 18 ) of x 0 , x 1 , …, x 18 , or disease prevalence trajectories, for each sex φ : illustrated in Figures 1 and 2 for chronic respiratory diseases in California, 1990, by sex. Download figure Open in new tab Figure 1. Trajectories in ( µ, σ ) space for chronic respiratory diseases in California (1990). Markers indicate successive time points (age groups); connecting lines show the temporal path of the parameter estimates. Sex: Male. Download figure Open in new tab Figure 2. Trajectories in ( µ, σ ) space for chronic respiratory diseases in California (1990). Markers indicate successive time points (age groups); connecting lines show the temporal path of the parameter estimates. Sex: Female. To reconcile the dynamical-systems framing with cross-sectional age slices we adopt a time-independent (autonomous) model for aging: the map f : X → X that advances a population state by one five-year step is assumed not to depend on calendar time. Equivalently, for any population state x and any calendar year t we assume the same aging rule applies, so that x n +1 = f ( x n ) has the same meaning whether it represents cohort B moved forward five years or cohort A observed five years older. Under this stationarity assumption a five-year older age slice in year t may be interpreted, within the model, as the same cohort observed in year t + 5, which permits treating cross-sectional age-profiles as synthetic cohort trajectories. We emphasize that this is a simplification: it ignores period effects (secular trends, epidemics, policy changes), cohort-specific exposures, selective mortality, migration, and other calendar-time heterogeneities that can make period age-profiles an imperfect proxy for true longitudinal cohort change. To assess robustness, we compare results across multiple calendar years. 2.2 Model Analysis To quantify sex differences in prevalence evolution, we compute d = d male − d female , where d φ is the total trajectory length for sex φ : providing a geometrically meaningful notion of length for epidemiological shifts. We analyse d parametrically, assuming a normal distribution d ~ 𝒩 ( µ, σ 2 ) to estimate means and variances, and nonparametrically via the frequency of d > 0. Cumulative distances are plotted for intuition, as in Figure 3 for chronic respiratory diseases. Download figure Open in new tab Figure 3. Cumulative Fisher-Rao distance by sex for chronic respiratory diseases in California (1990). The horizontal axis is the centre 5 r + 2 of the age group t r =]5 r , 5 r + 4]. 2.3 Fitting the model to data We applied our model to data from the Global Burden of Disease Study, manually retrieved from the IHME website [ 22 ]. The R scripts used for data cleaning and analysis are provided in the supplementary material. 2.3.1 Data Sources Drawing on IHME’s GBD 2021 estimates [ 22 , 23 ], we examine prevalence per 100,000, stratified by age, sex, location, and year, with 95% uncertainty intervals from systematic reviews and integrations [ 24 , 25 ]. Focusing on the US (51 locations: 50 states and the District of Columbia), Western Europe (24 countries: Andorra, Austria, Belgium, Cyprus, Denmark, Finland, France, Germany, Greece, Iceland, Ireland, Israel, Italy, Luxembourg, Malta, Monaco, Netherlands, Norway, Portugal, San Marino, Spain, Sweden, Switzerland, United Kingdom), and Japan (47 prefectures), we compare age-specific tra-jectories to reveal sex differences, embracing the data’s open-ended nature over rigid unification. 2.3.2 Data Extraction and Preprocessing Age midpoints are assigned as 2 for < 5, incrementing to 92 for 90–94. We logit-transform 1 the prevalence assuming normality: where Φ −1 (0.975) ≈ 1.96 is the 97.5th percentile point of the standard normal distribution. Processed CSV files—one per region—contain age, sex, disease, subregional location, year, and the parameters µ and σ . Data from the pandemic years 2020–2021 were excluded to mitigate bias [ 26 ]. 2.4 Cross-Regional Consistency We evaluated the consistency of sex-specific shifts in age-stratified disease prevalence trajectories across the United States, Western Europe, and Japan from 1990 to 2019, using four metrics to quantify total trajectory shifts: absolute mean difference ( µ -distance) absolute standard deviation difference ( σ -distance) Kullback-Leibler divergence (KL-divergence) [ 27 ] and Fisher-Rao distance (FR-distance) For each sex φ , disease, year, and location, the total shift was the sum of distances across 18 consecutive 5-year age groups, assuming normal distributions for prevalence parameters. In the parametric approach, sex differences were computed as per location (inside a region), then averaged to estimate mean µ per region, assuming normality of d f . Consistency was defined as the number of diseases (out of 10) with uniform sign of µ across all regions (all positive or all negative). If µ = 0 in any region, it is interpreted as an inconsistency, as zero has no sign. In the nonparametric approach, Cohen’s g measured the probability of greater male shifts minus 0.5 across locations per region, i.e., where n is the number of locations and 1 {·} is the indicator function. According to Jacob Cohen [ 28 ], the effect size g is conventionally interpreted as small, medium, or large when | g ≈ |0.05, | g | ≈ 0.15, and | g |≈ 0.25, respectively. Consistency was the number of diseases with uniform sign of g across regions (all positive or all negative). If g = 0 in any region, it is interpreted as an inconsistency, as zero has no sign. 2.5 Sex-Specific Shifts Using FR-distance, we computed sex differences d = d male − d female per location, then derived regional summary statistics: Cohen’s g , mean µ , standard deviation σ , skewness γ 1 , excess kurtosis κ , Shapiro-Wilk p-value p SW for normality, and t-test p-value p t for mean deviation from zero. Results for 1990 exemplify patterns across 1990–2019. It is important to note the ambiguity in the notation: the prevalence is modelled as being normally distributed on the base-10 logit scale, 𝒩 ( µ, σ 2 ), whereas in the parametric model, we assume d ~ 𝒩 ( µ, σ 2 ). However, the parameters µ and σ in these two contexts are not the same. 2.6 Ethics Statement This study uses publicly available secondary data from IHME GBD 2021 [ 22 ], exempt from ethical review per institutional guidelines and the Declaration of Helsinki. No human subjects were involved. 3 Results 3.1 Cross-Regional Consistency Supplementary table for parametric consistency (1990–2019) show FR-distance yielded the highest consistency (e.g., 10/10 diseases in early 1990s). Supplementary table for nonparametric consistency (1990–2019) confirms FR-distance’s superior performance (e.g., 10/10 in mid-1990s). These findings highlight FR-distance’s utility in capturing geodesic shifts on the hyperbolic plane of normal distribution parameters, offering a novel epidemiologic method for assessing trajectory consistency in population health data. 3.2 Sex-Specific Shifts Diseases with consistently greater male shifts (positive g and µ, p t < 0.05) included neoplasms (supplementary table showing g = 0.50, µ = 11.44 to 17.61 across regions), cardiovascular diseases (supplementary table showing g = 0.27 to 0.50, µ = 0.69 to 4.87), chronic respiratory diseases (supplementary table showing g = 0.21 to 0.50, µ = 1.77 to 13.21), diabetes and kidney diseases (supplementary table showing g = 0.42 to 0.50, µ = 1.82 to 3.91), skin and subcutaneous diseases (supplementary table showing g = 0.50, µ = 5.61 to 12.14), and sense organ diseases (supplementary table showing g = 0.50, µ = 3.79 to 6.92). Diseases with greater female shifts (negative g and µ, p t < 0.05) included neurological disorders (supplementary table showing g = −0.50, µ = −0.86 to −2.78), mental disorders (supplementary table showing g = −0.21 to −0.50, µ = −0.42 to −6.48), and substance use disorders (supplementary table showing g = −0.42 to −0.50, µ = −1.56 to −3.28). Digestive diseases showed mixed patterns, with no significant sex differences in the United States ( p t = 0.19) or Western Europe ( p t = 0.63), but male predominance in Japan ( p t < 0.05; supplementary table showing g = 0.00 to 0.31, µ = 0.07 to 0.54). This application of FR-distance provides a robust, geometry-informed metric for quantifying sex disparities in disease trajectories, enhancing etiologic insights and equity assessments in public health surveillance. 4 Discussion This study introduces a novel application of the Fisher-Rao geodesic distance, rooted in information geometry, to quantify sex-based differences in disease prevalence trajectories across age groups using GBD 2021 data from 1990 to 2019. By modelling trajectories as dynamical systems on the hyperbolic plane, the metric provides superior cross-regional consistency compared to alternatives like Kullback-Leibler divergence, absolute mean differences, and absolute standard deviation differences. Key findings reveal greater male shifts in neoplasms, cardiovascular diseases, chronic respiratory diseases, diabetes and kidney diseases, skin and subcutaneous diseases, and sense organ diseases; greater female shifts in neurological disorders, mental disorders, and substance use disorders; and variable patterns for digestive diseases across the US, Western Europe, and Japan. These results advance epidemiologic methods by offering a geometry-informed tool to assess sex disparities in chronic disease burdens, enhancing public health surveillance and equity assessments. The framework’s consistency supports its use in population-based analyses of disease determinants, aligning with multidisciplinary approaches to etiology. Limitations include data biases from the COVID-19 pandemic—elevated prevalence for major depressive and anxiety disorders, unchanged self-harm rates [ 26 ]—prompting exclusion of 2020–2021 data, and lack of gender information, limiting focus to biological sex. Gender, a multifaceted social determinant, influences health via environmental exposures like air pollution [ 29 ] and requires integration of genderaffirming hormone therapy in frameworks [ 30 ]. To address its complexity, avoid binary models; instead, represent gender as a vector space capturing cultural, social, and relational dimensions using Likert scales [ 31 , 32 , 33 , 34 ]. Future extensions include applying Fisher-Rao distance to gender-based differences, including transgender population, formalising population dynamics to prove theorems for particular models (without aiming to unify biosciences [ 35 ]), and developing a notion of entropy [ 36 ] to answer the question how many microstates (possible populations) correspond to the same macrostate ( µ, σ )? 5 Conclusions This paper introduces an innovative Fisher-Rao geodesic distance framework that models disease prevalence as trajectories on the hyperbolic plane to measure sex-based disparities between age groups with greater cross-regional consistency. Applied to GBD 2021 data for 10 major chronic disease categories in the US, Western Europe, and Japan (1990–2019), it outperforms Kullback-Leibler divergence and absolute mean/standard deviation differences. Males show greater shifts in neoplasms, cardiovascular, chronic respiratory, diabetes/kidney, skin/subcutaneous, and sense organ diseases; females in neurological, mental, and substance use disorders; digestive diseases vary by region. This geometry-informed metric advances epidemiologic methods for assessing disease burden determinants, promoting health equity through population-based analyses of sex differences. Future work should integrate gender dimensions, including transgender populations, to enhance public health surveillance and address inequities. Data Availability All data produced are available online at Global Burden of Disease Study 2021 (GBD 2021) https://ghdx.healthdata.org/gbd-2021 https://ghdx.healthdata.org/gbd-2021 7 Declaration of generative AI and AI-assisted technologies in the writing process During the preparation of this work the author used Grok 4 Heavy for language editing, LaTeX, R code, bibliographic suggestions and brainstorming. The author reviewed and edited the content as needed and takes full responsibility for the content of the published article. 8 Data availability The data is available on the website: https://vizhub.healthdata.org/gbd-results/ A Tables in Parametric Approach View this table: View inline View popup Download powerpoint Table 1: Consistency:1990–1999 (parametric) View this table: View inline View popup Download powerpoint Table 2: Consistency: 2000–2009 (parametric) View this table: View inline View popup Download powerpoint Table 3: Consistency: 2010–2019 (parametric) B Tables in Nonparametric Approach View this table: View inline View popup Download powerpoint Table 4: Consistency: 1990–1999 (nonparamet-ric) View this table: View inline View popup Download powerpoint Table 5: Consistency: 2000–2009 (nonparamet-ric) View this table: View inline View popup Download powerpoint Table 6: Consistency: 2010–2019 (nonparamet-ric) C Tables in Diseases with Greater Male Shifts View this table: View inline View popup Download powerpoint Table 7: Neoplasms parameters (greater male shifts). Year: 1990. View this table: View inline View popup Download powerpoint Table 8: Cardiovascular diseases parameters (greater male shifts). Year: 1990. View this table: View inline View popup Download powerpoint Table 9: Chronic respiratory diseases parameters (greater male shifts). Year: 1990. View this table: View inline View popup Download powerpoint Table 10: Diabetes and kidney diseases parameters (greater male shifts). Year: 1990. View this table: View inline View popup Download powerpoint Table 11: Skin and subcutaneous diseases parameters (greater male shifts). Year: 1990. View this table: View inline View popup Download powerpoint Table 12: Sense organ diseases parameters (greater male shifts). Year: 1990. D Tables in Diseases with Greater Female Shifts View this table: View inline View popup Download powerpoint Table 13: Neurological disorders parameters (greater female shifts). Year: 1990. View this table: View inline View popup Download powerpoint Table 14: Mental disorders parameters (greater female shifts). Year: 1990. View this table: View inline View popup Download powerpoint Table 15: Substance use disorders parameters (greater female shifts). Year: 1990. E Table in Mixed Patterns View this table: View inline View popup Download powerpoint Table 16: Digestive diseases parameters (mixed patterns). Year: 1990. Note that the fact g = 0 in the Western European data corresponds to an inconsistency of the Fisher-Rao distance according to our definition of consistency. 6 Acknowledgements None. Funding: None declared. Competing Interests: None declared. Footnotes ↵ 1 We use base-10 logarithms for intuition, reflecting the ubiquity of the decimal system. Abbreviations GBD Global Burden of Disease IHME Institute for Health Metrics and Evaluation FR Fisher-Rao KL Kullback-Leibler SAGER Sex and Gender Equity in Research References [1]. ↵ R. A. Fisher , On the mathematical foundations of theoretical statistics , Philosophical transactions of the Royal Society of London. Series A, containing papers of a mathematical or physical character 222 ( 594-604 ) ( 1922 ) 309 – 368 . doi: 10.1098/rsta.1922.0009 . OpenUrl CrossRef [2]. ↵ C. R. Rao , Information and the Accuracy Attainable in the Estimation of Statistical Parameters , Springer New York , New York, NY , 1992 , pp. 235 – 247 . doi: 10.1007/978-1-4612-0919-5_16 . URL https://doi.org/10.1007/978-1-4612-0919-5_16 OpenUrl CrossRef [3]. ↵ S.-i. Amari , Differential-Geometrical Methods in Statistics , Vol. 28 of Lecture Notes in Statistics, Springer-Verlag Berlin Heidelberg, Berlin , 1985 . doi: 10.1007/978-1-4612-5056-2 . URL https://link.springer.com/book/10.1007/978-1-4612-5056-2 OpenUrl CrossRef [4]. ↵ A. Globerson , L. Mackey , D. Belgrave , A. Fan , U. Paquet , J. Tomczak , C. Zhang O. Davis , S. Kessler , M. Petrache , I. I. Ceylan , M. Bronstein , A. J. Bose , Fisher flow matching for generative modeling over discrete data , in: A. Globerson , L. Mackey , D. Belgrave , A. Fan , U. Paquet , J. Tomczak , C. Zhang (Eds.), Advances in Neural Information Processing Systems , Vol. 37 , Curran Associates, Inc ., 2024 , pp. 139054 – 139084 . URL https://proceedings.neurips.cc/paper_files/paper/2024/file/fadec8f2e65f181d777507d1df69b92f-Paper-Conference.pdf OpenUrl [5]. ↵ J. Zheng , Z. Lu , Universal response inequalities beyond steady states via trajectory information geometry , Phys. Rev. E 112 ( 2025 ) L012103 . doi: 10.1103/scg2-qkxv . URL https://link.aps.org/doi/10.1103/scg2-qkxv OpenUrl CrossRef [6]. ↵ M. Bauer , A. Le Brigant , Y. Lu , C. Maor , The l p -fisher–rao metric and amari–Č encov α-connections , Calculus of Variations and Partial Differential Equations 63 ( 2 ) ( 2024 ) 56 . doi: 10.1007/s00526-024-02660-5 . URL https://doi.org/10.1007/s00526-024-02660-5 OpenUrl CrossRef [7]. ↵ J. Haskovec , P. Markowich , S. Portaro , Measure-based approach to mesoscopic modeling of optimal transportation networks , arXiv preprint arxiv: 2401.07922 ( 2024 ). [8]. ↵ S. A. Gattone , A. De Sanctis , T. Russo , D. Pulcini , A shape distance based on the Fisher–Rao metric and its application for shapes clustering , Physica A: Statistical Mechanics and its Applications 487 ( 2017 ) 93 – 102 . doi: 10.1016/j.physa.2017.06.014 . URL https://www.sciencedirect.com/science/article/pii/S0378437117306556 OpenUrl CrossRef [9]. ↵ M. K. Garba , T. M. W. Nye , J. Lueg , S. F. Huckemann , Information geometry for phylogenetic trees , Journal of Mathematical Biology 82 ( 3 ) ( 2021 ) 19 . doi: 10.1007/s00285-021-01553-x . URL https://doi.org/10.1007/s00285-021-01553-x OpenUrl CrossRef PubMed [10]. ↵ A. Srivastava , W. Wu , S. Kurtek , E. Klassen , J. S. Marron , Registration of functional data using Fisher-Rao metric , arXiv preprint arxiv: 1103.3817 ( 2011 ). [11]. ↵ J.-C. Yoccoz , Introduction to Hyperbolic Dynamics , Springer Netherlands, Dordrecht , 1995 , pp. 265 – 291 . doi: 10.1007/978-94-015-8439-5_11 . OpenUrl CrossRef [12]. ↵ J. Franchi , Y. Le Jan , Hyperbolic dynamics and Brownian motion: an introduction, Oxford Mathematical Monographs , Oxford , 2012 . doi: 10.1093/acprof:oso/9780199654109.001.0001 . OpenUrl CrossRef [13]. ↵ K. Aihara , H. Suzuki , Theory of hybrid dynamical systems and its applica-tions to biological and medical systems , Philosophical Transactions of the Royal Society A 368 ( 2010 ) 4893 – 4914 . doi: 10.1098/rsta.2010.0237 . URL https://doi.org/10.1098/rsta.2010.0237 OpenUrl CrossRef PubMed [14]. ↵ D. G. Kleinbaum , M. Klein , Logistic Regression: A Self-Learning Text , 3rd Edition, Statistics for Biology and Health, Springer New York, New York, NY , 2010 . doi: 10.1007/978-1-4419-1742-3 . URL https://link.springer.com/book/10.1007/978-1-4419-1742-3 OpenUrl CrossRef [15]. ↵ A. Gupta , D. Jain , Revisiting the concept of macrostates and microstates in a degenerate system: Finite and infinite levels , Resonance – Journal of Science Education 30 ( 10 ) ( 2025 ) 1329 – 1351 , open-access article (Indian Academy of Sciences). Accessed 2025-10-21 . URL https://www.ias.ac.in/describe/article/reso/030/10/1329-1351?lang=English OpenUrl [16]. ↵ N. Ay , J. Jost , H.V. Lê , L. Schwachhöfer , Information Geometry, Vol. 64 of Ergebnisse der Mathematik und ihrer Grenzgebiete. 3 . Folge /A Series of Modern Surveys in Mathematics , Springer , Cham , 2017 . doi: 10.1007/978-3-319-56478-4 . OpenUrl CrossRef [17]. ↵ J. Hofrichter , J. Jost , T. D. Tran , Information Geometry and Population Genetics: The Mathematical Structure of the Wright-Fisher Model , Vol. 62 of Understanding Complex Systems , Springer, Cham , 2017 . [18]. ↵ S.-i. Amari , Information Geometry and Its Applications , Vol. 194 of Applied Mathematical Sciences , Springer, Tokyo , 2016 . doi: 10.1007/978-4-431-55978-8 . OpenUrl CrossRef [19]. ↵ F. Nielsen , A Simple Approximation Method for the Fisher–Rao Distance between Multivariate Normal Distributions , Entropy 25 ( 4 ) ( 2023 ) 654 . doi: 10.3390/e25040654 . OpenUrl CrossRef PubMed [20]. ↵ S.-i. Amari , H. Nagaoka , Methods of Information Geometry, Vol. 191 of Translations of Mathematical Monographs , American Mathematical Society, Providence, RI , 2000 . doi: 10.1109/TIT.2009.2016067 . OpenUrl CrossRef [21]. ↵ V. M. Miller , M. Rice , L. Schiebinger , M. R. Jenkins , J. Werbinski , A. Núñez , S. Wood , T. R. Viggiano , L. T. Shuster , Embedding concepts of sex and gender health differences into medical curricula , J Womens Health (Larchmt) 22 ( 3 ) ( 2013 ) 194 – 202 , epub 2013 Feb 15. doi: 10.1089/jwh.2012.4193 . OpenUrl CrossRef Web of Science [22]. ↵ Institute for Health Metrics and Evaluation (IHME ), Gbd results , https://vizhub.healthdata.org/gbd-results/ , accessed: September 2025 ( 2024 ). URL https://vizhub.healthdata.org/gbd-results [23]. ↵ A. J. Ferrari , D. F. Santomauro , A. Aali , Y. H. Abate , C. Abbafati , H. Abbastabar , S. Abd ElHafeez , M. Abdelmasseh , S. Abd-Elsalam , A. Abdollahi , et al. , Global incidence, prevalence, years lived with disability (YLDs), disability-adjusted life-years (DALYs), and healthy life expectancy (HALE) for 371 diseases and injuries in 204 countries and territories and 811 subnational locations, 1990–2021: a systematic analysis for the Global Burden of Disease Study 2021 , The Lancet 403 ( 10440 ) ( 2024 ) 2133 – 2161 . doi: 10.1016/S0140-6736(24)00757-8 . OpenUrl CrossRef [24]. ↵ D. G. Kleinbaum , L. L. Kupper , H. Morgenstern , Epidemiologic Research: Principles and Quantitative Methods, Lifetime Learning Publications , Belmont, Calif ., 1982 . [25]. ↵ K. J. Rothman , K. F. Huybrechts , E. J. Murray , Epidemiology: An Introduction , Oxford University Press , New York , 2025 . doi: 10.1093/oso/9780197751541.001.0001 . OpenUrl CrossRef [26]. ↵ W. Jang , H. Cho , S. Kim , L. Boyer , G. Fond , J. Kang , C. J. Nehs , D. Pizzol , S. Lee , J. Oh , H. J. Kim , Y. Son , H. Lee , D. K. Yon , Global burden of anxiety, depression, and self-harm (1990–2021) and the impact of the COVID-19 pandemic , Journal of Affective Disorders 392 ( 2025 ) 120201 . doi: 10.1016/j.jad.2025.120201 . URL https://www.sciencedirect.com/science/article/pii/S016503272501643X OpenUrl CrossRef PubMed [27]. ↵ D. I. Belov , R. D. Armstrong , Distributions of the Kullback–Leibler divergence with applications , British Journal of Mathematical and Statistical Psychology 64 ( 2 ) ( 2011 ) 291 – 309 . doi: 10.1348/000711010X522227 . OpenUrl CrossRef Web of Science [28]. ↵ J. Cohen , A power primer , Psychological Bulletin 112 ( 1 ) ( 1992 ) 155 – 159 . doi: 10.1037/0033-2909.112.1.155 . OpenUrl CrossRef PubMed Web of Science [29]. ↵ J. E. Clougherty , A growing role for gender analysis in air pollution epidemiology , Environmental health perspectives 118 ( 2 ) ( 2010 ) 167 – 176 . OpenUrl CrossRef PubMed Web of Science [30]. ↵ Q. Zhang , M. Goodman , N. Adams , T. Corneil , L. Hashemi , B. P. C. Kreukels , J. Motmans , R. L. Snyder , E. Coleman , Epidemiological considerations in transgender health: A systematic review with focus on higher quality data ., International journal of transgender health 21 2 ( 2020 ) 125 – 137 . doi: 10.1080/26895269.2020.1753136 . URL https://api.semanticscholar.org/CorpusID:218828390 OpenUrl CrossRef [31]. ↵ G. R. Bauer , Sex and gender multidimensionality in epidemiologic research , American Journal of Epidemiology 192 ( 1 ) ( 2023 ) 122 – 132 . doi: 10.1093/aje/kwac173 . OpenUrl CrossRef PubMed [32]. ↵ A. V. Ballering , T. C. Olde Hartman , J. G. Rosmalen , Gender scores in epidemiological research: methods, advantages and implications , The Lancet Regional Health Europe 43 ( 2024 ) 100962 . doi: 10.1016/j.lanepe.2024.100962 . URL https://www.sciencedirect.com/science/article/pii/S2666776224001297 OpenUrl CrossRef PubMed [33]. ↵ H. Colineaux , A. Soulier , B. Lepage , M. Kelly-Irving , Considering sex and gender in epidemiology: a challenge beyond terminology. from conceptual analysis to methodological strategies , Biology of Sex Differences 13 ( 1 ) ( 2022 ) 23 . doi: 10.1186/s13293-022-00430-6 . URL https://doi.org/10.1186/s13293-022-00430-6 OpenUrl CrossRef PubMed [34]. ↵ C. Miani , L. Wandschneider , J. Niemann , S. Batram-Zantvoort , O. Razum , Measurement of gender as a social determinant of health in epidemiology—a scoping review , PLoS One 16 ( 11 ) ( 2021 ) e0259223 . doi: 10.1371/journal.pone.0259223 . OpenUrl CrossRef PubMed [35]. ↵ L. Gyllingberg , A. Birhane , D. J. Sumpter , The lost art of mathematical modelling , Mathematical Biosciences 362 ( 2023 ) 109033 . doi: 10.1016/j.mbs.2023.109033 . URL https://www.sciencedirect.com/science/article/pii/S0025556423000743 OpenUrl CrossRef PubMed [36]. ↵ M. Gromov , In a search for a structure, part 1: On entropy , Entropy 17 ( 2013 ) 1273 – 1277 . doi: 10.4171/120-1/4 . OpenUrl CrossRef View the discussion thread. Back to top Previous Next Posted November 17, 2025. Download PDF Supplementary Material Data/Code Email Thank you for your interest in spreading the word about medRxiv. NOTE: Your email address is requested solely to identify you as the sender of this article. Your Email * Your Name * Send To * Enter multiple addresses on separate lines or separate them with commas. You are going to email the following Fisher-Rao distance and sex differences in disease prevalence trajectories Message Subject (Your Name) has forwarded a page to you from medRxiv Message Body (Your Name) thought you would like to see this page from the medRxiv website. Your Personal Message CAPTCHA This question is for testing whether or not you are a human visitor and to prevent automated spam submissions. Share Fisher-Rao distance and sex differences in disease prevalence trajectories José Manuel Rodríguez Caballero medRxiv 2025.11.14.25340249; doi: https://doi.org/10.1101/2025.11.14.25340249 Share This Article: Copy Citation Tools Fisher-Rao distance and sex differences in disease prevalence trajectories José Manuel Rodríguez Caballero medRxiv 2025.11.14.25340249; doi: https://doi.org/10.1101/2025.11.14.25340249 Citation Manager Formats BibTeX Bookends EasyBib EndNote (tagged) EndNote 8 (xml) Medlars Mendeley Papers RefWorks Tagged Ref Manager RIS Zotero Tweet Widget Facebook Like Google Plus One Subject Area Epidemiology Subject Areas All Articles Addiction Medicine (568) Allergy and Immunology (863) Anesthesia (299) Cardiovascular Medicine (4426) Dentistry and Oral Medicine (443) Dermatology (382) Emergency Medicine (607) Endocrinology (including Diabetes Mellitus and Metabolic Disease) (1507) Epidemiology (15222) Forensic Medicine (30) Gastroenterology (1123) Genetic and Genomic Medicine (6589) Geriatric Medicine (667) Health Economics (997) Health Informatics (4525) Health Policy (1368) Health Systems and Quality Improvement (1612) Hematology (540) HIV/AIDS (1264) Infectious Diseases (except HIV/AIDS) (15910) Intensive Care and Critical Care Medicine (1103) Medical Education (623) Medical Ethics (145) Nephrology (667) Neurology (6588) Nursing (346) Nutrition (998) Obstetrics and Gynecology (1143) Occupational and Environmental Health (956) Oncology (3331) Ophthalmology (971) Orthopedics (369) Otolaryngology (420) Pain Medicine (435) Palliative Medicine (129) Pathology (663) Pediatrics (1690) Pharmacology and Therapeutics (691) Primary Care Research (710) Psychiatry and Clinical Psychology (5440) Public and Global Health (9221) Radiology and Imaging (2195) Rehabilitation Medicine and Physical Therapy (1369) Respiratory Medicine (1196) Rheumatology (593) Sexual and Reproductive Health (710) Sports Medicine (529) Surgery (711) Toxicology (99) Transplantation (289) Urology (265) (function(){function c(){var b=a.contentDocument||a.contentWindow.document;if(b){var d=b.createElement('script');d.innerHTML="window.__CF$cv$params={r:'9ffed7c6ee6452ad',t:'MTc3OTQ4NDU5Ng=='};var a=document.createElement('script');a.src='/cdn-cgi/challenge-platform/scripts/jsd/main.js';document.getElementsByTagName('head')[0].appendChild(a);";b.getElementsByTagName('head')[0].appendChild(d)}}if(document.body){var a=document.createElement('iframe');a.height=1;a.width=1;a.style.position='absolute';a.style.top=0;a.style.left=0;a.style.border='none';a.style.visibility='hidden';document.body.appendChild(a);if('loading'!==document.readyState)c();else if(window.addEventListener)document.addEventListener('DOMContentLoaded',c);else{var e=document.onreadystatechange||function(){};document.onreadystatechange=function(b){e(b);'loading'!==document.readyState&&(document.onreadystatechange=e,c())}}}})();

Text is read by the "Ask this paper" AI Q&A widget below. Extraction quality varies by source — PMC NXML preserves structure cleanly, OA-HTML may include some navigation residue, and OA-PDF can have broken hyphenation. The publisher copy (via DOI) is the canonical version.

My notes (saved in your browser only)

Ask this paper AI returns verbatim quotes from the full text · source: preprint-html

Answers must be backed by verbatim quotes from this paper's full text. Hallucinated quotes are dropped automatically; if no verbatim passage answers the question, we say so. How this works

Citation neighborhood (no data yet)

We don't have any in-corpus citations linked to this paper yet. This is a recent paper (2025) — citers typically take a year or two to land, and the OpenAlex reference graph may still be filling in.

Source provenance

europepmc
last seen: 2026-05-20T01:45:00.602351+00:00
unpaywall
last seen: 2026-05-23T02:00:01.238055+00:00
License: CC-BY-4.0