Full text
44,208 characters
· extracted from
preprint-html
· click to expand
Exploring Novel Biomarkers for Early Detection of Osteoporosis | medRxiv /* */ /* */ <!-- <!-- /*! * yepnope1.5.4 * (c) WTFPL, GPLv2 */ (function(a,b,c){function d(a){return"[object Function]"==o.call(a)}function e(a){return"string"==typeof a}function f(){}function g(a){return!a||"loaded"==a||"complete"==a||"uninitialized"==a}function h(){var a=p.shift();q=1,a?a.t?m(function(){("c"==a.t?B.injectCss:B.injectJs)(a.s,0,a.a,a.x,a.e,1)},0):(a(),h()):q=0}function i(a,c,d,e,f,i,j){function k(b){if(!o&&g(l.readyState)&&(u.r=o=1,!q&&h(),l.onload=l.onreadystatechange=null,b)){"img"!=a&&m(function(){t.removeChild(l)},50);for(var d in y[c])y[c].hasOwnProperty(d)&&y[c][d].onload()}}var j=j||B.errorTimeout,l=b.createElement(a),o=0,r=0,u={t:d,s:c,e:f,a:i,x:j};1===y[c]&&(r=1,y[c]=[]),"object"==a?l.data=c:(l.src=c,l.type=a),l.width=l.height="0",l.onerror=l.onload=l.onreadystatechange=function(){k.call(this,r)},p.splice(e,0,u),"img"!=a&&(r||2===y[c]?(t.insertBefore(l,s?null:n),m(k,j)):y[c].push(l))}function j(a,b,c,d,f){return q=0,b=b||"j",e(a)?i("c"==b?v:u,a,b,this.i++,c,d,f):(p.splice(this.i++,0,a),1==p.length&&h()),this}function k(){var a=B;return a.loader={load:j,i:0},a}var l=b.documentElement,m=a.setTimeout,n=b.getElementsByTagName("script")[0],o={}.toString,p=[],q=0,r="MozAppearance"in l.style,s=r&&!!b.createRange().compareNode,t=s?l:n.parentNode,l=a.opera&&"[object Opera]"==o.call(a.opera),l=!!b.attachEvent&&!l,u=r?"object":l?"script":"img",v=l?"script":u,w=Array.isArray||function(a){return"[object Array]"==o.call(a)},x=[],y={},z={timeout:function(a,b){return b.length&&(a.timeout=b[0]),a}},A,B;B=function(a){function b(a){var a=a.split("!"),b=x.length,c=a.pop(),d=a.length,c={url:c,origUrl:c,prefixes:a},e,f,g;for(f=0;f<d;f++)g=a[f].split("="),(e=z[g.shift()])&&(c=e(c,g));for(f=0;f<b;f++)c=x[f](c);return c}function g(a,e,f,g,h){var i=b(a),j=i.autoCallback;i.url.split(".").pop().split("?").shift(),i.bypass||(e&&(e=d(e)?e:e[a]||e[g]||e[a.split("/").pop().split("?")[0]]),i.instead?i.instead(a,e,f,g,h):(y[i.url]?i.noexec=!0:y[i.url]=1,f.load(i.url,i.forceCSS||!i.forceJS&&"css"==i.url.split(".").pop().split("?").shift()?"c":c,i.noexec,i.attrs,i.timeout),(d(e)||d(j))&&f.load(function(){k(),e&&e(i.origUrl,h,g),j&&j(i.origUrl,h,g),y[i.url]=2})))}function h(a,b){function c(a,c){if(a){if(e(a))c||(j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}),g(a,j,b,0,h);else if(Object(a)===a)for(n in m=function(){var b=0,c;for(c in a)a.hasOwnProperty(c)&&b++;return b}(),a)a.hasOwnProperty(n)&&(!c&&!--m&&(d(j)?j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}:j[n]=function(a){return function(){var b=[].slice.call(arguments);a&&a.apply(this,b),l()}}(k[n])),g(a[n],j,b,n,h))}else!c&&l()}var h=!!a.test,i=a.load||a.both,j=a.callback||f,k=j,l=a.complete||f,m,n;c(h?a.yep:a.nope,!!i),i&&c(i)}var i,j,l=this.yepnope.loader;if(e(a))g(a,0,l,0);else if(w(a))for(i=0;i (function(w,d,s,l,i){w[l]=w[l]||[];w[l].push({'gtm.start':new Date().getTime(),event:'gtm.js'});var f=d.getElementsByTagName(s)[0];var j=d.createElement(s);var dl=l!='dataLayer'?'&l='+l:'';j.src='//www.googletagmanager.com/gtm.js?id='+i+dl;j.type='text/javascript';j.async=true;f.parentNode.insertBefore(j,f);})(window,document,'script','dataLayer','GTM-P4HH5NV'); Skip to main content Home About Submit ALERTS / RSS Search for this keyword Advanced Search Exploring Novel Biomarkers for Early Detection of Osteoporosis View ORCID Profile Filipe Ricardo Carvalho , Virna Ferreira Queiroz , View ORCID Profile Paulo Jorge Gavaia doi: https://doi.org/10.1101/2025.05.30.25328641 Filipe Ricardo Carvalho 1 Faculty of Medicine and Biomedical Sciences, University of Algarve , Faro, Portugal 2 Centre of Marine Sciences (CCMAR/CIMAR LA), University of Algarve, Faro, Portugal Universidade do Algarve - Campus de Gambelas , 8005-139 Faro, Portugal Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Filipe Ricardo Carvalho For correspondence: frcarvalho{at}ualg.pt Virna Ferreira Queiroz 1 Faculty of Medicine and Biomedical Sciences, University of Algarve , Faro, Portugal Find this author on Google Scholar Find this author on PubMed Search for this author on this site Paulo Jorge Gavaia 1 Faculty of Medicine and Biomedical Sciences, University of Algarve , Faro, Portugal 2 Centre of Marine Sciences (CCMAR/CIMAR LA), University of Algarve, Faro, Portugal Universidade do Algarve - Campus de Gambelas , 8005-139 Faro, Portugal Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Paulo Jorge Gavaia Abstract Full Text Info/History Metrics Data/Code Preview PDF Abstract Purpose/Introduction Osteoporosis is characterized by diminished BMD and deteriorated bone microstructure, significantly increasing fracture susceptibility. This study leverages machine learning for identifying key predictors of osteoporosis, potentially improving non-invasive screening tools. Methods We utilized the “Bone Mineral Density” dataset from Harvard University, categorizing variables into demographics, bone loss prevention treatments, and lifestyle/associated pathologies. A Boolean variable “OP” was defined to indicate presence of osteoporosis. Data preprocessing included imputation for missing values and normalization. Statistical analyses such as Welch’s T-test and multiple linear regression were conducted to identify significant markers. Additionally, unsupervised learning techniques, like Louvain clustering, were used to uncover natural data patterns, while supervised learning models aimed to predict osteoporosis. Results The study identified significant markers associated with osteoporosis, including magnesium levels, high- and low-density lipoproteins, chronic obstructive pulmonary disease, and chronic kidney disease. Multiple linear regression analysis revealed robust associations between osteoporosis and biomarkers such as ALT, BUN, CREA, LDL-C, and Mg, even after controlling for age, height, and weight. Among supervised learning models, Random Forest and Gradient Boosting algorithms showed the highest accuracy in predicting osteoporosis, with Random Forest identified as the preferred model. Conclusions In our work, it was possible to identify the main biochemical parameters and clinical histories that are potential predictors of osteoporosis. The findings suggest that integrating machine learning techniques with clinical data can enhance early detection and intervention strategies, ultimately improving patient outcomes. Further refinement is recommended to validate these results across diverse populations and improve predictive models for broader application. Introduction Osteoporosis (OP) is a progressive skeletal disorder characterized by diminished bone mineral density (BMD) and deterioration of bone microstructure ( 1 , 2 ). This condition significantly increases bone fragility and susceptibility to fractures ( 3 ). While reduced BMD is a key indicator of fracture risk, other factors such as bone geometry, microarchitecture, and size also contribute to overall bone strength and resilience against trauma ( 2 , 4 ). Often referred to as a “silent disease,” OP typically remains undetected until a fracture occurs, requiring imaging and radiologic tests for diagnosis. Fragility fractures, the most evident clinical manifestation of OP, commonly occur in the hip, spine, and distal radius ( 5 – 7 ). The relationship between fracture risk and BMD varies between men and women, influenced by age-related differences in bone weakness progression ( 2 , 8 , 9 ). The condition is classified into two main categories: primary OP, associated with age and decreased sex hormones (particularly estrogen), and secondary OP, linked to other pathologies or medical treatments ( 10 ). Primary OP disproportionately affects women due to their naturally lower bone density and the impact of menopause. However, estrogen deficiency also plays a role in male OP, as bone cells in both sexes possess estrogen receptors. Men with OP are more likely to experience secondary forms of the disease, often due to underlying pathologies or medication-induced bone loss ( 5 , 11 ). The elderly population, which is rapidly growing worldwide, faces the highest risk of OP. This demographic shift presents increasing social and economic challenges related to the disease. Age-related decline in bone mass and increased fracture risk are compounded by other factors such as low body mass index, alcohol and tobacco consumption, history of falls, previous fractures, family history of OP, and certain chronic and inflammatory diseases ( 12 – 14 ). Understanding the complex interplay of factors contributing to OP is crucial for developing effective diagnostic, preventive, and treatment strategies ( 15 , 16 ). As the global population ages, the need for accurate, accessible, and non-invasive screening tools becomes increasingly urgent. Artificial intelligence (AI) and machine learning (ML) have emerged as promising tools in addressing this urgent need, offering potential solutions for early detection and risk assessment of osteoporosis. Recent studies have explored various AI-driven approaches, including deep learning algorithms for analyzing bone densitometry images ( 17 ), convolutional neural networks for interpreting radiographs, and ensemble learning methods for integrating multiple risk factors ( 18 – 20 ). These AI tools have shown promising results in improving the accuracy of fracture risk prediction and osteoporosis diagnosis. For instance, some researchers have developed ML models that can predict BMD from routine CT scans, potentially reducing the need for specialized DXA scans ( 21 ). Others have utilized natural language processing to extract relevant information from electronic health records, enhancing the identification of high-risk individuals ( 22 ). Additionally, AI-powered clinical decision support systems have been proposed to assist healthcare providers in making more informed treatment decisions based on individual patient data and established clinical guidelines ( 15 ). As these technologies continue to evolve, they hold the potential to revolutionize osteoporosis screening and management, enabling more personalized and proactive approaches to bone health. Purpose This study aims to explore the potential of machine learning techniques in identifying key biochemical and clinical markers associated with OP, potentially leading to improved early detection and intervention strategies. Methods The data used in this study was from the “Bone mineral density” dataset ( 23 ) obtained from the Harvard Dataverse platform, developed by the Institute for Quantitative Social Science (IQSS) at Harvard University. The dataset comprises comprehensive clinical information, dual-energy X-ray absorptiometry (DXA) measurements, and various variables crucial for studying bone health, OP, and fracture risk. Variables were categorized into three main groups ( Table 1 ): Demographics & Analytics: Personal characteristics and medical biomarkers. Bone Loss Prevention Treatments: Interventions aimed at maintaining bone health. Lifestyle/Associated Pathologies: Factors and conditions potentially correlated with OP ( Figure 1 ). View this table: View inline View popup Table 1. Organization into database groups Bone mineral density . Download figure Open in new tab Figure 1. Comparison of pathologies between the Osteoporosis (OP) and Control groups VT: venous thrombosis; RV: vitamin D deficiency; DKA: coronary artery disease; CKD: chronic kidney disease; COPD: chronic obstructive pulmonary disease; DM: diabetes mellitus; HTN: hypertension; AS: ankylosing spondylitis. 1. Defining the Target Variable Due to the absence of metadata defining OP in the original dataset, we created a Boolean variable “OP” ( Figure 2 ). This variable was set to True if a participant met any of the following criteria: Download figure Open in new tab Figure 2. Violin plot comparing T-score values between individuals with osteoporosis (OP) and a control group across three key skeletal regions: the thoracolumbar region (TLT), femoral neck (FNT), and lumbar vertebrae L1 to L4 (L1-4T) The plot’s shape illustrates the distribution of T-score differences, with wider sections indicating higher frequency of data points at those values. TLT in the control group averaged −0.64 (SD 0.97), while in the OP group it was −1.82 (SD 1.22). FNT showed −1.02 (SD 0.93) for controls and −2.17 (SD 1.17) for the OP group. L1-4T averaged −0.27 (SD 1.36) in controls and −1.40 (SD 1.68) in the OP group. These statistics, visualized through the violin plot, highlight the consistently lower bone density and greater variability in T-scores among osteoporosis patients across all measured skeletal regions. T-score ≤ −2.5 in at least one of the tested locations: femoral neck (TNF), thoracolumbar region (TLT), or L1-L4 (L1.4T). History of fractures, this definition aligns with established guidelines ( 2 ). 2. Data pre-processing 2.1. Missing data filling and Data normalization Imputation Missing values were imputed using the mean of each variable. For certain analyses, data were normalized to a 0-1 scale to standardize values across variables, facilitating comparisons. This process transforms the minimum value to 0 and the maximum to 1, with intermediate values adjusted proportionally. 2.2. Statistical Analysis with Welch’s T-Test Welch’s t-test was employed to compare means between the OP and control groups for each variable. This test is suitable for samples with potentially unequal variances or sizes. Two-tailed P-values were calculated, with P < 0.05 considered statistically significant. The analysis was performed on the entire sample and separately for men and women to identify gender-specific differences ( Table 2 ). View this table: View inline View popup Download powerpoint Table 2. Results of the coefficients and p-values of the multiple linear regression analysis. p<0.05;**p<0.001 Coef.: Coefficient. 3. Correlation analysis A correlation matrix was generated and visualized as a heatmap to explore relationships between variables, with a focus on their associations with OP and BMD. This analysis intended to establish patterns and identify key correlations among the dataset parameters (supplementary material Figure 5). 4. Comparison Between Groups and Control of Covariates To investigate the relationship between OP (represented by the independent variable OP) and various biochemical variables (dependent variables), while accounting for covariates such as age, height, and weight, we performed multiple linear regression analyses. This approach allowed us to control for the effects of covariates and understand how their variances affect the generated models. We selected the following dependent variables for analysis: alanine aminotransferase (ALT), aspartate aminotransferase (AST), blood urea nitrogen (BUN), blood creatinine (CREA), uric acid (URIC), fasting blood glucose (FBG), high-density cholesterol (HDL-C), low-density cholesterol (LDL-C), serum levels of calcium (Ca), phosphorus (P), and magnesium (Mg). The independent variable was OP, with age, height, and weight as covariates. This method enabled us to apply a T-test and determine whether the coefficients significantly impact the prediction of each dependent variable. We applied this analysis to the total sample, as well as separately female and male groups, to identify any gender-specific differences. 5. Prevalence of OP in Different Pathological Conditions Recognizing that secondary OP can occur in relation to other pathologies and lifestyle factors, we analyzed the prevalence of OP among subjects with various comorbidities. We organized the incidence of OP in relation to the presence of diseases or lifestyles considered to be risk factors in both the OP and control groups ( Figure 1 ). 6. Unsupervised Learning Analytics We employed unsupervised machine learning techniques to identify natural patterns in the data, particularly focusing on variables correlated with the T-score associated with OP. The Louvain Clustering method was chosen for this analysis. First, we normalized the data and applied Principal Component Analysis (PCA) to reduce dimensionality. PCA identifies the directions of maximum variance, reducing redundancy and noise in the data. This allowed us to select the main components for the elaboration of the RadViz multivariate data visualization algorithm. We then created a visual representation of connections between objects using k-nearest neighbors (KNN) with Euclidean distance metric and 17 neighbors. The Louvain community detection algorithm was applied to this graph to optimize modularity and find highly interconnected node communities into clusters based on their natural similarities. 7. Development of a Predictive OP Model through Supervised Learning For our supervised learning approach, we developed a predictive model for OP. To ensure model efficiency and avoid redundancy, we excluded variables related to bone density values and potential treatments (calcium, calcitriol, and bisphosphonates). We divided the data into a training set (75% of the data) and a test set (25%). We then tested eight different classification algorithms to determine which would perform best in predicting the True classes of OP: Gradient Boosting, Random Forest, Decision Tree, Logistic Regression, AdaBoost, Neural Network, Support Vector Machine (SVM), Naive Bayes. To evaluate the results of the developed models, we used the following metrics: Area under the ROC curve (AUC), Classification Accuracy (CA), F1 score (precision-weighted harmonic mean and recall), Precision (proportion of true positives among instances classified as positive), Recall (ratio of true positives among all positive instances) and Matthews Correlation Coefficient (MCC). Finally, we identified the importance of features that most strongly influenced the results of the chosen algorithm for predicting the diagnosis. 8. Data Analysis Tools We used Orange Data Mining software (version 3.36.2) ( 24 ) for all data analyses. The specific plugins employed include Orange Data Table: For importing, cleaning, and preparing the raw data, Louvain Clustering: For unsupervised learning analysis, Correlations and Heat Map: For correlation analysis and visualization, Modeling Plugins: For implementing supervised learning algorithms, Test and Score: For evaluating algorithmic performance on test data. Feature Importance: For analyzing variable influence on model accuracy Results 1. Pathologies, lifestyle and osteoporosis The prevalence of OP in relation to various pathologies and lifestyle factors within our study population is present in Figure 1 . Among the variables examined, venous thrombosis showed the highest co-occurrence with OP, with 55.17% of individuals with this condition. Vitamin D deficiency was the second most prevalent condition, with 47.32% followed by coronary artery disease with 35.37%, while OP cases were observed in chronic kidney disease and chronic obstructive pulmonary disease patients in 34.84% and 34.39%, respectively the distribution of T-scores in relation to control and OP groups. A Violin Plot was constructed to visualize this distribution of the density curves of the T-scores for L1-4T, TNF, TLT regions, allowing for a comparison of data distribution between the OP and non-OP groups ( Figure 2 ). 2. Biochemical Data Results To analyze the biochemical parameters and their behaviors between OP and control groups, we used Welch’s t-test and multiple linear regression to assess the impact of covariates. Significant differences were found for ALT, were the OP group showed mean value of 22.86 with a standard deviation (SD) of 13.91, compared to 23.77 (SD = 17.41) in the control group. Significant differences were also found in BUN OP averaging 5.52 (SD = 1.85) and the control group at 5.65 (SD = 3.67). In CREAT with a mean of 74.49 (SD = 26.69) in OP versus 73.81 (SD = 25.36) for the controls. Notably, LDL-C levels average 2.53 (SD = 0.91) against the control’s 2.62 (SD = 0.89). Magnesium (Mg) presented the most notable variation, with the OP group averaging lower at 0.83 (SD = 0.11) compared to 0.88 (SD = 0.09) in the control group ( Figure 3 ). Download figure Open in new tab Figure 3. Mean concentration values of significant biomarkers A, B, C: Alanine aminotransferase (ALT) values. For the Total and Female groups, significant differences were found for *p<0.05. D, E, F: Aspartate aminotransferase (AST) values. For the male group, significant differences were found for *p<0.05. G, H, I: Nitrogen urea (BUN) values. For the Total groups, significant differences were found for *p<0.05. J, K, L: Low-density lipoprotein (LDL-C) values. For the Total and Female groups, significant differences were found for **p<0.001. M, N, O: Serum calcium (Ca) values. For the female group, significant differences were found for *p<0.05. P, Q, R: Serum magnesium (Mg) values. For all groups – Total, Female and Male – significant differences were found for **p<0.001. The coefficients for age across all biomarkers were relatively small and did not indicate significant associations. The height and weight coefficients were not significant for most biomarkers, except for Mg, where both height and weight had significant positive influences. The significant relationships between OP and the biomarkers ALT, BUN, CREAT, and LDL-C remained robust even after controlling for age, height, and weight, indicating that the associations of these biomarkers with OP are independent of these potential confounding variables. However, for Mg, the significant positive influences of height and weight suggest that its association with OP is influenced by these covariates (supplementary material, Table 3). 3. Correlation of variables Correlation analysis (supplementary material Figure 5), illustrates the correlations between various variables, emphasizing their associations with bone parameters. OP was inversely correlated with bone mineral density (BMD) and T-score. Treatments such as calcium, calcitriol, bisphosphonates, and calcitonin also show inverse correlations with BMD and T-scores of the femoral neck and thoracolumbar regions. These findings are consistent with our expectations, given the associations of these variables with bone health. Mg exhibited significant correlations: a strong negative correlation with OP and direct correlations with BMD and T-scores of the lumbar region, indicating its potential as an evaluation parameter. Additionally, a subtle positive association was observed between alanine aminotransferase (ALT) and aspartate aminotransferase (AST) with bone health; ALT correlates with the femoral neck, femoral neck T-score, thoracolumbar region, and thoracolumbar T-score. Conversely, uric acid (URIC) and high-density lipoprotein cholesterol (HDL-C) displayed opposite behaviors. URIC showed positive correlations with bone health parameters, particularly the femoral neck and thoracolumbar region, while HDL-C was inversely correlated with bone components. 4. Analysis of unsupervised learning outcomes Louvain clustering identified four clusters from the data, as visualized in the Radviz plot in (supplementary material Figure 6). This analysis aimed to explore variable behaviors based on similarities, without targeted algorithmic interventions. Cluster 1 (C1) includes OP, HDL-C, LDL-C, BUN, TLT, FNT, L1-4T, TL, FN, P, Mg, and Gender. Cluster 2 (C2) comprises BMI, Age, Weight, URIC, CREAT, Height, AST, and ALT. Cluster 3 (C3) contains L1-4, while Cluster 4 (C4) consists of FBG. The inclusion of OP in C1 is particularly significant, revealing a hidden pattern among these variables. To ensure unbiased clustering of biochemical parameters, data on diseases or treatments were excluded. 5. Analysis of the different supervised learning models Among the tested algorithms (supplementary material, Table 4), Gradient Boosting yielded the highest accuracy, closely followed by Random Forest. Both demonstrated strong performance in correctly identifying OP diagnoses, while other algorithms showed decreasing predictive accuracy, with Naive Bayes performing poorest. Confusion matrices (supplementary material Figure 7) for Gradient Boosting and Random Forest models, based on the 25% test data, revealed their respective performances: Gradient Boosting: 328 correct diagnoses (39 true positives for OP), 56 misclassifications (50 false negatives, 6 false positives). Random Forest: More false positives ( 14 ) but fewer false negatives (47), Higher true positives ( 42 ) compared to Gradient Boosting Due to Random Forest’s superior ability to identify OP, it was led to its selected as the preferred predictive model. Feature importance analysis ( Figure 4 ) highlighted the most influential characteristics for the Random Forest model, which were Mg, COPD, history of fractures, height, and CAD. Download figure Open in new tab Figure 4. Feature Importance in the Random Forest Model Figure illustrates the relative importance of various features in the Random Forest model for predicting osteoporosis (OP) diagnoses. The analysis identifies Magnesium (Mg), Chronic Obstructive Pulmonary Disease (COPD), history of fractures, height, and Coronary Artery Disease (CAD) as the most influential variables. These features significantly contribute to the model’s predictive accuracy, highlighting their critical roles in the assessment and diagnosis of osteoporosis. Conclusion Our study aimed to identify key biochemical and clinical markers associated with OP using machine learning techniques. The results highlight several important findings and areas for further investigation. Magnesium emerged as a significant predictor of bone health, showing strong correlations with BMD and OP. This aligns with previous research indicating magnesium’s crucial role in bone development and matrix formation ( 25 , 26 ). The highly significant values found between Mg and OP, along with the exceptionally strong correlation between Mg and especially L1-4 BMD, warrant further in-depth analysis. Despite the need for additional research, Mg demonstrates robust potential as a predictor of BMD. However, it is critical to note that in our multiple linear regression analysis, the significance of magnesium’s association with OP was influenced by covariates such as age, height, and weight. These factors contribute to bone health and could potentially confound the direct impact of Mg. Age, in particular, is a well-known determinant of bone density changes ( 27 – 29 ), while height ( 30 , 31 ) and weight ( 32 , 33 ) influence biomechanical stress on the skeleton ( 34 – 36 ), affecting bone remodeling processes. The interplay of these covariates suggests that while Mg remains an important factor, its independent predictive power for bone health might be overestimated if these variables are not adequately controlled. Furthermore, the clinical diagnosis of Mg deficiency remains challenging, as serum levels may not accurately reflect total body Mg status ( 37 ). This underscores the importance of developing more accurate methods to assess Mg levels in the context of bone health evaluation. Therefore, while magnesium’s role in bone health is significant( 38 ), its assessment and the influence of other physiological factors must be carefully considered in both clinical and research settings to fully understand its impact. Lipid profiles, particularly HDL-C and LDL-C, demonstrated noteworthy associations with bone health. Low HDL-C levels have been linked to impaired osteoblast differentiation and function ( 39 ) high LDL-C levels may promote osteoclastogenesis ( 40 ). These findings suggest a potential connection between lipid metabolism and bone health, which warrants further investigation. Liver enzymes, especially ALT, showed relevance in our predictive model. This association may be explained by the link between chronic liver diseases and OP, known as hepatic osteodystrophy ( 41 ). However, the specific mechanisms underlying this relationship require further elucidation. Uric acid demonstrated a positive correlation with bone health parameters, supporting previous findings of its potential protective effect on BMD in the elderly ( 42 ). However, the relationship between uric acid and bone health appears complex and may be influenced by gender and age. The prevalence of OP in individuals with comorbidities such as chronic obstructive pulmonary disease (COPD) and chronic kidney disease (CKD) aligns with existing literature. These conditions share risk factors with OP and may involve treatments that affect bone metabolism ( 43 , 44 ). This study demonstrates the potential of machine learning techniques in identifying key biochemical and clinical markers associated with OP. Magnesium, lipid profiles, liver enzymes, and uric acid emerged as significant predictors, alongside established risk factors such as age and comorbidities. While our findings provide valuable insights, several limitations must be acknowledged. The cross-sectional nature of the data limits causal inferences, and the generalizability of the results to diverse populations requires further investigation. Additionally, the predictive model, while promising, needs further refinement to improve its accuracy and clinical utility. Future research should focus on longitudinal studies to establish causal relationships between identified markers and OP development. Refinement of machine learning models to enhance predictive accuracy and reduce false negatives. Validation of findings in diverse populations to ensure broad applicability. This study provides a foundation for developing more comprehensive and accurate screening tools for OP. By integrating biochemical markers with clinical risk factors, we may improve early detection and intervention strategies, ultimately reducing the burden of OP-related fractures and improving patient outcomes. Data Availability All data produced in the present work are contained in the manuscript Conflict of interest The authors declare that they have no conflict of interest. This statement applies to Filipe Ricardo Carvalho, Virna Ferreira Queiroz and Paulo Jorge Gavaia. Acknowledgements This study received Portuguese national funds from FCT - Foundation for Science and Technology through projects UIDB/04326/2020 (DOI:10.54499/UIDB/04326/2020), UIDP/04326/2020 (DOI:10.54499/UIDP/04326/2020) and LA/P/0101/2020 (DOI:10.54499/LA/P/0101/2020). References 1. ↵ Kanis JA , McCloskey E V. , Johansson H , Cooper C , Rizzoli R , Reginster JY . European guidance for the diagnosis and management of osteoporosis in postmenopausal women . Osteoporosis International . 2013 ; 24 ( 1 ). 2. ↵ Kanis JA , McCloskey E V , Johansson H , Oden A , Melton LJ , Khaltaev N. A reference standard for the description of osteoporosis . Bone [Internet] . 2008 ; 42 ( 3 ): 467 – 75 . Available from : doi: 10.1016/j.bone.2007.11.001 OpenUrl CrossRef PubMed Web of Science 3. ↵ Pimentel A , Ureña-Torres P , Bover J , Luis Fernandez-Martín J , Cohen-Solal M. Bone Fragility Fractures in CKD Patients . Vol. 108 , Calcified Tissue International . 2021 . 4. ↵ Pouresmaeili F , Kamalidehghan B , Kamarehei M , Goh YM . A comprehensive overview on osteoporosis and its risk factors . Ther Clin Risk Manag [Internet] . 2018 Nov 6; 14 : 2029 – 49 . Available from: https://pubmed.ncbi.nlm.nih.gov/30464484 OpenUrl 5. ↵ Patsch JM , Burghardt AJ , Yap SP , Baum T , Schwartz A V , Joseph GB , et al. Increased cortical porosity in type 2 diabetic postmenopausal women with fragility fractures . J Bone Miner Res [Internet] . 2013 Feb [cited 2015 Jul 17]; 28 ( 2 ): 313 – 24 . Available from: http://www.pubmedcentral.nih.gov/articlerender.fcgi?artid=3534818&tool=pmcentrez&rendertype=abstract OpenUrl 6. Matkovic V , Goel P , Mobley SL , Badenhop-Stevens NE , Ha EJ , Li B , et al. Decreased bone mass in adolescents with bone fragility fracture but not in young children: a case–control study . Front Endocrinol (Lausanne) . 2023 ; 14 . 7. ↵ Mitchell JA , Chesi A , Cousminer DL , McCormack SE , Kalkwarf HJ , Lappe JM , et al. Multidimensional Bone Density Phenotyping Reveals New Insights Into Genetic Regulation of the Pediatric Skeleton . Journal of Bone and Mineral Research . 2018 ; 33 ( 5 ). 8. ↵ Sozen T , Ozisik L , Calik Basaran N. An overview and management of osteoporosis . Eur J Rheumatol . 2017 ; 4 ( 1 ). 9. ↵ Lorentzon M , Johansson H , Harvey NC , Liu E , Vandenput L , McCloskey E V. , et al. Osteoporosis and fractures in women: the burden of disease . Vol. 25 , Climacteric . 2022 . 10. ↵ Porter JL , Varacallo M , Castano M. Osteoporosis (Nursing) . StatPearls . 2021 . 11. ↵ Glaser DL , Kaplan FS . Osteoporosis . Spine (Phila Pa 1976) [Internet] . 1997 ; 22 ( Supplement ): 12S – 16S . Available from : doi: 10.1097/00007632-199712151-00003 OpenUrl CrossRef PubMed Web of Science 12. ↵ Cummings SR , Melton LJ . Epidemiology and outcomes of osteoporotic fractures . The Lancet [Internet] . 2002 ; 359 ( 9319 ): 1761 – 7 . Available from : doi: 10.1016/s0140-6736(02)08657-9 OpenUrl CrossRef 13. Lane NE . Epidemiology, etiology, and diagnosis of osteoporosis . Am J Obstet Gynecol [Internet] . 2006 ; 194 ( 2 ): S3 – 11 . Available from : doi: 10.1016/j.ajog.2005.08.047 OpenUrl CrossRef PubMed Web of Science 14. ↵ Briot K , Geusens P , Em Bultink I , Lems WF , Roux C. Inflammatory diseases and bone fragility . Vol. 28 , Osteoporosis International . 2017 . 15. ↵ Kanis JA , McCloskey E V. , Harvey NC , Cooper C , Rizzoli R , Dawson-Hughes B , et al. The need to distinguish intervention thresholds and diagnostic thresholds in the management of osteoporosis . Osteoporosis International . 2023 ; 34 ( 1 ). 16. ↵ Park SY , Kim SH , Lee YK , Shin JH , Ha YC , Chung HY . Position Statement: Postmenopausal Osteoporosis Treatment Strategies in Korea . Vol. 30 , Journal of Bone Metabolism . 2023 . 17. ↵ Tang C , Zhang W , Li H , Li L , Li Z , Cai A , et al. CNN-based qualitative detection of bone mineral density via diagnostic CT slices for osteoporosis screening . Osteoporosis International . 2021 ; 32 ( 5 ). 18. ↵ Yang J , Liao M , Wang Y , Chen L , He L , Ji Y , et al. Opportunistic osteoporosis screening using chest CT with artificial intelligence . Osteoporosis International . 2022 ; 33 ( 12 ). 19. Valentinitsch A , Trebeschi S , Kaesmacher J , Lorenz C , Löffler MT , Zimmer C , et al. Opportunistic osteoporosis screening in multi-detector CT images via local classification of textures . Osteoporosis International . 2019 ; 30 ( 6 ). 20. ↵ Mookiah MRK , Rohrmeier A , Dieckmeyer M , Mei K , Kopp FK , Noel PB , et al. Feasibility of opportunistic osteoporosis screening in routine contrastenhanced multi detector computed tomography (MDCT) using texture analysis . Osteoporosis International . 2018 ; 29 ( 4 ). 21. ↵ Sollmann N , Löffler MT , El Husseini M , Sekuboyina A , Dieckmeyer M , Rühling S , et al. Automated Opportunistic Osteoporosis Screening in Routine Computed Tomography of the Spine: Comparison With Dedicated Quantitative CT . Journal of Bone and Mineral Research . 2022 ; 37 ( 7 ). 22. ↵ Almog YA , Rai A , Zhang P , Moulaison A , Powell R , Mishra A , et al. Deep Learning with Electronic Health Records for Short-Term Fracture Risk Identification: Crystal Bone Algorithm Development and Validation . J Med Internet Res . 2020 ; 22 ( 10 ). 23. ↵ He L. Harvard Dataverse . 2021 [cited 2024 Jul 17]. Bone mineral density . Available from : doi: 10.7910/DVN/UDZIJS OpenUrl CrossRef 24. ↵ Demšar J , Curk T , Erjavec A , Gorup Č , Hočevar T , Milutinovič M , et al. Orange: Data mining toolbox in python . Journal of Machine Learning Research . 2013 ; 14 . 25. ↵ Abrams SA , Chen Z , Hawthorne KM . Magnesium Metabolism in 4-Year-Old to 8-Year-Old Children . Journal of Bone and Mineral Research [Internet] . 2013 ; 29 ( 1 ): 118 – 22 . Available from : doi: 10.1002/jbmr.2021 OpenUrl CrossRef 26. ↵ Castiglioni S , Cazzaniga A , Albisetti W , Maier JAM . Magnesium and osteoporosis: current state of knowledge and future research directions . Nutrients [Internet] . 2013 Jul 31; 5 ( 8 ): 3022 – 33 . Available from: https://pubmed.ncbi.nlm.nih.gov/23912329 OpenUrl 27. ↵ Eghbali P , Becce F , Goetti P , Vauclair F , Farron A , Büchler P , et al. Age- and sex-specific normative values of bone mineral density in the adult glenoid . Journal of Orthopaedic Research . 2023 ; 41 ( 2 ). 28. Botha D , Lynnerup N , Steyn M. Age estimation using bone mineral density in South Africans . Forensic Sci Int . 2019 ; 297 . 29. ↵ Cho MJ , Moon SH , Lee JH , Lee JH . Association between osteoporotic vertebral compression fractures and age, bone mineral density, and european quality of life-5 dimensions in korean postmenopausal women: A nationwide cross-sectional observational study . CiOS Clinics in Orthopedic Surgery . 2021 ; 13 ( 2 ). 30. ↵ Moayyeri A , Ahmadi-Abhari S , Hossein-Nezhad A , Larijani B , Soltani A. Bone mineral density and estimated height loss based on patients’ recalls . Osteoporosis International . 2006 ; 17 ( 6 ). 31. ↵ Yu C , Wang S , Meng X , Li W , Deng Y , Li N , et al. The impact of height on low/reduced bone mineral density in Chinese adolescents aged 12-14 years old: gender differences . Arch Osteoporos . 2019 ; 14 ( 1 ). 32. ↵ Wang X , Yang S , He G , Xie L. The association between weight-adjusted-waist index and total bone mineral density in adolescents: NHANES 2011–2018 . Front Endocrinol (Lausanne) . 2023 ; 14 . 33. ↵ Zhang Y , Wu H , Li C , Liu C , Liu M , Liu X , et al. Associations between weight-adjusted waist index and bone mineral density: results of a nationwide survey . BMC Endocr Disord . 2023 ; 23 ( 1 ). 34. ↵ Recnik G , Kralj-Iglič V , Iglič A , Antolič V , Kramberger S , Rigler I , et al. The role of obesity, biomechanical constitution of the pelvis and contact joint stress in progression of hip osteoarthritis . Osteoarthritis Cartilage . 2009 ; 17 ( 7 ). 35. Issa RitaI , Griffin Timothy M . Pathobiology of obesity and osteoarthritis: integrating biomechanics and inflammation . Pathobiology of Aging & Age-related Diseases . 2012 ; 2 ( 1 ). 36. ↵ Zhao G , Wang H , Wang L , Ibrahim Y , Wan Y , Sun J , et al. The Biomechanical Effects of Different Bag-Carrying Styles on Lumbar Spine and Paraspinal Muscles: A Combined Musculoskeletal and Finite Element Study . Orthop Surg . 2023 ; 15 ( 1 ). 37. ↵ Razzaque MS . Magnesium: Are We Consuming Enough? Nutrients [Internet] . 2018 Dec 2; 10 ( 12 ): 1863 . Available from: https://pubmed.ncbi.nlm.nih.gov/30513803 OpenUrl 38. ↵ Groenendijk I , van Delft M , Versloot P , van Loon LJC , de Groot LCPGM. Impact of magnesium on bone health in older adults: A systematic review and meta-analysis . Bone . 2022 ; 154 . 39. ↵ Papachristou NI , Blair HC , Kypreos KE , Papachristou DJ . High-density lipoprotein (HDL) metabolism and bone mass . J Endocrinol [Internet]. 2017/03/17 . 2017 May ; 233 ( 2 ): R95 – 107 . Available from: https://pubmed.ncbi.nlm.nih.gov/28314771 OpenUrl 40. ↵ Xie R , Huang X , Zhang Y , Liu Q , Liu M. High Low-Density Lipoprotein Cholesterol Levels are Associated with Osteoporosis Among Adults 20-59 Years of Age . Int J Gen Med [Internet] . 2022 Feb 28; 15 : 2261 – 70 . Available from: https://pubmed.ncbi.nlm.nih.gov/35250302 OpenUrl 41. ↵ Yadav A , Carey EJ . Osteoporosis in Chronic Liver Disease . Nutrition in Clinical Practice [Internet] . 2012 ; 28 ( 1 ): 52 – 64 . Available from : doi: 10.1177/0884533612470145 OpenUrl CrossRef PubMed 42. ↵ Nabipour I , Sambrook PN , Blyth FM , Janu MR , Waite LM , Naganathan V , et al. Serum uric acid is associated with bone health in older men: A cross-sectional population-based study . Journal of Bone and Mineral Research [Internet] . 2010 ; 26 ( 5 ): 955 – 64 . Available from : doi: 10.1002/jbmr.286 OpenUrl CrossRef 43. ↵ Bolster MB . Osteoporosis and Bone Health in Patients with Lung Disease . Clin Chest Med [Internet] . 2010 ; 31 ( 3 ): 555 – 63 . Available from : doi: 10.1016/j.ccm.2010.04.006 OpenUrl CrossRef 44. ↵ Ebeling PR , Nguyen HH , Aleksova J , Vincent AJ , Wong P , Milat F. Secondary Osteoporosis . Endocr Rev [Internet] . 2021 ; 43 ( 2 ): 240 – 313 . Available from : doi: 10.1210/endrev/bnab028 OpenUrl CrossRef View the discussion thread. Back to top Previous Next Posted May 31, 2025. Download PDF Data/Code Email Thank you for your interest in spreading the word about medRxiv. NOTE: Your email address is requested solely to identify you as the sender of this article. Your Email * Your Name * Send To * Enter multiple addresses on separate lines or separate them with commas. You are going to email the following Exploring Novel Biomarkers for Early Detection of Osteoporosis Message Subject (Your Name) has forwarded a page to you from medRxiv Message Body (Your Name) thought you would like to see this page from the medRxiv website. Your Personal Message CAPTCHA This question is for testing whether or not you are a human visitor and to prevent automated spam submissions. Share Exploring Novel Biomarkers for Early Detection of Osteoporosis Filipe Ricardo Carvalho , Virna Ferreira Queiroz , Paulo Jorge Gavaia medRxiv 2025.05.30.25328641; doi: https://doi.org/10.1101/2025.05.30.25328641 Share This Article: Copy Citation Tools Exploring Novel Biomarkers for Early Detection of Osteoporosis Filipe Ricardo Carvalho , Virna Ferreira Queiroz , Paulo Jorge Gavaia medRxiv 2025.05.30.25328641; doi: https://doi.org/10.1101/2025.05.30.25328641 Citation Manager Formats BibTeX Bookends EasyBib EndNote (tagged) EndNote 8 (xml) Medlars Mendeley Papers RefWorks Tagged Ref Manager RIS Zotero Tweet Widget Facebook Like Google Plus One Subject Area Health Informatics Subject Areas All Articles Addiction Medicine (568) Allergy and Immunology (863) Anesthesia (300) Cardiovascular Medicine (4435) Dentistry and Oral Medicine (444) Dermatology (382) Emergency Medicine (608) Endocrinology (including Diabetes Mellitus and Metabolic Disease) (1509) Epidemiology (15229) Forensic Medicine (30) Gastroenterology (1124) Genetic and Genomic Medicine (6600) Geriatric Medicine (668) Health Economics (997) Health Informatics (4536) Health Policy (1368) Health Systems and Quality Improvement (1613) Hematology (541) HIV/AIDS (1264) Infectious Diseases (except HIV/AIDS) (15916) Intensive Care and Critical Care Medicine (1103) Medical Education (623) Medical Ethics (146) Nephrology (667) Neurology (6599) Nursing (346) Nutrition (998) Obstetrics and Gynecology (1144) Occupational and Environmental Health (957) Oncology (3332) Ophthalmology (974) Orthopedics (369) Otolaryngology (420) Pain Medicine (436) Palliative Medicine (130) Pathology (663) Pediatrics (1693) Pharmacology and Therapeutics (691) Primary Care Research (711) Psychiatry and Clinical Psychology (5447) Public and Global Health (9232) Radiology and Imaging (2198) Rehabilitation Medicine and Physical Therapy (1370) Respiratory Medicine (1196) Rheumatology (593) Sexual and Reproductive Health (712) Sports Medicine (530) Surgery (712) Toxicology (99) Transplantation (289) Urology (265) (function(){function c(){var b=a.contentDocument||a.contentWindow.document;if(b){var d=b.createElement('script');d.innerHTML="window.__CF$cv$params={r:'a00cb1381ff658f4',t:'MTc3OTYyOTgxNw=='};var a=document.createElement('script');a.src='/cdn-cgi/challenge-platform/scripts/jsd/main.js';document.getElementsByTagName('head')[0].appendChild(a);";b.getElementsByTagName('head')[0].appendChild(d)}}if(document.body){var a=document.createElement('iframe');a.height=1;a.width=1;a.style.position='absolute';a.style.top=0;a.style.left=0;a.style.border='none';a.style.visibility='hidden';document.body.appendChild(a);if('loading'!==document.readyState)c();else if(window.addEventListener)document.addEventListener('DOMContentLoaded',c);else{var e=document.onreadystatechange||function(){};document.onreadystatechange=function(b){e(b);'loading'!==document.readyState&&(document.onreadystatechange=e,c())}}}})();
Text is read by the "Ask this paper" AI Q&A widget below.
Extraction quality varies by source — PMC NXML preserves structure
cleanly, OA-HTML may include some navigation residue, and OA-PDF can
have broken hyphenation. The publisher copy
(via DOI)
is the canonical version.