Full text
47,506 characters
· extracted from
preprint-html
· click to expand
Routine Blood Tests as Predictors of Periodontal Disease Risk Using a Machine Learning Approach | medRxiv /* */ /* */ <!-- <!-- /*! * yepnope1.5.4 * (c) WTFPL, GPLv2 */ (function(a,b,c){function d(a){return"[object Function]"==o.call(a)}function e(a){return"string"==typeof a}function f(){}function g(a){return!a||"loaded"==a||"complete"==a||"uninitialized"==a}function h(){var a=p.shift();q=1,a?a.t?m(function(){("c"==a.t?B.injectCss:B.injectJs)(a.s,0,a.a,a.x,a.e,1)},0):(a(),h()):q=0}function i(a,c,d,e,f,i,j){function k(b){if(!o&&g(l.readyState)&&(u.r=o=1,!q&&h(),l.onload=l.onreadystatechange=null,b)){"img"!=a&&m(function(){t.removeChild(l)},50);for(var d in y[c])y[c].hasOwnProperty(d)&&y[c][d].onload()}}var j=j||B.errorTimeout,l=b.createElement(a),o=0,r=0,u={t:d,s:c,e:f,a:i,x:j};1===y[c]&&(r=1,y[c]=[]),"object"==a?l.data=c:(l.src=c,l.type=a),l.width=l.height="0",l.onerror=l.onload=l.onreadystatechange=function(){k.call(this,r)},p.splice(e,0,u),"img"!=a&&(r||2===y[c]?(t.insertBefore(l,s?null:n),m(k,j)):y[c].push(l))}function j(a,b,c,d,f){return q=0,b=b||"j",e(a)?i("c"==b?v:u,a,b,this.i++,c,d,f):(p.splice(this.i++,0,a),1==p.length&&h()),this}function k(){var a=B;return a.loader={load:j,i:0},a}var l=b.documentElement,m=a.setTimeout,n=b.getElementsByTagName("script")[0],o={}.toString,p=[],q=0,r="MozAppearance"in l.style,s=r&&!!b.createRange().compareNode,t=s?l:n.parentNode,l=a.opera&&"[object Opera]"==o.call(a.opera),l=!!b.attachEvent&&!l,u=r?"object":l?"script":"img",v=l?"script":u,w=Array.isArray||function(a){return"[object Array]"==o.call(a)},x=[],y={},z={timeout:function(a,b){return b.length&&(a.timeout=b[0]),a}},A,B;B=function(a){function b(a){var a=a.split("!"),b=x.length,c=a.pop(),d=a.length,c={url:c,origUrl:c,prefixes:a},e,f,g;for(f=0;f<d;f++)g=a[f].split("="),(e=z[g.shift()])&&(c=e(c,g));for(f=0;f<b;f++)c=x[f](c);return c}function g(a,e,f,g,h){var i=b(a),j=i.autoCallback;i.url.split(".").pop().split("?").shift(),i.bypass||(e&&(e=d(e)?e:e[a]||e[g]||e[a.split("/").pop().split("?")[0]]),i.instead?i.instead(a,e,f,g,h):(y[i.url]?i.noexec=!0:y[i.url]=1,f.load(i.url,i.forceCSS||!i.forceJS&&"css"==i.url.split(".").pop().split("?").shift()?"c":c,i.noexec,i.attrs,i.timeout),(d(e)||d(j))&&f.load(function(){k(),e&&e(i.origUrl,h,g),j&&j(i.origUrl,h,g),y[i.url]=2})))}function h(a,b){function c(a,c){if(a){if(e(a))c||(j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}),g(a,j,b,0,h);else if(Object(a)===a)for(n in m=function(){var b=0,c;for(c in a)a.hasOwnProperty(c)&&b++;return b}(),a)a.hasOwnProperty(n)&&(!c&&!--m&&(d(j)?j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}:j[n]=function(a){return function(){var b=[].slice.call(arguments);a&&a.apply(this,b),l()}}(k[n])),g(a[n],j,b,n,h))}else!c&&l()}var h=!!a.test,i=a.load||a.both,j=a.callback||f,k=j,l=a.complete||f,m,n;c(h?a.yep:a.nope,!!i),i&&c(i)}var i,j,l=this.yepnope.loader;if(e(a))g(a,0,l,0);else if(w(a))for(i=0;i (function(w,d,s,l,i){w[l]=w[l]||[];w[l].push({'gtm.start':new Date().getTime(),event:'gtm.js'});var f=d.getElementsByTagName(s)[0];var j=d.createElement(s);var dl=l!='dataLayer'?'&l='+l:'';j.src='//www.googletagmanager.com/gtm.js?id='+i+dl;j.type='text/javascript';j.async=true;f.parentNode.insertBefore(j,f);})(window,document,'script','dataLayer','GTM-P4HH5NV'); Skip to main content Home About Submit ALERTS / RSS Search for this keyword Advanced Search Routine Blood Tests as Predictors of Periodontal Disease Risk Using a Machine Learning Approach Bushra Ahmad , Khaled Saleh , Saleh Alharbi , Y. Natalie Jeong , Athanasios Zavras , Hend Alqaderi doi: https://doi.org/10.1101/2024.06.10.24308375 Bushra Ahmad 1 Department of Periodontology, Tufts University School of Dental Medicine , Boston, MA, USA Find this author on Google Scholar Find this author on PubMed Search for this author on this site For correspondence: bushra.ahmad{at}tufts.edu Khaled Saleh 2 Department of Periodontology, Al Amiri Dental Specialty Center , Kuwait City, Kuwait Find this author on Google Scholar Find this author on PubMed Search for this author on this site Saleh Alharbi 3 Department of Periodontology, King Abdulaziz Medical City , Riyadh, Saudi Arabia Find this author on Google Scholar Find this author on PubMed Search for this author on this site Y. Natalie Jeong 1 Department of Periodontology, Tufts University School of Dental Medicine , Boston, MA, USA Find this author on Google Scholar Find this author on PubMed Search for this author on this site Athanasios Zavras 4 Department of Public Health and Community Service, Tufts University School of Dental Medicine , Boston, MA, USA Find this author on Google Scholar Find this author on PubMed Search for this author on this site Hend Alqaderi 4 Department of Public Health and Community Service, Tufts University School of Dental Medicine , Boston, MA, USA Find this author on Google Scholar Find this author on PubMed Search for this author on this site Abstract Full Text Info/History Metrics Data/Code Preview PDF ABSTRACT Background Periodontal disease is a prevalent chronic inflammatory condition associated with systemic health complications. Early identification of high-risk individuals is crucial for targeted preventive and therapeutic interventions. In this study, we aimed to develop and evaluate machine learning models using routine blood tests to predict periodontal disease risk. This will help to develop accessible and cost-effective screening tools for early detection in a non-dental setting. Methods This study utilized data from the 2013-2014 National Health and Nutrition Examination Survey (NHANES), including full-mouth periodontal examinations, demographic variables, and routine blood tests (complete blood count [CBC], lipid profile, liver and kidney function tests). Periodontitis was defined as a binary outcome based on attachment loss and probing depth at interproximal sites. Individuals meeting any of these criteria were classified as having periodontitis. Seven machine learning models were developed and evaluated using precision, recall, and accuracy metrics. Results The Random Forest Classifier achieved the highest performance, scoring 0.91 in precision, recall, and accuracy for predicting periodontitis. Key predictive features included smoking status, age, education level, gamma glutamyl transferase, albumin, blood urea nitrogen, glucose, phosphorus, creatinine, basophil count, and total calcium levels. Conclusion This study underscores the promise of machine learning, especially the Random Forest Classifier, in predicting periodontal disease risk using routine blood tests and demographics. The model accurately identified periodontitis cases, with key features revealing the complex relationship between systemic health and periodontal disease. This suggests the potential for developing machine learning-based screening tools for early periodontal disease detection in non-dental settings. 1 INTRODUCTION Periodontal disease, a chronic inflammatory condition affecting tooth-supporting tissues, is a major public health concern with a global prevalence of 20%-50%.[ 1 ] Severe periodontal disease, characterized by extensive tissue destruction and tooth loss, has been associated with systemic conditions such as diabetes, cardiovascular disease, and adverse pregnancy outcomes.[ 2 , 3 ] Early identification of high-risk individuals is crucial for targeted preventive and therapeutic interventions to reduce disease burden and complications. Routine blood tests, such as CBC and comprehensive metabolic panels are widely accessible and provide valuable information about an individual’s overall health status, including inflammation, nutrition, and organ function.[ 4 ] In recent studies, researchers have explored routine blood tests as potential biomarkers for various diseases, including periodontal disease.[ 5 ] Associations between blood test parameters (e.g., white blood cell count, C-reactive protein, vitamin D levels) and periodontal disease severity have been reported.[ 6 , 7 ] However, most studies have been limited by small sample sizes and focused on a narrow range of blood test parameters. Machine learning, a subset of artificial intelligence, is a powerful tool for analyzing complex medical data and developing predictive models for disease risk assessment.[ 8 ] Machine learning algorithms can identify patterns and relationships in large datasets, enabling the development of accurate and robust predictive models.[ 9 ] In periodontal disease, machine learning approaches have been applied to various data types (e.g., clinical, radiographic, salivary biomarkers) to predict disease progression and treatment outcomes.[ 10 , 11 ] However, the application of machine learning to routine blood test data for predicting periodontal disease risk has not been sufficiently explored. Given the well-established evidence linking systemic conditions, especially metabolic and inflammatory conditions, to the risk of periodontal disease,[ 12 ] it is plausible to hypothesize that certain blood biomarkers may accurately predict the risk of periodontal disease. In this study, we aimed to develop and evaluate machine learning models using routine blood test data from the NHANES adult population to predict periodontal disease risk. By identifying key blood test parameters associated with periodontal disease and assessing the predictive performance of machine learning models, this study contributes to the development of accessible and cost-effective screening tools for early detection in a non-dental setting. The NHANES is a nationally representative survey conducted by the Centers for Disease Control and Prevention (CDC) that collects comprehensive health and nutrition data from the US population.[ 13 ] The NHANES dataset includes demographic, clinical, and laboratory data, making it a valuable resource for investigating associations between routine blood tests and periodontal disease risk in a large, diverse population.[ 13 ] 2 MATERIALS AND METHODS Study Population The 2013-2014 NHANES, a cross-sectional survey and publicly accessible survey, provided the data for this study. We complied with the Data Use Restrictions established by the National Center for Health Statistics, and the CDC. The survey employs a complex, multistage, stratified, and clustered sampling design to represent the non-institutionalized civilian US population. NHANES includes a questionnaire, laboratory assays, and clinical examination measures to assess health outcomes and explanatory variables. The NHANES database indicates that roughly 5,000 individuals, covering a wide age range, participated in at-home interviews and comprehensive health assessments conducted at Mobile Examination Centers. For participants 30 years and older, the survey included full-mouth periodontal examinations performed by pre-calibrated dental professionals within the mobile examination facilities. Periodontal Examination In the NHANES study conducted from 2013 to 2014, participants aged 30 years and older underwent a comprehensive full-mouth periodontal examination (FMPE), excluding those with health conditions requiring antibiotic prophylaxis before periodontal assessment. The primary aim of the FMPE was to obtain gold-standard measurements of clinical attachment loss (AL). To achieve this, two direct measurements were taken at each site: the distance from the cemento-enamel junction to the free gingival margin (CEJ-FGM) and the probing depth (PD). These measurements were collected at six sites (mesiobuccal, midbuccal, distobuccal, mesiolingual, midlingual, and distolingual) on all teeth, except for the third molars. All measurements were rounded down to the nearest whole millimeter. The clinical AL was then determined by calculating the difference between the CEJ-FGM and PD measurements. Periodontitis (Output) In this study, periodontitis was defined as a binary outcome, where individuals were categorized as either having periodontitis or not having periodontitis. The presence of periodontitis was determined by the severity of the condition, which was classified into the three categories of mild, moderate, and severe. Mild periodontitis was defined as having ≥ 2 interproximal sites with a ≥ 3 mm attachment loss (AL) and ≥ 2 interproximal sites with ≥ 4 mm PD, not on the same tooth, or 1 site with ≥ 5 mm PD. Moderate periodontitis was characterized by the presence of two or more interproximal sites with ≥ 4 mm clinical AL, not on the same tooth, or two or more interproximal sites with PD ≥ 5 mm, also not on the same tooth. Severe periodontitis was defined as the presence of two or more interproximal sites with ≥ 6 mm AL, not on the same tooth, and one or more interproximal site(s) with ≥ 5 mm PD. If an individual met the criteria for any of these three categories, they were considered to have periodontitis. Conversely, if an individual did not meet any of the criteria for mild, moderate, or severe periodontitis, they were classified as not having periodontitis. Routine Blood Tests (Inputs) We examined lipid profile (low-density lipoprotein, high-density lipoprotein, triglyceride, and total cholesterol), CBC, and liver and kidney function tests (gamma glutamyl transferase (GGT), creatinine, phosphorus, blood urea nitrogen, creatinine phosphokinase (CPK), alkaline phosphatase, aspartate aminotransferase (AST), and alanine aminotransferase (ALT). Demographics and other Input Variables We classified participants’ smoking status as current smokers if they had smoked at least 100 cigarettes in their lifetime and currently smoked daily or occasionally, and as never smokers if they had never smoked 100 or more cigarettes. Diabetes status was a binary variable (diabetic or non-diabetic) based on participants’ self-reported history of diabetes diagnosis by a health care professional. Participants were divided into four age categories: 30 to 34 years, 35 to 49 years, 50 to 64 years, and 65 years and above. Sex was represented as a binary variable, with participants classified as either male or female. The race variable was categorized into five groups: non-Hispanic White, non-Hispanic Black, Hispanic, non-Hispanic Asian, and others. To represent participants’ financial status, we used the ratio of income to the federal poverty level (FPL), dividing this variable into three categories: less than 138% of the FPL, between 138% and 399% of the FPL, and 400% or more of the FPL. Participants’ education levels were categorized into three groups: those who had not completed high school, those who had graduated from high school or obtained a General Education Development high school equivalency test (GED), and those who had pursued education beyond high school. Finally, participants were classified as "Yes" for "Medical condition" if they reported a diagnosis of arthritis, cancer, or coronary heart disease, and as "No" if they did not report any of these diseases. Statistical Analysis We employed Chi-square tests to compare categorical demographic variables stratified by the presence of periodontal disease. We used T-tests and Mann-Whitney tests to compare the levels of blood biomarkers between subjects with and without periodontal disease, depending on the normality of the data distribution. Machine learning models, including Decision Tree, Tuned Decision Tree, Random Forest, Tuned Random Forest, Adaptive Boosting, Gradient Boosting, and XGBoost Classifiers, were developed and evaluated using precision, recall, and accuracy metrics. The most important predictive features were identified for the best-performing model. Machine Learning For the study, we employed a robust methodology to develop and evaluate machine learning models for predicting periodontal disease. We divided the dataset into a training set (70%) for model development and a test set (30%) for assessing predictive performance. The output variable was a binary variable whether having periodontal disease or not having periodontal disease, and input variables encompassed 14 variables from the routine blood tests, such as lipid profile, CBC, liver and kidney function tests, demographics, and other covariates. We constructed seven models using the Decision Tree, Random Forest Classifier, and XGBoost machine learning algorithms. To address class imbalance in the dataset, we employed a resampling technique by adjusting the ‘class_weight’ hyperparameter in our models. Specifically, we set ‘class_weight’ to {0: 0.5, 1: 0.5}, ensuring that each class was treated with equal importance, thereby mitigating bias towards the majority class. Additionally, we set the ‘random_statè parameter to ‘1’ to ensure reproducibility of the results. For the decision tree models, we utilized GridSearch for hyperparameter tuning to compute the optimum values of hyperparameters. The hyperparameters optimized included the maximum depth of the tree (‘max_depth’), specified in the range of 2 to 7, and the minimum number of samples required at a leaf node (‘min_samples_leaf’), with values of 5, 10, 20, and 25. A split point at any depth was only considered if it left at least ‘min_samples_leaf’ training samples in each of the left and right branches. Additionally, we tuned the criterion used to measure the quality of a split, selecting either "gini" for the Gini impurity or "entropy" for information gain. For the Random Forest Classifier, a bagging algorithm was used with decision trees as the base models. Samples were taken from the training data, and each sample’s prediction was made by a decision tree. The final prediction was determined by combining the results from all the decision trees through voting. The hyperparameters tuned for the Random Forest Classifier included the number of trees in the forest (‘n_estimators’), the minimum number of samples required to split an internal node (‘min_samples_split’), with values of 1, 2, 5, and 10, the minimum number of samples required at a leaf node (‘min_samples_leaf’), with values of 1, 4, and 10, and the number of features to consider when looking for the best split (‘max_features’), with values of 0.5 and ‘auto’. We employed XGBoost (Extreme Gradient Boosting), a tree-based ensemble machine learning technique, for model building. Hyperparameter tuning for boosting included algorithms such as Adaboost, Gradient Boosting, and XGBoost. This involved optimizing parameters to enhance model performance and ensure robust predictive capabilities. The model performance was evaluated using recall, precision, and accuracy. These metrics were calculated from the confusion matrix. Recall measures the model’s ability to correctly identify positive instances, precision measures the accuracy of the positive predictions made, and accuracy provides the overall correctness of the model. To identify the most influential features in predicting periodontal disease, we conducted a feature importance analysis on the best-performing model. We used Stata 17 for descriptive analysis and employed Python for machine learning analysis. 3 RESULTS Table 1 presents the descriptive characteristics of the study population, stratified by periodontitis status. Significant differences were observed between the two groups in terms of various demographic and health-related factors. Participants with periodontitis were more likely to be current smokers, male, older, and of Hispanic or Black race/ethnicity than those without periodontitis. They also tended to have lower educational attainment and lower income levels. Additionally, diabetes was more prevalent among participants with periodontitis. However, no significant difference was found between the two groups in terms of the presence of any medical condition. View this table: View inline View popup TABLE 1: Descriptive summary of the population characteristics with and without periodontitis. Table 2 summarizes the levels of various blood biomarkers in patients with and without periodontitis. Patients with periodontitis exhibited significantly higher levels of glucose, creatinine, gamma glutamyl transferase, and basophil number compared to those without periodontitis. In contrast, albumin and phosphorus levels were significantly lower in the periodontitis group. No significant differences were observed in blood urea nitrogen and total calcium levels between the two groups. View this table: View inline View popup Download powerpoint TABLE 2: Descriptive summary of blood biomarkers in patients with and without periodontitis. Table 3 compares the performance of various machine learning models in predicting periodontitis. The Random Forest Classifier demonstrated the highest performance across all three metrics, scoring 0.91 across precision, recall, and accuracy. Conversely, the Tuned Decision Tree Classifier scored the last with 0.80 across the board. View this table: View inline View popup Download powerpoint TABLE 3: Comparison of the performance of various machine learning models in predicting periodontitis. Figure 1 shows the confusion matrix for the best-performing model which details the true positives (91%), false negatives (9%), false positives (10%), and true negatives (90%) produced by the model. Download figure Open in new tab FIGURE 1: Confusion matrix of the Random Forest Classifier model for predicting periodontitis. Figure 2 demonstrates the most important features that predict periodontitis. The features included demographic factors such as education level, age, sex, and income. Smoking, CBC tests, and liver and kidney function tests were also included. Download figure Open in new tab FIGURE 2: Feature importance ranking for periodontitis prediction model. 4 DISCUSSION We evaluated seven machine learning models using routine blood test data from a representative sample of the US adult population to predict the risk of periodontal disease. All models demonstrated high accuracy, precision, and recall, ranging from 80% to 91%. The Random Forest Classifier achieved the highest performance, with precision, recall, and accuracy of 0.91. These results indicate that routine blood test measurements combined with demographic factors can accurately predict periodontal disease risk. Smoking status emerged as the strongest predictive feature in our study, with current smokers being at higher risk for periodontitis compared to non-smokers. This finding is consistent with the well-established evidence that smoking is a major risk factor for periodontal disease.[ 14 ] Smoking has been shown to impair the immune response, alter the oral microbiome, and compromise the healing capacity of periodontal tissues, leading to increased susceptibility to periodontal destruction.[ 15 ] Age was another important predictive feature in our study, with older individuals being at higher risk for periodontal disease. This finding is supported by numerous epidemiological studies that have demonstrated an increased prevalence and severity of periodontal disease with advancing age.[ 16 ] The cumulative exposure to risk factors over time, along with age-related changes in the immune system and tissue homeostasis, may contribute to the higher risk of periodontal disease in older adults.[ 17 ] Education level was also identified as one of the top predictive features, which is in line with research consistently showing a strong association between lower education levels and higher prevalence and severity of periodontal disease.[ 18 ] Individuals with lower education levels may have limited access to dental care, and lower oral health literacy, and may engage in health-compromising behaviors, all of which contribute to an increased risk of periodontal disease.[ 19 ] GGT, a liver enzyme associated with oxidative stress and systemic inflammation, has been reported to have elevated levels in patients with periodontal disease, indicating a link between liver function and periodontal health.[ 20 , 21 ] Sanikop et al. found that GGT levels were significantly higher in patients with chronic periodontitis compared to healthy controls and positively correlated with the severity of periodontal destruction.[ 22 ] Our findings further support the association between GGT and periodontal disease, highlighting its potential as a biomarker for periodontal risk assessment. Furthermore, serum albumin was another predictive feature in our model. Serum albumin is the main protein synthesized by the liver and is a practical marker of general health status, demonstrating the severity of underlying diseases. Inflammation and malnutrition both reduce albumin concentration by decreasing its rate of synthesis.[ 23 ] Ogawa et al. suggest an inverse relationship between periodontal disease and serum albumin concentration, possibly influenced by nutritional aspects and inflammatory markers such as C-reactive protein.[ 23 ] The decreased serum albumin levels associated with periodontitis may be attributed to the impairment of the host response, including phagocytic function, cell-mediated immunity, complement system, secretory antibody, and cytokine production and function, potentially contributing to the progression of periodontal destruction.[ 23 ] Blood urea nitrogen (BUN) is a marker of kidney function. Various factors can influence BUN levels, such as kidney function, protein intake, and catabolic states.[ 24 ] Our model revealed that BUN played a role in predicting periodontitis, in addition to other variables. Some studies have reported associations between elevated BUN and periodontal disease severity. Kshirsagar et al. found that individuals with periodontal disease had a higher prevalence of renal insufficiency, as indicated by elevated BUN levels.[ 24 ] Akar et al. reported that BUN levels were significantly higher in patients with chronic periodontitis than in healthy controls.[ 25 ] The evidence suggests a link between impaired kidney function, reflected by elevated BUN, and periodontal disease progression, possibly due to the bidirectional relationship between these two conditions. Blood glucose was one of the most influential features for predicting periodontitis in our study, aligning with the well-known bidirectional relationship between hyperglycemia or diabetes and periodontal disease. Individuals with diabetes have a higher risk of periodontitis, and periodontal inflammation can induce insulin resistance and worsen glycemic control.[ 26 ] Hyperglycemia contributes to an exaggerated inflammatory response, impaired wound healing, altered oral microbial composition, amplifying periodontal destruction.[ 27 ] Our results, combined with substantial evidence, emphasize the importance of screening for diabetes and monitoring glycemic status in individuals at high risk for periodontitis to enable timely intervention and co-management. Our study identified serum phosphorus levels as a significant predictive feature, with lower levels associated with increased periodontitis risk, aligning with previous research suggesting an inverse relationship between serum phosphorus and periodontal disease.[ 28 ] Although the underlying mechanisms remain unclear, they may involve phosphorus’s role in bone metabolism and inflammation.[ 28 ] Further research is needed to elucidate the precise relationship. Creatinine, a marker of kidney function, was identified as a predictor of periodontal disease in our study.[ 29 ] Previous research by Arora et al. and Kapellas et al. supports this association, demonstrating higher creatinine levels in patients with chronic periodontitis and linking elevated creatinine with an increased risk of periodontal disease.[ 30 , 31 ] Our findings reinforce this link and suggest that creatinine may be a useful biomarker for periodontal risk assessment. Our study identified basophil count as an important predictive feature of periodontal disease. Recent studies support this finding, suggesting a potential role of basophils in the pathogenesis of periodontal disease. Basophils release histamine and other inflammatory mediators, contributing to the inflammatory process in periodontal tissues.[ 32 ] Arun et al. found a significant increase in basophil count in patients with chronic periodontitis compared to healthy controls.[ 33 ] Agarwal et al. reported that basophil count was positively associated with the severity of periodontal disease.[ 34 ] These findings, along with our results, highlight the potential of basophil count as a biomarker for periodontal disease risk assessment. Our study identified total calcium levels as an important variable in predicting the risk of periodontitis. Machado et al. noted that the relationship between serum calcium levels and periodontitis remains unclear.[ 35 ] However, other studies have reported conflicting results, suggesting a potential link between altered calcium homeostasis and periodontal disease.[ 36 , 37 ] Various factors, including dietary intake, hormonal regulation, and certain medical conditions, can affect serum calcium levels.[ 35 ] Although the exact mechanisms linking calcium to periodontitis remain unclear, alterations in calcium metabolism may influence periodontal health through its effects on bone metabolism, immune function, or other physiological processes.[ 35 ] Further research exploring the relationship between calcium homeostasis, periodontal disease, and other systemic factors could clarify calcium’s role in the pathogenesis of periodontitis. Artificial intelligence and machine learning techniques have the potential to revolutionize periodontal disease risk assessment and prediction.[ 8 , 38 ] These technologies utilize advanced statistical modeling and algorithmic learning to uncover complex relationships within large datasets, enabling the development of highly accurate prediction tools.[ 39 , 40 ] Recent studies have demonstrated promising applications in periodontal disease management, including predicting treatment outcomes, detecting disease from radiographs, and identifying high-risk individuals.[ 10 , 41 , 42 ] Our findings further highlight the importance of integrating medical and dental care by demonstrating that routine blood tests can predict the risk of developing periodontitis. This machine learning model provides a valuable tool for early detection and prevention of periodontitis in primary care and non-dental healthcare settings. Based on our findings, we have several recommendations. We propose that medical professionals, particularly those in primary care, incorporate periodontal risk assessments into their evaluations using accessible blood parameters. To effectively implement these recommendations, we suggest developing a standardized screening protocol that uses our predictive model to identify individuals at high risk for periodontitis. Once identified, these patients can be referred to dental professionals for further evaluation and treatment, fostering a collaborative approach between medical and dental care providers. By bridging the gap between these two domains of healthcare, we can enhance the early detection and management of periodontitis, ultimately leading to improved oral and overall health outcomes for patients. This integrated approach can also raise awareness among medical professionals about the importance of oral health and its connection to systemic well-being, encouraging a more comprehensive and holistic view of patient care. While our study offers valuable insights, it is limited by its cross-sectional design, preventing the assessment of temporal relationships, and its reliance on a single NHANES cycle, potentially limiting generalizability. Future research should validate these models in independent cohorts and explore incorporating additional clinical and biological markers alongside routine blood tests to enhance prediction accuracy. Prospective studies are also needed to examine the temporal relationships between predictive factors and disease progression. 5 CONCLUSION In conclusion, our study demonstrates the potential of machine learning models to accurately predict periodontal disease risk using routine blood tests and demographic data. Identifying key biomarkers like GGT, albumin, BUN, glucose, phosphorus, creatinine, basophil count, and total calcium, our model offers a valuable tool for early detection and risk assessment in non-dental settings. Integrating this into routine medical exams could facilitate timely referrals and proactive management, improving oral and overall health. Further research is needed to validate these findings in diverse populations and explore additional biomarkers for enhanced predictive accuracy of machine learning models for periodontal disease risk assessment. Data Availability The data that supports the findings of this study are available from the corresponding author upon reasonable request. AUTHOR CONTRIBUTIONS Bushra Ahmad designed the study, acquired data, assisted with data analysis, and wrote the manuscript. Khaled Saleh contributed to the writing of the manuscript, interpreting the data, and revising the manuscript. Saleh Alharbi revised the manuscript. Hend Alqaderi supervised the study, assisted with machine learning analysis, and revised the manuscript. Y. Natalie Jeong provided critical revisions of the manuscript. All authors approved the final version of the manuscript to be published and agreed to be accountable for all aspects of the work. Footnotes Author Approval: All authors have seen and approved the manuscript. Competing Interests Statement: The authors declare no competing interests. Data Availability Statement: The data that supports the findings of this study are available from the corresponding author upon reasonable request. Funding Statement: This research did not receive any specific grant from funding agencies in the public, commercial, or not-for-profit sectors. REFERENCES 1. ↵ Nazir MA . Prevalence of periodontal disease, its association with systemic diseases and prevention . Int J Health Sci (Qassim) . 2017 ; 11 ( 2 ): 72 – 80 . OpenUrl 2. ↵ Preshaw PM , Bissett SM. Periodontitis and diabetes . Br Dent J. 2019 ; 227 ( 7 ): 577 - 584 . doi: 10.1038/s41415-019-0794-5 . OpenUrl CrossRef PubMed 3. ↵ Daalderop LA , Wieland BV , Tomsin K , et al. Periodontal disease and pregnancy outcomes: Overview of systematic reviews . JDR Clin Trans Res . 2018 ; 3 ( 1 ): 10 – 27 . doi: 10.1177/2380084417731097 . OpenUrl CrossRef 4. ↵ Barati M , Alinejad F , Bahar MA , et al. Comparison of WBC, ESR, CRP and PCT serum levels in septic and non-septic burn cases . Burns . 2008 ; 34 ( 6 ): 770 – 774 . OpenUrl CrossRef PubMed Web of Science 5. ↵ Bansal T , Pandey A , Asthana AK . C-reactive protein (CRP) and its association with periodontal disease: A brief review . J Clin Diagn Res . 2014 ; 8 ( 7 ): ZE21 - ZE24 . doi: 10.7860/JCDR/2014/8355.4646 . OpenUrl CrossRef 6. ↵ Loos BG . Systemic markers of inflammation in periodontitis . J Periodontol . 2005 ; 76 ( 11 Suppl ): 2106 - 2115 . doi: 10.1902/jop.2005.76.11-S.2106 . OpenUrl CrossRef PubMed Web of Science 7. ↵ Zhan Y , Samietz S , Holtfreter B , et al. Prospective study of serum 25-hydroxy vitamin D and tooth loss . J Dent Res . 2014 ; 93 ( 7 ): 639 – 644 . doi: 10.1177/0022034514534985 . OpenUrl CrossRef PubMed 8. ↵ Rajkomar A , Dean J , Kohane I . Machine learning in medicine . N Engl J Med . 2019 ; 380 ( 14 ): 1347 – 1358 . doi: 10.1056/NEJMra1814259 . OpenUrl CrossRef PubMed 9. ↵ Deo RC . Machine learning in medicine . Circulation . 2015 ; 132 ( 20 ): 1920 – 1930 . doi: 10.1161/CIRCULATIONAHA.115.001593 . OpenUrl Abstract / FREE Full Text 10. ↵ Kim J , Lee HS , Song IS , Jung KH . DeNTNet: Deep Neural Transfer Network for the detection of periodontal bone loss using panoramic dental radiographs . Sci Rep . 2019 ; 9 ( 1 ): 17615 . Published 2019 Nov 26. doi: 10.1038/s41598-019-53758-2 . OpenUrl CrossRef 11. ↵ Papantonopoulos G , Takahashi K , Bountis T , Loos BG . Artificial neural networks for the diagnosis of aggressive periodontitis trained by immunologic parameters . PLoS One . 2014 ; 9 ( 3 ): e89757 . doi: 10.1371/journal.pone.0089757 . OpenUrl CrossRef 12. ↵ Chapple ILC , Genco R; Working group 2 of the joint EFP/AAP workshop. Diabetes and periodontal diseases: consensus report of the Joint EFP/AAP Workshop on Periodontitis and Systemic Diseases . J Periodontol . 2013 ; 84 ( 4 suppl ): S106 - S112 . doi: 10.1902/jop.2013.1340011 . OpenUrl CrossRef PubMed 13. ↵ Centers for Disease Control and Prevention . National Health and Nutrition Examination Survey . Accessed April 27 , 2024 . https://www.cdc.gov/nchs/nhanes/index.htm 14. ↵ Leite FRM , Nascimento GG , Scheutz F , López R . Effect of smoking on periodontitis: A systematic review and meta-regression . Am J Prev Med . 2018 ; 54 ( 6 ): 831 – 841 . OpenUrl CrossRef PubMed 15. ↵ Nociti FH Jr , Casati MZ , Duarte PM . Current perspective of the impact of smoking on the progression and treatment of periodontitis . Periodontol 2000 . 2015 ; 67 ( 1 ): 187 - 210 . OpenUrl CrossRef 16. ↵ Eke PI , Dye BA , Wei L , Thornton-Evans GO , Genco RJ . Prevalence of periodontitis in adults in the United States: 2009 and 2010 . J Dent Res . 2012 ; 91 ( 10 ): 914 – 920 . doi: 10.1177/0022034512457373 OpenUrl CrossRef PubMed 17. ↵ Ebersole JL , Graves CL , Gonzalez OA , et al. Aging, inflammation, immunity, and periodontal disease . Periodontol 2000 . 2016 ; 72 ( 1 ): 54 - 75 . doi: 10.1111/prd.12135 OpenUrl CrossRef PubMed 18. ↵ Borrell LN , Crawford ND . Socioeconomic position indicators and periodontitis: Examining the evidence . Periodontol 2000 . 2012 ; 58 ( 1 ): 69 - 83 . OpenUrl CrossRef PubMed 19. ↵ Boillot A , El Halabi B , Batty GD , Rangé H , Czernichow S , Bouchard P . Education as a predictor of chronic periodontitis: A systematic review with meta-analysis population-based studies . PLoS One . 2011 ; 6 ( 7 ): e21508 . OpenUrl CrossRef PubMed 20. ↵ Lee DH , Blomhoff R , Jacobs DR Jr . Is serum gamma glutamyl transferase a marker of oxidative stress? Free Radic Res . 2004 ; 38 ( 6 ): 535 – 539 . doi: 10.1080/10715760410001694026 OpenUrl CrossRef PubMed Web of Science 21. ↵ Dabra S , China K , Kaushik A . Salivary enzymes as diagnostic markers for detection of gingival/periodontal disease and their correlation with the severity of the disease . J Indian Soc Periodontol . 2012 ; 16 ( 3 ): 358 – 364 . doi: 10.4103/0972-124X.100911 OpenUrl CrossRef PubMed 22. ↵ Sanikop S , Patil S , Agrawal P . Gingival crevicular fluid alkaline phosphatase as a potential diagnostic marker of periodontal disease . J Indian Soc Periodontol . 2012 ; 16 ( 4 ): 513 – 518 . doi: 10.4103/0972-124X.106879 OpenUrl CrossRef 23. ↵ Ogawa H , Yoshihara A , Amarasena N , Hirotomi T , Miyazaki H . Association between serum albumin and periodontal disease in community-dwelling elderly . J Clin Periodontol . 2006 ; 33 : 312 – 316 . doi: 10.1111/j.1600-051X.2006.00901 . OpenUrl CrossRef PubMed 24. ↵ Kshirsagar AV , Moss KL , Elter JR , Beck JD , Offenbacher S , Falk RJ . Periodontal disease is associated with renal insufficiency in the Atherosclerosis Risk In Communities (ARIC) study . Am J Kidney Dis . 2005 ; 45 ( 4 ): 650 – 657 . doi: 10.1053/j.ajkd.2004.12.011 OpenUrl CrossRef PubMed Web of Science 25. ↵ Akar H , Akar GC , Carrero JJ , Stenvinkel P , Lindholm B . Systemic consequences of poor oral health in chronic kidney disease patients . Clin J Am Soc Nephrol . 2011 ; 6 ( 1 ): 218 – 226 . doi: 10.2215/CJN.05470610 OpenUrl Abstract / FREE Full Text 26. ↵ Preshaw PM , Alba AL , Herrera D , et al. Periodontitis and diabetes: a two-way relationship . Diabetologia . 2012 ; 55 ( 1 ): 21 - 31 . doi: 10.1007/s00125-011-2342-y OpenUrl CrossRef PubMed Web of Science 27. ↵ Polak D , Shapira L . An update on the evidence for pathogenic mechanisms that may link periodontitis and diabetes . J Clin Periodontol . 2018 ; 45 ( 2 ): 150 – 166 . OpenUrl PubMed 28. ↵ Najeeb S , Zafar MS , Khurshid Z , Zohaib S , Almas K . The role of nutrition in periodontal health: an update . Nutrients . 2016 ; 8 ( 9 ): 530 . doi: 10.3390/nu8090530 OpenUrl CrossRef 29. ↵ Kshirsagar AV , Moss KL , Elter JR , Beck JD , Offenbacher S , Falk RJ . Periodontal disease is associated with renal insufficiency in the Atherosclerosis Risk In Communities (ARIC) study . Am J Kidney Dis . 2005 ; 45 ( 4 ): 650 – 657 . OpenUrl CrossRef PubMed Web of Science 30. ↵ Arora N , Mishra A , Chugh S . Microbial role in periodontitis: Have we reached the top? Some unsung bacteria other than red complex . J Indian Soc Periodontol . 2014 ; 18 ( 1 ): 9 – 13 . OpenUrl 31. ↵ Kapellas K , Singh A , Bertotti M , Nascimento GG , Jamieson LM . Periodontal and chronic kidney disease association: A systematic review and meta-analysis . Nephrology (Carlton) . 2019 ; 24 ( 2 ): 202 – 212 . OpenUrl 32. ↵ Galdiero MR , Varricchi G , Seaf M , Marone G , Levi-Schaffer F , Marone G . Bidirectional Mast Cell-Eosinophil Interactions in Inflammatory Disorders and Cancer . Front Med (Lausanne) . 2017 ; 4 : 103 . Published 2017 Jul 24 . doi: 10.3389/fmed.2017.00103 OpenUrl CrossRef 33. ↵ Arun KV , Talwar A , Kumar TS . T-helper cells in the etiopathogenesis of periodontal disease: A mini-review . J Indian Soc Periodontol . 2011 ; 15 ( 1 ): 4 – 10 . OpenUrl PubMed 34. ↵ Agarwal S , Suzuki JB , Riccelli AE . Role of cytokines in the modulation of neutrophil chemotaxis in localized juvenile periodontitis . J Periodontal Res . 1994 ; 29 ( 2 ): 127 – 137 . OpenUrl PubMed 35. ↵ Machado AC , Quirino MR , Nascimento LF . Relation between chronic periodontal disease and plasmatic levels of triglycerides, total cholesterol and fractions . Braz Oral Res . 2005 ; 19 ( 4 ): 284 – 289 . doi: 10.1590/s1806-83242005000400009 . OpenUrl CrossRef PubMed 36. ↵ Sewón LA , Karjalainen SM , Soderling E , Lapinleimu H , Simell O . Associations between salivary calcium and oral health . J Clin Periodontol . 1998 ; 25 ( 11 Pt 1 ): 915 - 919 . doi: 10.1111/j.1600-051x.1998.tb02390 . OpenUrl CrossRef PubMed 37. ↵ Amarasena N , Yoshihara A , Hirotomi T , Takano N , Miyazaki H . Association between serum calcium and periodontal disease progression in non-institutionalized elderly . Gerodontology . 2008 ; 25 ( 4 ): 245 – 250 . doi: 10.1111/j.1741-2358.2007.00215 . OpenUrl CrossRef PubMed 38. ↵ Schwendicke F , Golla T , Dreher M , Krois J . Convolutional neural networks for dental image diagnostics: A scoping review . J Dent . 2019 ; 91 : 103226 . doi: 10.1016/j.jdent.2019.103226 37. OpenUrl CrossRef 39. ↵ Trombelli L , Farina R , Silva CO , Tatakis DN . Plaque-induced gingivitis: Case definition and diagnostic considerations . J Periodontol . 2018 ; 89 Suppl 1 : S46 – S73 . doi: 10.1002/JPER.17-0576 39. OpenUrl CrossRef PubMed 40. ↵ Feres M , Louzoun Y , Haber S , et al. Support vector machine-based differentiation between aggressive and chronic periodontitis using microbial profiles . Int Dent J . 2018 ; 68 ( 1 ): 39 – 46 . doi: 10.1111/idj.12321 . OpenUrl CrossRef 41. ↵ Lee JH , Kim DH , Jeong SN , Choi SH . Diagnosis and prediction of periodontally compromised teeth using a deep learning-based convolutional neural network algorithm . J Periodontal Implant Sci . 2018 ; 48 ( 2 ): 114 – 123 . doi: 10.5051/jpis.2018.48.2.114 42. OpenUrl CrossRef 42. ↵ Ahmad B , Saleh K , Alharbi S , Alqaderi H , Jeong YN . Artificial Intelligence in Periodontology: Performance Evaluation of ChatGPT, Claude, and Gemini on the In-service Examination . medRxiv . Published online May 29 , 2024 : 2024.05.29.24308155 . doi: 10.1101/2024.05.29.24308155 OpenUrl Abstract / FREE Full Text View the discussion thread. Back to top Previous Next Posted June 11, 2024. Download PDF Data/Code Email Thank you for your interest in spreading the word about medRxiv. NOTE: Your email address is requested solely to identify you as the sender of this article. Your Email * Your Name * Send To * Enter multiple addresses on separate lines or separate them with commas. You are going to email the following Routine Blood Tests as Predictors of Periodontal Disease Risk Using a Machine Learning Approach Message Subject (Your Name) has forwarded a page to you from medRxiv Message Body (Your Name) thought you would like to see this page from the medRxiv website. Your Personal Message CAPTCHA This question is for testing whether or not you are a human visitor and to prevent automated spam submissions. Share Routine Blood Tests as Predictors of Periodontal Disease Risk Using a Machine Learning Approach Bushra Ahmad , Khaled Saleh , Saleh Alharbi , Y. Natalie Jeong , Athanasios Zavras , Hend Alqaderi medRxiv 2024.06.10.24308375; doi: https://doi.org/10.1101/2024.06.10.24308375 Share This Article: Copy Citation Tools Routine Blood Tests as Predictors of Periodontal Disease Risk Using a Machine Learning Approach Bushra Ahmad , Khaled Saleh , Saleh Alharbi , Y. Natalie Jeong , Athanasios Zavras , Hend Alqaderi medRxiv 2024.06.10.24308375; doi: https://doi.org/10.1101/2024.06.10.24308375 Citation Manager Formats BibTeX Bookends EasyBib EndNote (tagged) EndNote 8 (xml) Medlars Mendeley Papers RefWorks Tagged Ref Manager RIS Zotero Tweet Widget Facebook Like Google Plus One Subject Area Dentistry and Oral Medicine Subject Areas All Articles Addiction Medicine (573) Allergy and Immunology (864) Anesthesia (302) Cardiovascular Medicine (4449) Dentistry and Oral Medicine (444) Dermatology (383) Emergency Medicine (609) Endocrinology (including Diabetes Mellitus and Metabolic Disease) (1515) Epidemiology (15240) Forensic Medicine (30) Gastroenterology (1130) Genetic and Genomic Medicine (6614) Geriatric Medicine (669) Health Economics (1000) Health Informatics (4550) Health Policy (1372) Health Systems and Quality Improvement (1613) Hematology (543) HIV/AIDS (1268) Infectious Diseases (except HIV/AIDS) (15928) Intensive Care and Critical Care Medicine (1106) Medical Education (624) Medical Ethics (147) Nephrology (668) Neurology (6622) Nursing (346) Nutrition (999) Obstetrics and Gynecology (1147) Occupational and Environmental Health (957) Oncology (3343) Ophthalmology (977) Orthopedics (369) Otolaryngology (421) Pain Medicine (436) Palliative Medicine (130) Pathology (665) Pediatrics (1695) Pharmacology and Therapeutics (693) Primary Care Research (714) Psychiatry and Clinical Psychology (5459) Public and Global Health (9249) Radiology and Imaging (2205) Rehabilitation Medicine and Physical Therapy (1371) Respiratory Medicine (1197) Rheumatology (597) Sexual and Reproductive Health (715) Sports Medicine (530) Surgery (714) Toxicology (99) Transplantation (289) Urology (265) (function(){function c(){var b=a.contentDocument||a.contentWindow.document;if(b){var d=b.createElement('script');d.innerHTML="window.__CF$cv$params={r:'a02934bf2ad9593a',t:'MTc3OTkyODgwNg=='};var a=document.createElement('script');a.src='/cdn-cgi/challenge-platform/scripts/jsd/main.js';document.getElementsByTagName('head')[0].appendChild(a);";b.getElementsByTagName('head')[0].appendChild(d)}}if(document.body){var a=document.createElement('iframe');a.height=1;a.width=1;a.style.position='absolute';a.style.top=0;a.style.left=0;a.style.border='none';a.style.visibility='hidden';document.body.appendChild(a);if('loading'!==document.readyState)c();else if(window.addEventListener)document.addEventListener('DOMContentLoaded',c);else{var e=document.onreadystatechange||function(){};document.onreadystatechange=function(b){e(b);'loading'!==document.readyState&&(document.onreadystatechange=e,c())}}}})();
Text is read by the "Ask this paper" AI Q&A widget below.
Extraction quality varies by source — PMC NXML preserves structure
cleanly, OA-HTML may include some navigation residue, and OA-PDF can
have broken hyphenation. The publisher copy
(via DOI)
is the canonical version.