Development and validation of a personalised antipsychotic selection tool for first-line treatment in severe mental illness

doi:10.1101/2025.03.24.25324323

Development and validation of a personalised antipsychotic selection tool for first-line treatment in severe mental illness

2025 · doi:10.1101/2025.03.24.25324323

preprint OA: gold CC-BY-4.0

📄 Open PDF Full text JSON View at publisher

Full text 47,642 characters · extracted from preprint-html · click to expand

Development and validation of a personalised antipsychotic selection tool for first-line treatment in severe mental illness | medRxiv /* */ /* */ <!-- <!-- /*! * yepnope1.5.4 * (c) WTFPL, GPLv2 */ (function(a,b,c){function d(a){return"[object Function]"==o.call(a)}function e(a){return"string"==typeof a}function f(){}function g(a){return!a||"loaded"==a||"complete"==a||"uninitialized"==a}function h(){var a=p.shift();q=1,a?a.t?m(function(){("c"==a.t?B.injectCss:B.injectJs)(a.s,0,a.a,a.x,a.e,1)},0):(a(),h()):q=0}function i(a,c,d,e,f,i,j){function k(b){if(!o&&g(l.readyState)&&(u.r=o=1,!q&&h(),l.onload=l.onreadystatechange=null,b)){"img"!=a&&m(function(){t.removeChild(l)},50);for(var d in y[c])y[c].hasOwnProperty(d)&&y[c][d].onload()}}var j=j||B.errorTimeout,l=b.createElement(a),o=0,r=0,u={t:d,s:c,e:f,a:i,x:j};1===y[c]&&(r=1,y[c]=[]),"object"==a?l.data=c:(l.src=c,l.type=a),l.width=l.height="0",l.onerror=l.onload=l.onreadystatechange=function(){k.call(this,r)},p.splice(e,0,u),"img"!=a&&(r||2===y[c]?(t.insertBefore(l,s?null:n),m(k,j)):y[c].push(l))}function j(a,b,c,d,f){return q=0,b=b||"j",e(a)?i("c"==b?v:u,a,b,this.i++,c,d,f):(p.splice(this.i++,0,a),1==p.length&&h()),this}function k(){var a=B;return a.loader={load:j,i:0},a}var l=b.documentElement,m=a.setTimeout,n=b.getElementsByTagName("script")[0],o={}.toString,p=[],q=0,r="MozAppearance"in l.style,s=r&&!!b.createRange().compareNode,t=s?l:n.parentNode,l=a.opera&&"[object Opera]"==o.call(a.opera),l=!!b.attachEvent&&!l,u=r?"object":l?"script":"img",v=l?"script":u,w=Array.isArray||function(a){return"[object Array]"==o.call(a)},x=[],y={},z={timeout:function(a,b){return b.length&&(a.timeout=b[0]),a}},A,B;B=function(a){function b(a){var a=a.split("!"),b=x.length,c=a.pop(),d=a.length,c={url:c,origUrl:c,prefixes:a},e,f,g;for(f=0;f<d;f++)g=a[f].split("="),(e=z[g.shift()])&&(c=e(c,g));for(f=0;f<b;f++)c=x[f](c);return c}function g(a,e,f,g,h){var i=b(a),j=i.autoCallback;i.url.split(".").pop().split("?").shift(),i.bypass||(e&&(e=d(e)?e:e[a]||e[g]||e[a.split("/").pop().split("?")[0]]),i.instead?i.instead(a,e,f,g,h):(y[i.url]?i.noexec=!0:y[i.url]=1,f.load(i.url,i.forceCSS||!i.forceJS&&"css"==i.url.split(".").pop().split("?").shift()?"c":c,i.noexec,i.attrs,i.timeout),(d(e)||d(j))&&f.load(function(){k(),e&&e(i.origUrl,h,g),j&&j(i.origUrl,h,g),y[i.url]=2})))}function h(a,b){function c(a,c){if(a){if(e(a))c||(j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}),g(a,j,b,0,h);else if(Object(a)===a)for(n in m=function(){var b=0,c;for(c in a)a.hasOwnProperty(c)&&b++;return b}(),a)a.hasOwnProperty(n)&&(!c&&!--m&&(d(j)?j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}:j[n]=function(a){return function(){var b=[].slice.call(arguments);a&&a.apply(this,b),l()}}(k[n])),g(a[n],j,b,n,h))}else!c&&l()}var h=!!a.test,i=a.load||a.both,j=a.callback||f,k=j,l=a.complete||f,m,n;c(h?a.yep:a.nope,!!i),i&&c(i)}var i,j,l=this.yepnope.loader;if(e(a))g(a,0,l,0);else if(w(a))for(i=0;i (function(w,d,s,l,i){w[l]=w[l]||[];w[l].push({'gtm.start':new Date().getTime(),event:'gtm.js'});var f=d.getElementsByTagName(s)[0];var j=d.createElement(s);var dl=l!='dataLayer'?'&l='+l:'';j.src='//www.googletagmanager.com/gtm.js?id='+i+dl;j.type='text/javascript';j.async=true;f.parentNode.insertBefore(j,f);})(window,document,'script','dataLayer','GTM-P4HH5NV'); Skip to main content Home About Submit ALERTS / RSS Search for this keyword Advanced Search Development and validation of a personalised antipsychotic selection tool for first-line treatment in severe mental illness S Hardoon , DPJ Osborn , M Boman , F Ben Abdesslem , A Richards-Belle , N Launders , K Man , ICK Wong , C Dalman , G Ambler , I Petersen , JF Hayes doi: https://doi.org/10.1101/2025.03.24.25324323 S Hardoon 1 Division of Psychiatry, UCL , London, UK Find this author on Google Scholar Find this author on PubMed Search for this author on this site For correspondence: s.hardoon{at}ucl.ac.uk DPJ Osborn 1 Division of Psychiatry, UCL , London, UK 2 North London NHS Foundation Trust , London, UK Find this author on Google Scholar Find this author on PubMed Search for this author on this site M Boman 1 Division of Psychiatry, UCL , London, UK 3 Division of Clinical Epidemiology, Karolinska Institute , Stockholm, Sweden Find this author on Google Scholar Find this author on PubMed Search for this author on this site F Ben Abdesslem 1 Division of Psychiatry, UCL , London, UK 4 Department of Clinical Neuroscience, Karolinska Institute , Stockholm, Sweden 5 Research Institutes of Sweden , Stockholm, Sweden Find this author on Google Scholar Find this author on PubMed Search for this author on this site A Richards-Belle 1 Division of Psychiatry, UCL , London, UK Find this author on Google Scholar Find this author on PubMed Search for this author on this site N Launders 1 Division of Psychiatry, UCL , London, UK Find this author on Google Scholar Find this author on PubMed Search for this author on this site K Man 6 UCL School of Pharmacy, UCL , London, UK Find this author on Google Scholar Find this author on PubMed Search for this author on this site ICK Wong 6 UCL School of Pharmacy, UCL , London, UK 7 Department of Pharmacology and Pharmacy, University of Hong Kong Find this author on Google Scholar Find this author on PubMed Search for this author on this site C Dalman 8 Department of Global Public Health, Karolinska Institute , Stockholm, Sweden Find this author on Google Scholar Find this author on PubMed Search for this author on this site G Ambler 9 Department of Statistical Science, UCL , London, UK Find this author on Google Scholar Find this author on PubMed Search for this author on this site I Petersen 10 Institute of Epidemiology and Healthcare, UCL , London, UK 11 Department of Clinical Epidemiology, Aarhus University , Denmark Find this author on Google Scholar Find this author on PubMed Search for this author on this site JF Hayes 1 Division of Psychiatry, UCL , London, UK 2 North London NHS Foundation Trust , London, UK Find this author on Google Scholar Find this author on PubMed Search for this author on this site Abstract Full Text Info/History Metrics Supplementary material Data/Code Preview PDF Summary Background Guidance is lacking on choice of first-line antipsychotic for individuals with incident severe mental illness (SMI). Patients may try several before an effective, well-tolerated drug is identified, delaying symptom improvement. We aimed to develop a personalised selection tool to identify the optimum first-line antipsychotic, based on individual sociodemographic and clinical characteristics. Methods Risk prediction development and validation study using electronic health records (EHRs) from primary care in England (Clinical Practice Research Datalink) linked to Hospital Episode Statistics, including 11,811 individuals with incident SMI prescribed aripiprazole, olanzapine, quetiapine or risperidone as first-line treatment between 2007-2016. The outcome was time to psychiatric hospitalisation or change to different antipsychotic within 3 years of commencing treatment. Prediction algorithms were developed using Cox proportional hazards models in a 70% training sample and validated in a 30% hold-out sample. This baseline model was compared with machine learning survival models of increasing complexity. Potential predictors included demographics, diagnoses, concomitant medications and laboratory findings. Outcomes Among 8,225 individuals in the development cohort, 4,456 (54.2%) experienced the outcome. In model validations, 1,022 (53.3%) of 1,916 in the validation cohort did not receive the optimal antipsychotic identified by the personalised selection tool. The predicted 3-year outcome risk if all individuals received the medication assigned by the tool was 6.3% lower (95% CI 4.0%-8.5%) than the observed 3-year risk in the validation cohort, and 10.2% lower (95%CI 7.9%-12.5%) than if individuals were randomly assigned an antipsychotic (corresponding numbers need to treat of 16 and 10). Machine learning approaches did not meaningfully improve model performance. Interpretation A personalised tool based on EHR data could improve treatment success rates by optimising first-line antipsychotic selection. Machine learning did not outperform traditional prediction methods. Further research will assess the impact on adverse events and in other populations. Funding UK Research and Innovation grant MR/V023373/1. Evidence before this study We searched PubMed for articles published from database inception to December 13, 2024, with no language restrictions. We searched titles and abstracts using the terms ((prediction) AND ((treatment response) OR (treatment rule) OR (treatment outcome)) AND ((psychosis) OR (severe mental illness) OR (schizophrenia) OR (bipolar disorder))). We identified 187 articles for full text screening. A number of studies exist on the prediction of lithium treatment response. A recent systematic review summarised the results of eight studies that used biomarkers, clinical and socio-demographic features to predict treatment response in psychosis, however these commonly compared responders with non-responders, rather than developing treatment selection rules. Two studies did generate treatment selection recommendations. One used a Super Learner in Taiwan National Health insurance data to optimise antipsychotic selection in first episode psychosis, resulting in a 7% improvement in estimated treatment success rate. The second examined antipsychotic selection, choosing between risperidone and aripiprazole, in children using Korean National Health insurance data and found a 1.2-1.5 times increase in antipsychotic continuation using their model compared to their allocated treatment. They found no improvement in performance when comparing machine learning with simple regression models. Neither model has been externally validated. We could not find any models that are in clinical use. Added value of this study We found that a simple treatment selection prediction model, based on data contained in the electronic health records at the point that an individual with severe mental illness is first prescribed an antipsychotic, could reduce treatment failure rates by 6-10%. In our validation cohort 75% of patients were switched to an alternative antipsychotic medication by the treatment selection tool. In line with the limited number of previous studies in this area, we did not observe meaningful improvements in predictive properties when machine learning approaches were compared with traditional models. Implications of all the available evidence Prediction models for optimising treatment selection in psychiatry are becoming increasingly possible with data from electronic health records. Improving treatment selection for people with SMI is low risk, compared to other prediction problems in psychiatry, and could improve long-term outcomes. Models still need full external validation and testing in new cohorts. Background Severe mental illnesses (SMI), including schizophrenia, bipolar disorder and other non-organic psychotic illnesses, have a lifetime prevalence of approximately 1% each, and are in the top twenty diseases in terms of disability. This disability burden has been increasing over the past 30 years.[ 1 ] SMI is associated with high levels of premature mortality and morbidity, with a mean age of death 15 years younger than the general population.[ 2 ] SMI is challenging to treat. Thirty different antipsychotics are approved for use in the United Kingdom (UK), but it can take a long time to find the optimal antipsychotic for a patient, delaying potential improvements in symptoms. Early, optimised treatment in incident SMI could reduce symptom burden, non-adherence and morbidity. Personalised or precision medicine aims to assign a patient the optimal treatment, based on their predicted response; thereby moving from average group outcomes to the prediction of outcomes for individual patients.[ 3 ] Algorithms that predict response to different medications based on a patient’s demographic, clinical, genetic and biomarker characteristics may be used to better determine which first-line treatment is most likely to be effective for an individual patient.[ 4 ] Regarding personalising treatment for SMI, there is ongoing work focusing on genome-wide associations[ 5 ] and biomarkers (for example, from functional magnetic resonance imaging [ 6 ] and electroencephalography[ 7 ]). However, these approaches have yet to bear fruit clinically. Despite the rich data available, little attention has been paid to predictive analytics using other data sources such as Electronic Health Records (EHRs), which can provide real-world outcomes and adverse event information for large numbers of patients with SMI. This contrasts with cardiovascular disease (CVD), where algorithms for CVD risk are in use clinically[ 8 ]. Models selecting between approved and commonly used treatments are low risk compared to other prediction problems in psychiatry; such as prediction of psychosis or suicide, where false negatives and false positives can have devastating impact [ 9 ]. Machine learning procedures may improve on traditional regression methods, because of the ability to discover hidden risk factors and interactions, nonlinear, and higher-order effects, as well as to approximate intricate functions that are poorly represented by individual covariate or interaction terms.[ 10 , 11 ] Previous studies have used machine learning methods to predict treatment response in depression,[ 12 , 13 ] but few personalised medicine studies exist for SMI.[ 11 , 14 , 15 ] The majority of the studies in people with SMI focus on predicting response to particular medications, rather than comparing different medications to obtain an overall personalised treatment selection rule.[ 16 – 19 ] The two previous studies which do, both concern personalised treatment selection for schizophrenia in Asian populations; applicability to other populations and SMI groups is unknown.[ 20 , 21 ] The aim of this study was to use a large EHR data set to develop and validate algorithms to predict treatment response to different antipsychotics in incident SMI, in order to identify the optimum first-line antipsychotic treatment. Four antipsychotics, most commonly prescribed as first-line treatments in the UK, were considered: aripiprazole, quetiapine, olanzapine and risperidone.[ 22 ] A secondary aim was to compare machine learning methods with traditional regression modelling for development of the algorithms. Methods Data source Data came from the Clinical Practice Research Datalink (CPRD) Aurum database, which comprises anonymised EHRs retrieved from participating general practices using EMIS software across the UK [ 23 ]. A CPRD data set build from May 2022 was used. The database includes recorded diagnoses, symptoms and other health data (blood tests, health indicators), and all issued medication prescriptions. Medical diagnoses and symptoms information is recorded using a mixture of Read, SNOMED and local EMIS coding systems. Records from primary care practices in England which had agreed to record linkage were linked by the data providers to secondary care hospital records from Hospital Episode Statistics (HES) data, including records from accident and emergency (A&E) (from 1/4/2007 to 31/03/2020), and admitted patient care (APC) (1/4/1997 to 31/03/2021). Study design In a nationwide retrospective cohort derived from EHRs, we conducted risk prediction algorithm development and validation for predicting response to different antipsychotics as first-line treatment in severe mental illness. We compared traditional risk prediction modelling and machine learning methods.[ 10 , 11 ] Setting The National Health Service in England. Cohort The cohort comprised of individuals with incident SMI between January 2007 and December 2016, who commenced on one of four antipsychotics as a first-line monotherapy treatment: aripiprazole, quetiapine, olanzapine, and risperidone (identified as the first antipsychotic prescription in prescription records). The 10-year period ensured the newest drug aripiprazole was available in routine practice (following approval in 2004) and the end date enabled three years follow-up (to December 2019) before the 2020 COVID-19 pandemic, and to coincide with the timeframe of HES linkage. Patients aged 10-99 years at time of first prescription were included. Incident SMI cases were defined as the first clinical record of schizophrenia, other psychosis or bipolar disorder. Code lists for these diagnoses were updated from established lists.[ 24 ] Further details of how the cohort was defined are given in the Appendix. 70% of the cohort was randomly selected to be a “development cohort” used for developing the risk prediction algorithms. The remaining 30% of the cohort was used for testing the algorithms (validation cohort). The development cohort was split further into four separate cohorts according to antipsychotic received, likewise for the validation cohort. Outcome/ Choice of primary measure Our outcome was time to a new intervention for psychosis. This included: a switch to a different antipsychotic, add-on of another antipsychotic or mood stabiliser, or psychiatric hospitalisation. This composite measure was chosen to capture treatment failure and similar outcomes have been used in pragmatic randomised controlled trials in psychiatry.[ 25 , 26 ] Psychiatric hospitalisations were included as indicative of increased severity of symptoms and thus treatment failure. Switches/add-ons of medications were included as indicative of the initial medication being suboptimal and thus treatment failure. Discontinuation of the medication alone was not included in the outcome as it could indicate both the medication being ineffective or the medication being effective enough for symptoms to have improved to the extent that medication is halted. The components of our outcome are well-recorded in EHRs and strongly associated with worsened quality of life.[ 27 ] Antipsychotic medications were identified from drug issue records as records with BNF Chapter 4.2 or with SNOMED codes mapped to BNF Chapter 4.2. Psychiatric hospitalisations were identified from linked HES records as hospital APC or A&E episodes with a psychiatric primary diagnosis (ICD chapters F10-F69) and/or with a psychiatric treatment specialty and/or a record of self-harm (given as a primary or subsequent diagnosis, or as the reason for the A&E episode) and/or a symptom/ injury as a primary diagnosis (ICD T36-50, T96, Y10-34, Y87.2, R44-46, R63.6) with a psychiatric secondary diagnosis. Follow-up Follow-up start (baseline) was the date of the first prescription for the antipsychotic given as first-line monotherapy. Study exit (censor date) was the earliest of: death date, date patient transferred out of the practice, date of last data collection for practice, 31 December 2019, three years after baseline. Follow-up time was time from baseline to the earliest of censor date or date of outcome. Potential predictors Following sample size calculations (see Appendix) we considered an initial set of key demographic and psychiatric variables totalling 23 coefficients, to satisfy the smallest cohort sample size calculation: age at baseline, sex, ethnicity, type of SMI (schizophrenia, bipolar disorder, other psychosis), time from first SMI diagnosis to first antipsychotic prescription, prior diagnoses in the primary care records of: depression, anxiety, eating disorder, personality disorder, post-traumatic stress disorder, adverse childhood experiences, prior recorded drug misuse or alcohol misuse and the number of psychiatric hospitalisations in the previous year. We then considered a wider list of pharmacological and physical health predictors (full list in Table 1 ). Details of how predictors were ascertained and sample size calculations are in the Appendix. View this table: View inline View popup Table 1: Distributions of predictor variables in the development cohorts Statistical methods Classical risk prediction model development Separate prediction models for each of the four medication types were developed, first considering the key predictors totalling 23 coefficients, and then the wider list. Prediction models were derived from Cox proportional hazards multivariable regression models. Backwards elimination using the Akaike Information Criteria was used to identify which predictors to retain in the final models. The prediction models for each medication type were then combined to form the overall treatment rule: an individual is assigned the medication for which they are computed to have the lowest overall predicted 3-year risk. Full details of model development (including imputation of missing data, use of fractional polynomials to assess form of continuous variables, categorisations of variables) are given in the Appendix, with levels of missingness reported in Appendix Table 1. Model validation and comparisons Model validity was assessed by computing Uno’s C index and Royston’s D statistic for discrimination, the calibration slope and the sensitivity and specificity at three years for different risk thresholds. Each medication risk prediction model was validated in the separate validation cohort for that medication. Details of the model validations are given in the Appendix. The utility of the overall treatment rule was investigated by comparing the predicted 3-year risk if all individuals are assigned the medication dictated by the risk prediction models (medication which corresponds to lowest predicted risk for the individual) with i) the outcome under the observed medications; ii) the predicted outcome if all people were to receive the same one medication (for each of the four medications in turn); iii) the predicted outcome if all patients were randomly allocated one of the four medications. Absolute risk reductions, and corresponding numbers needed to treat, comparing the risk prediction model medication assignment with each of the other scenarios were computed. In addition, individuals were grouped into two categories: those whose recorded medication was the same as predicted and those whose recorded medication differed from that predicted. Then the outcome was compared between the two groups. Machine learning model development In addition to the classical Cox regression models, several machine learning models (adapted for survival data) were considered: random forest, extreme gradient boosted model, linear and kernel support vector machines, deep learning neural networks and a Super Learner ensemble, combining all the models together. Details of the machine learning models are given in the Appendix. Results Cohort characteristics A total of 11,811 individuals with SMI were identified for inclusion in the analysis, as having received aripiprazole, olanzapine, quetiapine or risperidone as a first-line monotherapy, between 2007-2016. Of these, 8,225 were included in the development cohorts: 904 (11%) having received aripiprazole forming the aripiprazole development cohort, and 2,975 (36%), 2,408 (29%), and 1,968 (24%) in the olanzapine, quetiapine and risperidone cohorts respectively. The remaining 3,556 individuals constituted the validation cohorts, including 397 (11%) individuals having received aripiprazole, and 1,306 (37%), 1,027 (29%) and 826 (23%) having received olanzapine, quetiapine and risperidone respectively. Distributions of predictors in the development cohorts according to medication are shown in table 1 . Predictor distributions in the validation cohorts were broadly similar (Appendix Table 2). Treatment outcomes In the aripiprazole development cohort, outcome events occurred within three years in 456 individuals over 1,487 person-years of follow-up, corresponding to an incidence rate of 306.8 per 1000 person-years at risk (PYAR), 95% confidence interval (CI) 279.9 to 336.3 ( Table 2 ). Among the 456 events, 261 (57.2%) were hospitalisations, 150 (32.9%) were medication switches and 45 (9.9%) were medication add-ons (Appendix table 3). Incidence rates in the olanzapine, quetiapine and risperidone cohorts were: 351.5 (95% CI 335.0 to 368.9), 356.7 (95% CI 338.0 to 376.5) and 332.9 (313.2 to 353.9) respectively. Similar proportions of events were hospitalisations in these groups as for aripiprazole. The five most common medication switches and add-ons in each medication cohort are shown in Appendix table 4. View this table: View inline View popup Download powerpoint Table 2: Incidence rates of treatment failure (hospitalisation and/or medication changes/ add-ons) in the development and validation cohorts Development cohorts Incidence rates of outcome events in the validation cohorts were: aripiprazole 330.4 (95% CI 289.2 to 377.6), olanzapine 317.8 (95% CI 294.9 to 342.4), quetiapine 378.8 (95% CI 349.2 to 410.9) and risperidone 332.9 (95% CI 302.8 to 365.8), per 1000 PYAR. Cox regression models development The final risk prediction models, after backwards elimination for each medication starting from the full list of predictors are shown in table 3 . Key retained predictors included age, sex, ethnicity, time from SMI diagnosis to first prescription, SMI diagnosis, prior depression, anxiety, alcohol misuse and number of prior psychiatric hospitalisations. The final risk prediction models after backwards elimination, developed starting instead from a limited number of predictors totalling 23 coefficients are shown in Appendix table 5. View this table: View inline View popup Table 3: Classical statistical prediction models after backwards elimination – starting from full list of predictors Cox regression models validation and decision rule evaluation Discrimination and calibration statistics and sensitivities and specificities at different risk thresholds for the risk prediction models applied to the validation cohorts are presented in Appendix table 6. Medications predicted by the selection tool based on these Cox models for each individual in the validation cohorts are tabulated against the actual first-line treatment received in table 4 . Models derived from the full list of predictors were used for the selection tool, but results were similar using the models derived from predictors totalling 23 coefficients. More than half of those originally prescribed aripiprazole as first-line treatment were also assigned aripiprazole by the personalised selection tool (58%). View this table: View inline View popup Download powerpoint Table 4: Medications assigned by decision rule versus medications actually prescribed in the validation cohort However, only 18%, 29% and 16% of those prescribed olanzapine, quetiapine and risperidone were assigned the same medication by the decision rule. In all 2,662 (75%) of the those in the validation cohort were assigned a different medication by the selection tool. The mean predicted 3-year risk using our selection tool was 6.3% lower than the observed risk (absolute risk reduction 6.3% (95% CI 4.0% to 8.5%)), corresponding to a number needed to treat of 16 (95% CI 12 to 25). The mean predicted 3-year risk using the treatment rule was between 4% and 13% lower than in the scenario where all individuals were assigned any one medication, and 10% lower than in the scenario of random allocation ( Table 5 ). Further, as a separate evaluation, among individuals in the development cohort who were assigned the same medication by the treatment rule as the medication they were originally prescribed, the observed 3-year risk was 58.8%, while among those for whom a different medication was assigned by the treatment rule, the observed 3-year risk was 55.0% (relative risk of 1.07). View this table: View inline View popup Download powerpoint Table 5: Predicted 3-year risk of treatment failure using decision rule and other treatment rules versus observed 3-year risk of treatment failure in validation cohort Machine learning models development and validation Discrimination statistics from application of the machine learning models to the validation cohorts are shown in Appendix table 7. Of the machine learning models, the extreme gradient boosted models appeared to have consistently stronger performance across all four medication groups, although differences in C statistics between the different models were marginal. The machine learning models, including the Super Learner ensemble, did not materially outperform the classical statistical survival models. Discussion We successfully developed a treatment selection tool to identify the optimum of four medications: aripiprazole, olanzapine, quetiapine and risperidone for use as first-line monotherapy in SMI. The decision rule consisted of applying risk prediction models specific to each medication, encompassing a range of clinical and demographic predictors, to an individual, and then selecting the medication for which the corresponding risk prediction model predicted the lowest 3-year risk of treatment failure (hospitalisation or a change in medication). The tool was applied to a separate validation cohort of individuals who had received one of these medications. We found that had all individuals received the medication indicated by the decision rule, 75% of individuals would have been prescribed a different medication from that actually received. The 3-year risk of treatment failure in the cohort could have been 6% lower than that observed, corresponding to a number needed to treat of 16, and 10% lower than had medications been randomly assigned. To our knowledge, this is the first study to develop a treatment decision rule for all incident SMI (schizophrenia, bipolar disorder and other psychosis) and in populations outside of Asia. A previous study in Taiwan which developed a treatment rule using machine learning for first episode schizophrenia, found a similar difference of 7% between predicted treatment success using the treatment rule, and that observed (52% versus 45%).[ 21 ] In agreement with the present study, they also found that aripiprazole was the most frequently recommended medication by the treatment rule, lending further support to our findings. Another previous study developed a treatment rule for children and adolescents with schizophrenia in South Korea.[ 20 ] That study reported a ratio of treatment continuation (study outcome) of those receiving the medication assigned by the treatment rule relative to those not receiving the assigned medication of 1.2 to 1.5. This is higher than the 1.07 relative risk of treatment failure comparing these two groups in our study. However, the outcome in that study is not directly comparable to our study as it included stopping the medication, as opposed to just switching or adding to the medication. As outlined in the Methods, this is problematic as stopping the medication could indicate treatment success as well as treatment failure. Interestingly, the study in South Korea also compared classical statistical (logistic) regression models with machine learning models and in agreement with our study, found machine learning models did not materially improve performance. The authors attribute the lack of superiority of machine learning models in part to the use of clinically meaningful predictors such that machine learning models had little to add, a finding supported by previous studies using structured data with clinical meaningful predictors[ 28 , 29 ]. This could also be the case in our study. Further, we carefully examined all continuous predictors to assess the appropriate form/transformation in the statistical models, thus the added benefit of machine learning models in capturing non-linear and higher order effects may be limited. Strengths of the study include the wide range of well-defined clinical and demographic predictors available for inclusion in the models, and which reflect the information available to clinicians in practice, thus supporting potential implementation. In addition, the study included a large sample of individuals with SMI receiving first-line monotherapy of one of the four medications of interest, thus the statistical models were powered to include the large number of predictors available. Previous studies have shown people with SMI in UK primary care databases to be broadly representative of the UK SMI population.[ 24 ] A study limitation is the lack of information on medication dose: the treatment decision rule thus only assigns the type of medication and not the dose. The modelling implicitly assumes that the individual is receiving the optimum dose, but treatment failure could be due to the dose being incorrect, rather that the type of medication being suboptimal. However, in the course of treating a patient, the dose is likely to be adjusted and optimised before resorting to changing the medication, thus dose should not unduly influence the results. Secondly, medication adherence is unknown, although we only included people with at least one repeat prescription to indicate the individual adhering to the medication (see Appendix). A third limitation is the nature of the CPRD, comprising a routinely-collected snapshot of an individual’s primary care records, for the period during which the individual is included in the CPRD, which means that historical patient records prior to an individual registering with a general practice that contributes data to CPRD may not be captured. This means that historical antipsychotic prescriptions may be missed such that the first-line treatment as defined here is not the true first antipsychotic medication. However, we only included individuals in the study, for whom the first recorded antipsychotic medication use occurred at least one year after the patient entered the study (Appendix). This helped to minimise the possibility of prior uncaptured antipsychotic medication use. A further limitation is that although a large number of relevant predictors were included, some information was not available which may have equally limited the predictive power of both the machine learning models and the statistical models, specifically genetic factors, and information on severity and clinical presentation of SMI. Future research could explore the influence of these additional factors, as well as potential modifications to try to improve the machine learning models. Further research will also consider the combined impact of the treatment rule on treatment failure (effectiveness outcome) and adverse outcomes (weight gain, hypertension, hypercholesterolemia and diabetes), and the application of the treatment rule in different populations. Future research should also consider cost-effectiveness of the treatment rule when used in routine clinical practice. In conclusion, the results of this study suggest that use of a personalised treatment selection tool in SMI to assign first-line medications could help to reduce the risk of treatment failure in severe mental illness. Our treatment rule was developed using classical, clearly defined, easily characterised and interpreted statistical models, using a range of predictors available in UK national health data. Although developed using primary care data, the models should be applicable in other health services such as secondary care psychiatric services, where antipsychotics tend to be first prescribed. This means the tool could feasibly be implemented in UK practice. Further work is necessary to prospectively validate the models. As we found little improvement in performance using machine learning, integration of our simple statistical models into clinical workflows would be relatively straightforward. Low risk prediction decisions, such as selection of treatment from a number of approved options, could improve outcomes for people with SMI. Funding This research is funded by UKRI grant MR/V023373/1, the University College London Hospitals NIHR Biomedical Research Centre and the NIHR North Thames Applied Research Collaboration (JFH). NL is supported by a HDR UK personal fellowship (Big Data for Complex Disease driver programme: HDR-23012). This work is affiliated to HDR UK which is funded by the Medical Research Council (UKRI), the National Institute for Health Research, the British Heart Foundation, Cancer Research UK, the Economic and Social Research Council (UKRI), the Engineering and Physical Sciences Research Council (UKRI), Health and Care Research Wales, Chief Scientist Office of the Scottish Government Health and Social Care Directorates, and Health and Social Care Research and Development Division (Public Health Agency, Northern Ireland). NL is additionally supported by the UK Research and Innovation grant MR/W014386/1 and MR/V023373/1 and by the NIHR University College London Hospitals Biomedical Research Centre, and NIHR North Thames Applied Research Collaboration. ARB is funded by the Wellcome Trust through a PhD Fellowship in Mental Health Science (218497/Z/19/Z). This research was funded in whole or in part by the Wellcome Trust. For the purpose of Open Access, the author has applied a CC BY public copyright licence to any Author Accepted Manuscript (AAM) version arising from this submission. Data Availability Study data were accessed via Clinical Practice Research Datalink (CPRD). Authors cannot share the data directly. However data can be accessed directly from CPRD following approval and licensing. Reference List 1. ↵ He , H. , et al. , Trends in the incidence and DALYs of schizophrenia at the global, regional and national levels: results from the Global Burden of Disease Study 2017 . Epidemiol Psychiatr Sci , 2020 . 29 : p. e91 . OpenUrl PubMed 2. ↵ Hayes , J.F. , et al. , Mortality gap for people with bipolar disorder and schizophrenia: UK-based cohort study 2000-2014 . Br J Psychiatry , 2017 . 211 ( 3 ): p. 175 – 181 . OpenUrl Abstract / FREE Full Text 3. ↵ Fernandes , B.S. , et al. , The new field of’precision psychiatry’ . BMC Med , 2017 . 15 ( 1 ): p. 80 . OpenUrl PubMed 4. ↵ Del Fabro , L. , et al. , Machine learning methods to predict outcomes of pharmacological treatment in psychosis . Transl Psychiatry , 2023 . 13 ( 1 ): p. 75 . OpenUrl PubMed 5. ↵ Hernandez , M. , et al. , Clinical Utility and Implementation of Pharmacogenomics for the Personalisation of Antipsychotic Treatments . Pharmaceutics , 2024 . 16 ( 2 ). 6. ↵ Voineskos , A.N. , et al. , Functional magnetic resonance imaging in schizophrenia: current evidence, methodological advances, limitations and future directionWs.orld Psychiatry , 2024 . 23 ( 1 ): p. 26 – 51 . OpenUrl 7. ↵ Lee , H.S. and J.S. Kim , Implication of Electrophysiological Biomarkers in Psychosis: Focusing on Diagnosis and Treatment Response J . Pers Med , 2022 . 12 ( 1 ). 8. ↵ Gidlow , C.J. , et al. , Cardiovascular disease risk communication in NHS Health Checks using QRISK®2 and JBS3 risk calculators: the RICO qualitative and quantitative study . Health Technol Assess , 2021 . 25 ( 50 ): p. 1 – 124 . OpenUrl CrossRef PubMed 9. ↵ Belsher , B.E. , et al. , Prediction Models for Suicide Attempts and Deaths: A Systematic Review and Simulation . JAMA Psychiatry , 2019 . 76 ( 6 ): p. 642 – 651 . OpenUrl PubMed 10. ↵ Vollmer , S. , et al. , Machine learning and artificial intelligence research for patient benefit: 20 critical questions on transparency, replicability, ethics, and effectiveness . BMJ , 2020 . 368 : p. l6927 . OpenUrl FREE Full Text 11. ↵ Chekroud , A.M. , et al. , The promise of machine learning in predicting treatment outcomes in psychiatry . World Psychiatry , 2021 . 20 ( 2 ): p. 154 – 170 . OpenUrl CrossRef PubMed 12. ↵ Hentati Isacsson , N. , et al. , Making the most out of timeseries symptom data: A machine learning study on symptom predictions of internet-based CBT . Internet Interventions , 2024 . 38 : p. 100773 . OpenUrl PubMed 13. ↵ Hentati Isacsson , N. , et al. , Methodological choices and clinical usefulness for machine learning predictions of outcome in Internet-based cognitive behavioural therapy . Communications Medicine , 2024 . 4 ( 1 ): p. 196 . OpenUrl PubMed 14. ↵ Meehan , A.J. , et al. , Clinical prediction models in psychiatry: a systematic review of two decades of progress and challenges . Mol Psychiatry , 2022 . 27 ( 6 ): p. 2700 – 2708 . OpenUrl PubMed 15. ↵ Hayes , J.F. , et al. , Predicting maintenance lithium response for bipolar disorder from electronic health records-a retrospective study . PeerJ , 2024 . 12 : p. e17841 . OpenUrl PubMed 16. ↵ Kim , T.T. , et al. , Predictive modeling for response to lithium and quetiapine in bipolar disorder . Bipolar Disord , 2019 . 21 ( 5 ): p. 428 – 436 . OpenUrl 17. Nunes , A. , et al. , Prediction of lithium response using clinical data . Acta Psychiatr Scand , 2020 . 141 ( 2 ): p. 131 – 141 . OpenUrl PubMed 18. Koutsouleris , N. , et al. , Multisite prediction of 4-week and 52-week treatment outcomes in patients with first-episode psychosis: a machine learning approach . Lancet Psychiatry , 2016 . 3 ( 10 ): p. 935 – 946 . OpenUrl PubMed 19. ↵ Leighton , S.P. , et al. , Development and validation of multivariable prediction models of remission, recovery, and quality of life outcomes in people with first episode psychosis: a machine learning approach . Lancet Digit Health , 2019 . 1 ( 6 ): p. e261 – e270 . OpenUrl CrossRef 20. ↵ Jeon , S.M. , et al. , Comparison of prediction methods for treatment continuation of antipsychotics in children and adolescents with schizophrenia . Evid Based Ment Health , 2022 . 21. ↵ Wu , C.S. , et al. , Development and Validation of a Machine Learning Individualized Treatment Rule in First-Episode Schizophrenia . JAMA Netw Open , 2020 . 3 ( 2 ): p. e1921660 . OpenUrl 22. ↵ Richards-Belle , A. , et al. , Prescribing of antipsychotics for people diagnosed with severe mental illness in UK primary care 2000–2019: 20-year investigation of who receives treatment, with which agents and at what doses The British Journal of Psychiatry , 2024 : p. 1-9. 23. ↵ Wolf , A. , et al. , Data resource profile: Clinical Practice Research Datalink (CPRD) Aurum . Int J Epidemiol , 2019 . 48 ( 6 ): p. 1740 – 1740g . OpenUrl CrossRef PubMed 24. ↵ Hardoon , S. , et al. , Recording of Severe Mental Illness in United Kingdom Primary Care , 2000-2010 . Plos One , 2013 . 8 ( 12 ). 25. ↵ Geddes , J. , et al. , Lithium plus valproate combination therapy versus monotherapy for relapse prevention in bipolar I disorder (BALANCE): a randomised open-label trial . Lancet , 2010 . 375 ( 9712 ): p. 385-395. 26. ↵ Kane , J. , et al. , Effect of Long-Acting Injectable Antipsychotics vs Usual Care on Time to First Hospitalization in Early-Phase Schizophrenia: A Randomized Clinical Trial . Jama Psychiatry , 2020 . 77 ( 12 ): p. 1217 – 1224 . OpenUrl PubMed 27. ↵ Hasan , A ., The correlation between the quality of life and clinical variables among outpatients with schizophrenia . Psychiatry Research , 2019 . 271 : p. 39 – 45 . OpenUrl PubMed 28. ↵ Khera , R. , et al. , Use of Machine Learning Models to Predict Death After Acute Myocardial Infarction . Jama Cardiology , 2021 . 6 ( 6 ): p. 633 – 641 . OpenUrl PubMed 29. ↵ Ye , Y. , et al. , Comparison of Machine Learning Methods and Conventional Logistic Regressions for Predicting Gestational Diabetes Using Routine Clinical Data: A Retrospective Cohort Study . Journal of Diabetes Research , 2020 . 2020 . View the discussion thread. Back to top Previous Next Posted March 24, 2025. Download PDF Supplementary Material Data/Code Email Thank you for your interest in spreading the word about medRxiv. NOTE: Your email address is requested solely to identify you as the sender of this article. Your Email * Your Name * Send To * Enter multiple addresses on separate lines or separate them with commas. You are going to email the following Development and validation of a personalised antipsychotic selection tool for first-line treatment in severe mental illness Message Subject (Your Name) has forwarded a page to you from medRxiv Message Body (Your Name) thought you would like to see this page from the medRxiv website. Your Personal Message CAPTCHA This question is for testing whether or not you are a human visitor and to prevent automated spam submissions. Share Development and validation of a personalised antipsychotic selection tool for first-line treatment in severe mental illness S Hardoon , DPJ Osborn , M Boman , F Ben Abdesslem , A Richards-Belle , N Launders , K Man , ICK Wong , C Dalman , G Ambler , I Petersen , JF Hayes medRxiv 2025.03.24.25324323; doi: https://doi.org/10.1101/2025.03.24.25324323 Share This Article: Copy Citation Tools Development and validation of a personalised antipsychotic selection tool for first-line treatment in severe mental illness S Hardoon , DPJ Osborn , M Boman , F Ben Abdesslem , A Richards-Belle , N Launders , K Man , ICK Wong , C Dalman , G Ambler , I Petersen , JF Hayes medRxiv 2025.03.24.25324323; doi: https://doi.org/10.1101/2025.03.24.25324323 Citation Manager Formats BibTeX Bookends EasyBib EndNote (tagged) EndNote 8 (xml) Medlars Mendeley Papers RefWorks Tagged Ref Manager RIS Zotero Tweet Widget Facebook Like Google Plus One Subject Area Psychiatry and Clinical Psychology Subject Areas All Articles Addiction Medicine (568) Allergy and Immunology (863) Anesthesia (299) Cardiovascular Medicine (4423) Dentistry and Oral Medicine (443) Dermatology (382) Emergency Medicine (607) Endocrinology (including Diabetes Mellitus and Metabolic Disease) (1507) Epidemiology (15219) Forensic Medicine (30) Gastroenterology (1123) Genetic and Genomic Medicine (6587) Geriatric Medicine (667) Health Economics (997) Health Informatics (4524) Health Policy (1368) Health Systems and Quality Improvement (1612) Hematology (540) HIV/AIDS (1264) Infectious Diseases (except HIV/AIDS) (15910) Intensive Care and Critical Care Medicine (1103) Medical Education (623) Medical Ethics (145) Nephrology (667) Neurology (6588) Nursing (345) Nutrition (998) Obstetrics and Gynecology (1143) Occupational and Environmental Health (956) Oncology (3331) Ophthalmology (970) Orthopedics (369) Otolaryngology (420) Pain Medicine (435) Palliative Medicine (129) Pathology (663) Pediatrics (1690) Pharmacology and Therapeutics (691) Primary Care Research (710) Psychiatry and Clinical Psychology (5438) Public and Global Health (9218) Radiology and Imaging (2195) Rehabilitation Medicine and Physical Therapy (1369) Respiratory Medicine (1195) Rheumatology (593) Sexual and Reproductive Health (709) Sports Medicine (529) Surgery (709) Toxicology (99) Transplantation (289) Urology (265) (function(){function c(){var b=a.contentDocument||a.contentWindow.document;if(b){var d=b.createElement('script');d.innerHTML="window.__CF$cv$params={r:'9ff81ec329904807',t:'MTc3OTQxNDEwMw=='};var a=document.createElement('script');a.src='/cdn-cgi/challenge-platform/scripts/jsd/main.js';document.getElementsByTagName('head')[0].appendChild(a);";b.getElementsByTagName('head')[0].appendChild(d)}}if(document.body){var a=document.createElement('iframe');a.height=1;a.width=1;a.style.position='absolute';a.style.top=0;a.style.left=0;a.style.border='none';a.style.visibility='hidden';document.body.appendChild(a);if('loading'!==document.readyState)c();else if(window.addEventListener)document.addEventListener('DOMContentLoaded',c);else{var e=document.onreadystatechange||function(){};document.onreadystatechange=function(b){e(b);'loading'!==document.readyState&&(document.onreadystatechange=e,c())}}}})();

Text is read by the "Ask this paper" AI Q&A widget below. Extraction quality varies by source — PMC NXML preserves structure cleanly, OA-HTML may include some navigation residue, and OA-PDF can have broken hyphenation. The publisher copy (via DOI) is the canonical version.

My notes (saved in your browser only)

⚙ Ask this paper AI returns verbatim quotes from the full text · source: preprint-html ⓘ

Answers must be backed by verbatim quotes from this paper's full text. Hallucinated quotes are dropped automatically; if no verbatim passage answers the question, we say so. How this works

Citation neighborhood (no data yet)

We don't have any in-corpus citations linked to this paper yet. This is a recent paper (2025) — citers typically take a year or two to land, and the OpenAlex reference graph may still be filling in.

Source provenance

europepmc: last seen: 2026-05-20T01:45:00.602351+00:00
unpaywall: last seen: 2026-05-21T05:10:58.409756+00:00

License: CC-BY-4.0