Full text
50,693 characters
· extracted from
preprint-html
· click to expand
Health and socioeconomic characteristics underlying educational attainment of children born preterm in England: a population cohort study using linked data | medRxiv /* */ /* */ <!-- <!-- /*! * yepnope1.5.4 * (c) WTFPL, GPLv2 */ (function(a,b,c){function d(a){return"[object Function]"==o.call(a)}function e(a){return"string"==typeof a}function f(){}function g(a){return!a||"loaded"==a||"complete"==a||"uninitialized"==a}function h(){var a=p.shift();q=1,a?a.t?m(function(){("c"==a.t?B.injectCss:B.injectJs)(a.s,0,a.a,a.x,a.e,1)},0):(a(),h()):q=0}function i(a,c,d,e,f,i,j){function k(b){if(!o&&g(l.readyState)&&(u.r=o=1,!q&&h(),l.onload=l.onreadystatechange=null,b)){"img"!=a&&m(function(){t.removeChild(l)},50);for(var d in y[c])y[c].hasOwnProperty(d)&&y[c][d].onload()}}var j=j||B.errorTimeout,l=b.createElement(a),o=0,r=0,u={t:d,s:c,e:f,a:i,x:j};1===y[c]&&(r=1,y[c]=[]),"object"==a?l.data=c:(l.src=c,l.type=a),l.width=l.height="0",l.onerror=l.onload=l.onreadystatechange=function(){k.call(this,r)},p.splice(e,0,u),"img"!=a&&(r||2===y[c]?(t.insertBefore(l,s?null:n),m(k,j)):y[c].push(l))}function j(a,b,c,d,f){return q=0,b=b||"j",e(a)?i("c"==b?v:u,a,b,this.i++,c,d,f):(p.splice(this.i++,0,a),1==p.length&&h()),this}function k(){var a=B;return a.loader={load:j,i:0},a}var l=b.documentElement,m=a.setTimeout,n=b.getElementsByTagName("script")[0],o={}.toString,p=[],q=0,r="MozAppearance"in l.style,s=r&&!!b.createRange().compareNode,t=s?l:n.parentNode,l=a.opera&&"[object Opera]"==o.call(a.opera),l=!!b.attachEvent&&!l,u=r?"object":l?"script":"img",v=l?"script":u,w=Array.isArray||function(a){return"[object Array]"==o.call(a)},x=[],y={},z={timeout:function(a,b){return b.length&&(a.timeout=b[0]),a}},A,B;B=function(a){function b(a){var a=a.split("!"),b=x.length,c=a.pop(),d=a.length,c={url:c,origUrl:c,prefixes:a},e,f,g;for(f=0;f<d;f++)g=a[f].split("="),(e=z[g.shift()])&&(c=e(c,g));for(f=0;f<b;f++)c=x[f](c);return c}function g(a,e,f,g,h){var i=b(a),j=i.autoCallback;i.url.split(".").pop().split("?").shift(),i.bypass||(e&&(e=d(e)?e:e[a]||e[g]||e[a.split("/").pop().split("?")[0]]),i.instead?i.instead(a,e,f,g,h):(y[i.url]?i.noexec=!0:y[i.url]=1,f.load(i.url,i.forceCSS||!i.forceJS&&"css"==i.url.split(".").pop().split("?").shift()?"c":c,i.noexec,i.attrs,i.timeout),(d(e)||d(j))&&f.load(function(){k(),e&&e(i.origUrl,h,g),j&&j(i.origUrl,h,g),y[i.url]=2})))}function h(a,b){function c(a,c){if(a){if(e(a))c||(j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}),g(a,j,b,0,h);else if(Object(a)===a)for(n in m=function(){var b=0,c;for(c in a)a.hasOwnProperty(c)&&b++;return b}(),a)a.hasOwnProperty(n)&&(!c&&!--m&&(d(j)?j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}:j[n]=function(a){return function(){var b=[].slice.call(arguments);a&&a.apply(this,b),l()}}(k[n])),g(a[n],j,b,n,h))}else!c&&l()}var h=!!a.test,i=a.load||a.both,j=a.callback||f,k=j,l=a.complete||f,m,n;c(h?a.yep:a.nope,!!i),i&&c(i)}var i,j,l=this.yepnope.loader;if(e(a))g(a,0,l,0);else if(w(a))for(i=0;i (function(w,d,s,l,i){w[l]=w[l]||[];w[l].push({'gtm.start':new Date().getTime(),event:'gtm.js'});var f=d.getElementsByTagName(s)[0];var j=d.createElement(s);var dl=l!='dataLayer'?'&l='+l:'';j.src='//www.googletagmanager.com/gtm.js?id='+i+dl;j.type='text/javascript';j.async=true;f.parentNode.insertBefore(j,f);})(window,document,'script','dataLayer','GTM-P4HH5NV'); Skip to main content Home About Submit ALERTS / RSS Search for this keyword Advanced Search Health and socioeconomic characteristics underlying educational attainment of children born preterm in England: a population cohort study using linked data View ORCID Profile Sadia Haider , View ORCID Profile Athanasios Tsanas , View ORCID Profile G. David Batty , View ORCID Profile Rebecca M Reynolds , Melvyn Roffe , View ORCID Profile Heather C Whalley , View ORCID Profile Riccardo E Marioni , View ORCID Profile Hilary Richardson , View ORCID Profile Cheryl Battersby , View ORCID Profile James P Boardman doi: https://doi.org/10.1101/2025.11.13.25340148 Sadia Haider 1 Section of Neonatal Medicine, School of Public Health, Faculty of Medicine, Imperial College London , London, UK PhD Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Sadia Haider Athanasios Tsanas 2 Usher Institute, Edinburgh Medical School, University of Edinburgh , Edinburgh, UK 3 School of Mathematics, University of Edinburgh , UK DPhil(Oxon) Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Athanasios Tsanas G. David Batty 4 Department of Epidemiology and Public Health, University College London , London, UK FRSE Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for G. David Batty Rebecca M Reynolds 5 Centre for Reproductive Health, Institute for Regeneration and Repair, University of Edinburgh , Edinburgh, UK 6 Centre for Cardiovascular Science, University of Edinburgh , Edinburgh, UK FMedSci Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Rebecca M Reynolds Melvyn Roffe 7 Haberdashers’ Monmouth School , Monmouth, UK FRSA Find this author on Google Scholar Find this author on PubMed Search for this author on this site Heather C Whalley 8 Centre for Clinical Brain Sciences, University of Edinburgh , Edinburgh, UK PhD Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Heather C Whalley Riccardo E Marioni 10 Centre for Genomic and Experimental Medicine, Institute of Genetics and Cancer, University of Edinburgh , Edinburgh, UK PhD Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Riccardo E Marioni Hilary Richardson 11 School of Philosophy, Psychology, and Language Sciences, University of Edinburgh , Edinburgh, UK PhD Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Hilary Richardson Cheryl Battersby 1 Section of Neonatal Medicine, School of Public Health, Faculty of Medicine, Imperial College London , London, UK PhD Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Cheryl Battersby James P Boardman 5 Centre for Reproductive Health, Institute for Regeneration and Repair, University of Edinburgh , Edinburgh, UK 8 Centre for Clinical Brain Sciences, University of Edinburgh , Edinburgh, UK FMedSci Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for James P Boardman For correspondence: james.boardman{at}ed.ac.uk Abstract Full Text Info/History Metrics Supplementary material Data/Code Preview PDF Abstract Background Preterm birth (PTB) is a leading cause of atypical brain development and cognitive impairment, however, there are sparse data on its impact on statutory educational assessments. We aimed to describe school readiness at 5 years and educational attainment at 6–7 years of children born preterm in England and identify the early life factors that associate with attainment. Methods We created a novel record linkage between the National Neonatal Research Database and the National Pupil Database for all babies born <32 weeks’ gestation in England (2008–2012) who survived to neonatal discharge. We used logistic regression to investigate associations between clinical and demographic variables and performance in six statutory school-age assessments. Findings Data from 15,857 children were analysed (53.3% boys). Fifty-seven percent did not meet the school readiness level at age 5, 51% did not meet expected attainment at ages six to seven in writing, maths (48%), reading (42%), and science (36%). Children born at 23–24 weeks had two to three times higher odds of not meeting expected levels compared to those born at 31 weeks (age 5: adjusted odds ratio 2.86, 95% CI 2.19-3.73). Children born in the most deprived areas at birth had 1 7 to 2-fold the risk of under-attainment compared to those in the least deprived. In adjusted models, male sex and season of birth conferred increased risk, alongside several potentially mutable risks: smoking during pregnancy, exposure to ante-or postnatal corticosteroids, severe acquired neonatal brain injuries, co-morbidities of PTB, nutrition during neonatal care, and childhood deprivation. Interpretation PTB poses a substantial risk for educational under-attainment at ages 5 through 7 years, particularly when combined with socioeconomic deprivation. Addressing neighbourhood-and family-level social inequalities should be given similar priority as reducing medical complications of PTB for improving the educational attainment of children born preterm. Funding UKRI Medical Research Council Evidence before this study We searched PubMed from October 1 st , 2015, to October 1 st , 2025, with no language restrictions for publications using the terms ((“preterm” OR “premature” OR “gestational age”) AND “socioeconomic” AND (“school” OR “education”)) in the title/abstract. Our search identified 20 relevant peer-reviewed studies, including one narrative systematic review that examined how socioeconomic inequalities and preterm birth interact to modify health and education outcomes. Three studies were conducted in the UK and used linked data to investigate educational outcomes for preterm-born children. The remainder were conducted in Scandinavian countries, Canada, Australia, and the Netherlands. Collectively, these studies have consistently shown that children born preterm have lower educational attainment compared with those born at term: a well-established dose-response relationship exists between gestational age and educational outcomes, with lower gestational age associated with progressively poorer attainment across all stages of education. However, most existing linkage studies did not capture the clinical heterogeneity of the preterm-born population underlying this gradient, as these data are rarely available in population-level datasets linked to education records. Whilst some studies included measures of socioeconomic status as a covariate, their independent effects have seldom been investigated, particularly relative to neonatal risk factors. Added value of this study The present study addresses these gaps through a novel linkage of population-level neonatal clinical data with national statutory educational assessments. We describe the high prevalence of low attainment among very preterm children (<32 weeks’ gestation) at ages 5 through 7 years in England. The linkage enables a granular characterisation of how maternal and neonatal conditions, exposures and treatments, and neighbourhood-and family-level measures of social disadvantage explain educational performance of children born <32 weeks’ gestation. The findings show a dose effect of low GA on low attainment and that the adverse effects of socioeconomic deprivation at birth persist through early school age. The effect of family-level deprivation at the start of school age is comparable in magnitude to that of severe neonatal brain injury, however, impacts a greater proportion of the population. As such, this study provides a more holistic understanding of the pathways underlying educational risk in this population. Implications of all the available evidence Improving the educational attainment of very preterm children is likely to require a reduction in social inequalities in pregnancy and early childhood, alongside care practices and research to minimise comorbidities of preterm birth. Furthermore, the identification of modifiable exposures, including maternal non-smoking, antenatal or postnatal corticosteroid exposure, breastfeeding, and deferred school entry or targeted additional support for very preterm children born in the summer months, offers practical targets for parents, clinicians, teachers and school leaders and educators, that could facilitate long-term educational attainment for children born preterm. Introduction Globally, preterm birth (PTB) affects 13 4 million pregnancies per annum 1 . Over the past two decades, the survival rate of children born preterm has improved, but 10-15% of children born very preterm (<32 weeks) develop cerebral palsy, and 30-50% develop an intellectual or behavioural disability. 2 Furthermore, preterm birth is more common among socioeconomically disadvantaged groups, reflecting social gradients in maternal health, environmental exposures, and access to antenatal care. 3 Consequently, preterm children face a double burden of biological immaturity and social disadvantage, with the latter influencing developmental outcomes through limited access to resources, greater exposure to stress, and reduced opportunities for cognitive stimulation. There is a paucity of data on the relationship between preterm birth and statutory educational assessments, and on the relative importance of socioeconomic disadvantage in shaping this relationship, particularly around the transition to school when cognitive demands substantially increase. Statutory assessments often determine the level of support provided to children. At the individual level, some very preterm children are free of neurodevelopmental and cognitive impairments, indicating that it is not low gestational age (GA) alone that confers risk. We hypothesise that risks which commonly co-occur with PTB influence the susceptibility to injury and dysmaturation and may explain differences in attainment at school age. These preterm birth-associated risk factors (PTB-RFs) are biological, psychosocial, and social/infrastructural. They can affect parent or child, or be shared, for instance: alterations in the perinatal stress environment, 4 , 5 systemic inflammation, 6 , 7 suboptimal neonatal nutrition, 8 complications of PTB, such as bronchopulmonary dysplasia and necrotising enterocolitis, 9 and social inequalities. 3 , 10 , 11 Understanding the relative contributions of PTB-RFs to important educational outcomes is necessary to inform clinical interventions and social policies designed to facilitate the educational attainment of children born preterm. The National Neonatal Research Database (NNRD) contains data on all neonatal admissions across the United Kingdom (UK) from 2007 to the present. 12 The National Pupil Database (NPD) is an administrative dataset of educational outcomes collected and maintained by the Department for Education (DfE) in England. 13 We created a novel record linkage between the NNRD and the NPD 14 to quantify the proportion of preterm children who do not meet expected levels in statutory educational assessments and test the hypothesis that specific PTB-RFs modify the relationship between low GA and outcomes for school readiness and educational attainment at 5 to 7 years among children growing up in England. Methods Data source The study links data from the National Neonatal Research Database (NNRD) 10 and National Pupil Database (NPD) 11 , 14 . See Supplement for details of the datasets. Study population This retrospective cohort comprised children born and cared for in a neonatal unit (NNU) in England between 1st September 2008 and 31st August 2012, with a recorded GA below 32 completed weeks, who survived to discharge, and had a linked neonatal and education record. The study epoch was chosen to include children old enough to be eligible for assessments at 5 to 7 years. Infants with congenital malformations or missing data for GA, sex, or place of birth were excluded. Ethics approval Research ethical and regulatory approval as part of the neoWONDER study (reference 21/EM/0130) 14 including Confidentiality Advisory Group approval to use identifiers for linkage purposes without consent (CAG reference 21/CAG/0081, Section 251 of the NHS Act 2006). No NNU opt-out requests were received. Definitions of variables Outcomes All outcomes are binary measures of whether a child met the expected education level at three time points (at 5 years, 6 years, 7 years), ascertained from statutory assessments in England. Age 5 Reception: Early Years Foundation Stage Profile (EYFSP) At the end of the final year of reception (akin to pre-school), teachers assess development across seven domains: communication and language (CL), physical development (PHY), personal, social, and emotional development (PSE), literacy (LIT), mathematics (MAT), understanding the world (UTW), and expressive arts and design (EXP). A ‘good level of development’ (GLD) was defined as achieving at least the expected level in CL, PHY, PSE, LIT, and MAT. 15 We used EYFSP as a measure of school readiness because these domains reflect the skills and behaviours that promote successful engagement in the early years of formal schooling. 16 Age 6, Key Stage 1 (KS1) phonics screening check During year 1 of formal schooling, teachers assess phonics using a 40-word test to assess reading ability. Pupils scoring > 32/40 meet the expected level. 17 Age 7, End of KS1 assessments Binary variables are derived to denote whether children meet the expected level in national tests of reading, writing, mathematics, and science. For KS1 assessments, the outcome was expressed as ‘not meeting the expected level’ at each time point because it indicates children who were likely to require additional support. 18 , 19 Exposures For descriptive analyses, we reported outcomes stratified by GA groups: 23-26 and 27-31 completed weeks. 20 The Index of Multiple Deprivation (IMD) was derived from the maternal postcode recorded in the NNRD at birth. 21 Maternal postcodes were linked to UK Office for National Statistics Lower Super Output Areas to assign IMD scores, which were grouped into national deciles (1 = most deprived, 10 = least deprived). Covariates PTB-RFs included maternal smoking, age, gestational diabetes, and hypertensive disorders, and the following neonatal characteristics: sex, birth month, birthweight, multiplicity, mode of delivery, co-morbidities of preterm birth (retinopathy of prematurity [ROP], necrotising enterocolitis [NEC], sepsis, bronchopulmonary dysplasia [BPD)], brain injuries (cystic periventricular leukomalacia [cPVL], all-grade intraventricular haemorrhage [IVH], hydrocephalus, and porencephalic cyst), exposure to ante-and post-natal corticosteroids, and nutrition at discharge (see Table S1 for definitions). Socioeconomic and demographic variables from the NPD included child ethnicity and major language group. The Income Deprivation Affecting Children Index (IDACI) was recorded at age 5 years. The IDACI ranks neighbourhoods according to the proportion of children under 16 living in low-income households, expressed as deciles. 21 Eligibility for free school meals (FSM) at age 5 years was included as a family-level proxy for household income. Statistical analysis Descriptive analyses We report participant characteristics for the study cohort with and without a linked education record ( Table 1 ). Frequencies (%) and median (IQR) are presented for categorical and continuous variables, respectively. For each outcome, we plotted the prevalence (95% CI) of not meeting the expected level of attainment across IMD, IDACI, and FSM stratified by 23-26 weeks’ and 27-31 weeks’ gestation. We used the Cochran–Armitage test to evaluate trends. We report outcomes for the study cohort alongside DfE national data for the same epoch. 15 , 17 We plotted the ten most common longitudinal individual-attainment trajectories. View this table: View inline View popup Table 1: Characteristics of children with and without a linked NNRD-NPD record Frequencies (%) and median (IQR) are presented for categorical and continuous variables, respectively. *Frequencies for cystic periventricular leukomalacia and hydrocephalus have been suppressed to minimise risk of secondary disclosure when cell counts describe <10 individuals. Regression analysis Overall, 0 8% of all covariate values were missing in the data. Missingness was addressed through multiple imputation using chained equations (see Supplement methods and Table S2). We fitted cross-sectional logistic regression models using generalised estimating equations (GEE) to develop functional statistical relationships between covariates and each outcome. An exchangeable correlation structure was specified to account for within-mother correlation among multiple births, assuming equal correlation between siblings. 22 Model estimation employed a binomial distribution with a logit link and robust standard errors. We assessed multicollinearity using the variance inflation factor (VIF), ensuring that values did not exceed 5. Children with complete data on all outcomes and maternal ID to identify within-family clustering were included in the GEE models. IMD quintiles were used in three models to highlight broader gradients of deprivation in line with previous studies: 1) crude associations of each covariate with each outcome; 2) a model to test the interaction between GA and IMD, which was assessed by testing statistical significance (at p=0.05 level) of the interaction term and by plotting predicted probabilities of outcomes at mean values of covariates values stratified by GA across levels of IMD; and 3) fully adjusted models including all covariates described above. To avoid collinearity between ethnicity, language, and socioeconomic variables (Figure S1), our primary regression analyses retained IMD, FSM eligibility, and language, while omitting IDACI and ethnicity. In a sensitivity analysis, we substituted ethnicity for language to evaluate its impact on outcomes. We report results as odds ratios (OR) with 95% confidence intervals (CI). A CI that did not cross 1 was considered statistically significant at 5%. We evaluated out of sample predictive performance of the fully adjusted models (see Supplemental methods, ‘Predictive performance of the fully adjusted models‘). Analyses were conducted using Stata, version 18 0 and R. Role of the funding source The funder of the study had no role in study design, data collection, data analysis, data interpretation, or writing of the report. Results Study population Of 23,862 infants in the NNRD, 17,245 were identified by NHS Digital for linkage and 6,617 were not identified due to missing or incomplete NHS numbers. There were no major differences between groups with and without sufficient linkage identifiers (Table S3). Of those identified, 15,857 (92%) had an education record in the NPD ( Figure 1 ). Among these, 16 3% were born 23 to 26 weeks and 83 7% born 27 to 31 weeks; 53 3% were male, 26.9% were multiple-born, and 76 9% were born to White mothers ( Table 1 ). There were no differences in the distribution of GA, sex, or neonatal morbidities between linked and non-linked groups; however, the linked group were more likely to be of White ethnicity (76 9% vs 67 9%) and from the most deprived IMD decile (18 5% versus 10 9%). Download figure Open in new tab Figure 1: Participant flow of cohort included in the study born between 2008 /09 to 2011 /12 in England Trends in educational attainment of children born at <32 weeks at 5, 6, and 7 years old, and comparison to the whole population Table S4 shows the annual proportion of the cohort born in 2008/2009 to 2011/2012 who did not meet the expected level in each outcome, and Figure 2 summarises the data alongside national population results for the same epoch. For preterm born children at 5-6 years, a higher proportion did not meet the expected level compared to the national average (EYFSP 56 6% vs 35 5%; phonics 20 7% vs 8 8%); at 7 years, around half did not meet expected levels in writing (51 8%), maths (48 1%), and approximately 40% in reading and science. Compared with the national average, 15 , 17 the percentage point differences were 21% (EYFSP), 12% (phonics), 17% (KS1 reading), 20% (KS1 writing), 23% (KS1 maths), and 18% (KS1 science), Figure 2 . Children born <32 weeks constituted 1-2% of the national comparator data. 23 Download figure Open in new tab Figure 2: Distribution of children who did not meet expected levels for each outcome in the cohort and the whole national population Comparison between educational outcome measures in the cohort and published national statistics for all children who were at school and undertook the assessments during the same time-period. We derived the % who did not meet the expected level from annual figures published in reports by the Department for Education. 15 , 17 The bars represent the mean and SD over four birth years (2008/09 to 2011/12). Figures show the percentage point difference between preterm cohort and national attainment. Associations between gestational age and educational attainment There was a dose-response relationship between GA and educational attainment: each decreasing week of gestation from 31 weeks was associated with an increased proportion of children not achieving expected levels across all outcomes ( Figure 3 , Table S5). For EYFSP and KS1 reading, maths, science, and writing domains, approximately 70–90% born at 23 weeks did not reach expected standards, compared with around 30–50% at 31 weeks. Download figure Open in new tab Figure 3: Distribution of children who did not meet the expected level across outcomes stratified by gestational age (GA) Proportion in the overall cohort that did not meet expected level: EYFSP 8,602/15,528 (55.9%); Phonics 3,226/15,504 (20.8%); KS1 Reading 6,354/15,141 (42%); KS1 Writing 7,789/15,141 (51.4%); KS1 Maths 7,216/15,140 (47.7%); KS1 Science 5,449/15,141 (36%) Associations between socioeconomic status and educational attainment The proportion of children who did not meet expected levels declined progressively with higher SES at birth ( Figure 4 ). The gradients across IMD levels were parallel, indicating similar effects of deprivation across GA groups. Among children born in the least deprived IMD decile, 52% born at 23-27 weeks and 42% born at 28-31 weeks did not achieve the expected level at EYFSP. For the most deprived decile, the corresponding percentages were higher at 75% and 60%, respectively. These trends were consistent for FSM and IDACI at 5 years (Figures S2 and S3). Download figure Open in new tab Figure 4: Proportion of children who did not meet the expected level in outcomes by socio-economic status at birth (Index of Multiple Deprivation) stratified by gestational age category (23-26 weeks and 27-31 weeks) and the overall cohort Trend tested using Cochran–Armitage test. P<0.001 for every line. IMD 1= most deprived. Longitudinal individual-attainment trajectories Figure 5 shows the relative frequencies of the top ten most frequently occurring within-individual attainment sequence across all outcomes stratified by degree of prematurity. Among children born at 23-26 weeks, persistent under-performance in all outcomes was the most frequent attainment pattern (29 5%), and children were 1 7 times more likely to not meet expected levels in at least five outcomes compared with children born at 27-32 weeks (43 7% versus 26%). The most frequently occurring sequence in the 27-31 week group was meeting the expected level in all outcomes (35 9%), almost twice more than the 23-26 week group (21 6%). Download figure Open in new tab Figure 5: Sequence frequency plot to show the ten most frequently occurring longitudinal outcome patterns between age 5 and 7 years, stratified by gestational age category (23-26 weeks and 27-31 weeks) The y-axis represents the cumulative percentage of longitudinal sequences, and the bar widths are proportional to their frequencies. Rows are ordered by frequency of the pattern. Factors associated with educational attainment over time in mutually adjusted models Impact of gestational age and other infant characteristics Table 2 and Figure 6 present the ORs and 95% CIs from the unadjusted and fully adjusted GEE regression models for EYFSP, phonics, and KS1 reading and maths. There were strong correlations across domains for KS1 7-year outcomes ( r >0 8); the results for KS1 writing and science are presented in Supplementary Table S6 and Figure S4. Download figure Open in new tab Figure 6: Forest plot to show the unadjusted and fully adjusted associations between socio-economic and preterm birth factors with educational outcomes (not meeting the expected level in EYFSP, Phonics, KS1 reading, or maths) Odds ratios and 95% confidence intervals derived from GEE regression models. View this table: View inline View popup Table 2: Unadjusted and adjusted GEE regression models for the association between socio-economic and preterm-birth factors with educational outcomes for children born 2008/09 to 2011/12 in England Results are expressed as odds ratios with 95% confidence intervals. The adjusted model includes all covariates listed for unadjusted models (N=14,129). 14,129 children with complete data on all outcomes and maternal ID to identify clustered sibling data were included in the models. The dose-response relationship between GA and attainment persisted after adjustment, particularly for the most preterm infants, although effect sizes were attenuated. After adjustment, children born at 23–24 weeks were two to three times more likely to not achieve the expected level compared to those born at 31 weeks (EYFSP: adjusted odds ratio (aOR) 2.86, 95% CI 2.19-3.73) ( Table 2 ). Higher birthweight and female sex were protective for attainment although the gap between male and female children narrowed by age 7 years, especially for maths (EYFSP: (aOR) 1 96, 95% CI 1 82–2 11; maths: aOR 1 07, 95% CI 1 00–1 15) ( Table 2 ). Summer-born children, who enter school a year earlier than Autumn-born children, were nearly three times more likely to not meet expectations at EYFSP (aOR 2 64, 95% CI 2 41–2 90). Attainment did not differ between singletons and multiples. Impact of maternal characteristics Smoking during pregnancy increased the odds of under-attainment by 19–37% across outcomes ( Table 2 ). Increasing maternal age was protective, with each additional year associated with a 1–2% reduction in under-attainment. The effect of maternal diabetes increased after adjustment; however, hypertensive disorders had no statistical association with education attainment. Impact of care and interventions in the perinatal period A complete antenatal corticosteroid course administered to the mother was protective across all attainment timepoints and domains, whereas postnatal corticosteroids were consistently associated with elevated odds of not meeting the expected level of attainment (EYFSP: aOR, 1 37, 95% CI 1 13-1 65; KS1 maths: aOR 1 28, 95% CI 1 08-1 52). Lack of exclusive breastfeeding predicted poorer outcomes: mixed feeding had a lower association than exclusive formula feeding (EYFSP: aOR 1 19, 95% CI 1 07–1 33 versus aOR 1 51, 95% CI 1 37–1 66, respectively). Preterm complications/co-morbidities Of all covariates, neonatal brain injuries had the strongest associations with educational outcomes, particularly PVL (EYFSP: aOR 3 05, 95% CI 2 04–4 58) and hydrocephalus (EYFSP: aOR 2 47, 95% CI 1 48–4 13). PVL demonstrated the least attenuation after adjustment compared with other preterm complications/co-morbidities and had an effect size on par with being born at 23-24 weeks GA. Porencephalic cysts was associated with outcomes at KS1 but not earlier assessments. Infants with NEC, treated ROP, and BPD were linked to 1 5–2-fold higher odds of poor outcomes, while no association was found with sepsis. Socioeconomic and environmental exposures Socioeconomic disadvantage had a negative association with attainment at all ages. In adjusted models, children born in the most deprived quintile of neighbourhoods were 20–40% more likely to underachieve than those in the least deprived quintile (EYFSP: aOR 1.27, 95% CI 1.11–1.45), and children eligible for FSM were almost twice as likely to have poor outcomes, a magnitude on par with severe intraventricular haemorrhage (grade III–IV), Table 2 . Children whose primary language was not English were more likely to underachieve at EYFSP, though this difference was not present at KS1. There was no statistical interaction between deprivation and GA; the probability of poor attainment increased steadily with higher deprivation in all GA groups, confirming that deprivation exerts a comparable negative influence regardless of degree of prematurity (Figure S5). Overall, findings were consistent for KS1 science and writing (Figure S4, Table S6). Models showed low multicollinearity (VIF 1 28), moderate discrimination (AUC≈0.7) and classification performance (balanced accuracy of 0 63-0 66). Sensitivity analyses substituting major language spoken at home with ethnicity showed no consistent effect of ethnicity (Table S7). Effects of IMD and FSM were stable to its inclusion. Discussion In this large, population-based cohort study of preterm infants born in England before 32 weeks’ gestation between 2008 and 2012, there was a substantially elevated risk of not being ready for school at 5 years and of not meeting expected attainment levels in statutory tests at 6 and 7 years. There was a dose effect of prematurity: only a fifth of children born at 23-26 weeks and a third born at 27-31 weeks met expected levels of attainment at all time points. The data highlight the additive impact of socioeconomic deprivation in shaping the educational outcomes of children born very preterm. Those born in the most deprived quintile of neighbourhoods were 20–40% more likely not to meet expected levels of attainment than those born in the least deprived quintile, even after accounting for low GA and medical complications. Strikingly, FSM eligibility at age 5 years, a proxy for family income, was associated with an almost doubling risk of under-attainment, which is an effect size comparable to that of severe neonatal brain injury. Our findings corroborate education research showing that deprivation impacts pre-school neurodevelopmental outcome, 24 , 25 and cognitive neuroscience research showing that inequalities associate with differences in brain structure and connectivity, particularly in regions that support language, executive function, and memory, among preterm children. 10 , 26 The data indicate that social deprivation and PTB constitute a ‘double burden’. These adverse effects may be modifiable through family-level interventions and social and public policy designed to alleviate deprivation. This result is particularly important given that one-third of UK children live in relative poverty. 27 In addition, there is a need for continued clinical and research efforts to reduce severe neonatal brain injuries, NEC, BPD, and ROP, which all predicted low attainment. Whilst postnatal corticosteroid exposure was associated with low attainment, further work is required to explore whether the exposure is a proxy of illness severity or due to a direct effect on the developing brain. Although some of the PTB-RFs that are associated with low attainment are immutable (GA, male sex), others are potentially modifiable with targeted interventions, such as increasing breastfeeding rates during NNU care, improving antenatal corticosteroid use, and reducing maternal smoking. Studies are required to determine whether children born in the summer months could benefit from delayed school entry or targeted support, and whether very preterm boys and children growing up in deprived circumstances may have additional support needs. Ensuring that children born preterm with additional risk factors are supported for school readiness could confer life-course and societal benefits, including higher educational achievement and improved employability and income. 28 , 29 Strengths and limitations The study has several strengths. The use of a contemporary, socioeconomically and ethnically diverse, population-level cohort ensures high representativeness and generalisability to infants with access to modern neonatal intensive care. Furthermore, linkage with the NNRD ensured that we had a rich set of perinatal clinical variables. Socioeconomic status was triangulated from multiple data sources (IMD at birth, IDACI, and free school meal eligibility) to capture both neighbourhood-and family-level proxies of early-life deprivation, enhancing the robustness of our findings. As the UK government routinely collects these indicators, the findings are likely to be tractable to policymakers. We used multiple domains of educational outcomes, enabling us to identify shared and outcome-specific associations. Finally, the cohort is considerably larger than those reported in previous linkage studies of birth and education data, so was powered to detect novel associations in very preterm infants. 18 , 19 There are some limitations. First, 27 7% of eligible children were not linked due to missing or incomplete NHS number information. However, we did not identify biases, particularly socioeconomic, between groups with and without linked educational records. 1,029 (6%) children whom NHS Digital identified for linkage did not have an education record. Speculatively, this could include children who are home-schooled, in private or hospital schools, or have migrated since birth. Second, our adjusted models achieved a moderately discriminative AUC of 0 7. Omitted variable bias in the models may have resulted from unavailable data on important factors previously identified to increase school readiness, such as maternal education. 16 Third, we could not adjust for pre-existing neurodevelopmental impairment, so unmeasured variation in pre-school functioning may confound the observed associations at school age. 24 Finally, we did not have access to data from term-born controls, so the study may have been underpowered to detect an interaction effect of GA and deprivation. Due to differences in neonatal practice and in the assessment of educational outcomes, this study may have limitations in generalisability to LMIC settings. However, the findings suggest that maternal health behaviours, optimal use of antenatal corticosteroids, breast milk, and reducing co-morbidities are likely to be universally advantageous for improving developmental trajectories. 30 Future work We have demonstrated the methodological feasibility of linking population neonatal health to education data. Previous work has shown that parents support data linkage between health and education data; 14 continued follow-up of this cohort will enable evaluation of interventions, such as policy measures that reduce child deprivation. Identification of early life risk factors for low educational attainment will enhance research into the biological processes that embed preterm birth and social inequalities in child development. Conclusion This longitudinal birth cohort study found that children born at <32 weeks’ gestation often do not meet expected attainment levels in statutory educational assessments at 5-7 years. Low GA was strongly predictive of underachievement, but socioeconomic deprivation and several modifiable early-life exposures and co-morbidities were identified. Policies that reduce maternal and child deprivation, alongside clinical and research strategies that improve maternal health and minimise the co-morbidities of preterm birth, could improve school performance and potentially attenuate the life course impacts of being born too soon. Data Availability The data underlying this study cannot be shared publicly due to data-sharing agreements with NHS Digital and the Department for Education. Data availability The data underlying this study cannot be shared publicly due to data-sharing agreements with NHS Digital and the Department for Education. Acknowledgements The work was funded by UKRI Medical Research Council programme grant (MR/X003434/1) awarded to JPB. We wish to acknowledge all neonatal units who contribute data to the NNRD, known collectively as the UK Neonatal collaborative ( www.imperial.ac.uk/neonatal-data-analysis-unit/neonatal-data-analysis-unit/list-of-national-neonatal-units/ ). Infrastructure support for this research was provided by the NIHR Imperial Biomedical Research Centre (BRC) to the NNRD. Data were made available by the neoWONDER study supported by the National Institute for Health Research (NIHR) through an Advanced Fellowship awarded to CB (reference: NIHR300617). This work was undertaken in the Office for National Statistics Secure Research Service using data from ONS and other owners and does not imply the endorsement of the ONS or other data owners. We are grateful to the Department for Education for the provision of education data in the National Pupil Database. References 1. ↵ Ohuma , E.O. , et al. National, regional, and global estimates of preterm birth in 2020, with trends from 2010: a systematic analysis . Lancet 402 , 1261 – 1271 ( 2023 ). OpenUrl CrossRef PubMed 2. ↵ Inder , T.E. , Volpe , J.J. & Anderson , P.J . Defining the Neurologic Consequences of Preterm Birth . N Engl J Med 389 , 441 – 453 ( 2023 ). OpenUrl CrossRef PubMed 3. ↵ Saberian , S. , et al. Inequalities in neonatal unit mortality in England and Wales between 2012 and 2022: a retrospective cohort study . The Lancet Child & Adolescent Health 9 , 857 – 867 ( 2025 ). OpenUrl PubMed 4. ↵ Stoye , D.Q. , et al. Maternal cortisol is associated with neonatal amygdala microstructure and connectivity in a sexually dimorphic manner . Elife 9 ( 2020 ). 5. ↵ Lautarescu , A. , et al. Maternal Prenatal Stress Is Associated With Altered Uncinate Fasciculus Microstructure in Premature Neonates . Biol Psychiatry 87 , 559 – 569 ( 2020 ). OpenUrl CrossRef PubMed 6. ↵ Hagberg , H. , et al. The role of inflammation in perinatal brain injury . Nat Rev Neurol 11 , 192 – 208 ( 2015 ). OpenUrl CrossRef PubMed 7. ↵ Sullivan , G. , et al. Interleukin-8 dysregulation is implicated in brain dysmaturation following preterm birth . Brain Behav Immun 90 , 311 – 318 ( 2020 ). OpenUrl CrossRef PubMed 8. ↵ Sullivan , G. , et al. Breast Milk Exposure is Associated With Cortical Maturation in Preterm Infants . Ann Neurol 93 , 591 – 603 ( 2023 ). OpenUrl CrossRef PubMed 9. ↵ Boardman , J.P. & Counsell , S.J . Invited Review: Factors associated with atypical brain development in preterm infants: insights from magnetic resonance imaging . Neuropathol Appl Neurobiol 46 , 413 – 421 ( 2020 ). OpenUrl PubMed 10. ↵ McKinnon , K. , et al. Association of Preterm Birth and Socioeconomic Status With Neonatal Brain Structure . JAMA Netw Open 6 , e2316067 ( 2023 ). OpenUrl 11. ↵ Benavente-Fernandez , I. , Siddiqi , A. & Miller , S.P . Socioeconomic status and brain injury in children born preterm: modifying neurodevelopmental outcome . Pediatr Res 87 , 391 – 398 ( 2020 ). OpenUrl CrossRef PubMed 12. ↵ Modi , N . Information technology infrastructure, quality improvement and research: the UK National Neonatal Research Database . Transl Pediatr 8 , 193 – 198 ( 2019 ). OpenUrl CrossRef PubMed 13. ↵ Department for Education, The National Pupil Database User Guide. (United Kingdom, 2015 ). 14. ↵ van Blankenstein , E. , Aveline , A. & Battersby , C . A protocol for neoWONDER: Neonatal whole population data linkage to improve long-term health and wellbeing of preterm and sick babies . PLoS One 19 , e0305113 ( 2024 ). OpenUrl CrossRef PubMed 15. ↵ Department for Education, Early years foundation stage profile results: 2016 to 2017 . ( United Kingdom , 2017 ). 16. ↵ Raghuram , K. , Bando , N. & Janus , M . School readiness in children born preterm . Pediatric Research ( 2025 ). 17. ↵ Department for Education, Key stage 1 and phonics screening check attainment: Academic year 2021/22 . ( United Kingdom 2022 ). 18. ↵ Alterman , N. , et al. Gestational age at birth and academic attainment in primary and secondary school in England: Evidence from a national cohort study . PLoS One 17 , e0271952 ( 2022 ). OpenUrl CrossRef PubMed 19. ↵ Libuy , N. , et al. Gestational age at birth, chronic conditions and school outcomes: a population-based data linkage study of children born in England . Int J Epidemiol 52 , 132 – 143 ( 2023 ). OpenUrl CrossRef PubMed 20. ↵ Mactier , H. , et al. Perinatal management of extreme preterm birth before 27 weeks of gestation: a framework for practice . Archives of Disease in Childhood - Fetal and Neonatal Edition 105 , 232 – 239 ( 2020 ). OpenUrl 21. ↵ Department for Local Government and Communities, The English Index of Multiple Deprivation (IMD) 2015 (United Kingdom, 2015 ). 22. ↵ Hardin , J.W. & Hilbe , J.M. Generalized estimating equations , ( Chapman & Hall CRC , Boca Raton , 2013 ). 23. ↵ McHale , P. , et al. How do socioeconomic inequalities and preterm birth interact to modify health and education outcomes? A narrative systematic review . BMJ Open 15 , e084147 ( 2025 ). OpenUrl Abstract / FREE Full Text 24. ↵ Haider , S. , et al. Statistical learning to identify and characterise neurodevelopmental outcomes at 2 years in babies born preterm: model development and validation using population-level data from England and Wales . EBioMedicine 117 , 105811 ( 2025 ). 25. ↵ Benavente-Fernandez , I. , et al. Association of Socioeconomic Status and Brain Injury With Neurodevelopmental Outcomes of Very Preterm Children . JAMA Netw Open 2 , e192914 ( 2019 ). OpenUrl PubMed 26. ↵ Barda , T. , et al. The impact of socio-environmental factors on brain structure over the early life course of preterm-born individuals - A systematic review . Neuroscience & Biobehavioral Reviews 170 , 106061 ( 2025 ). 27. ↵ Department for Work and Pensions, Households Below Average Income: an analysis of the UK income distribution: FYE 1995 to FYE 2024. (United Kingdom, 2025 ). 28. ↵ Bolbocean , C. , et al. A heterogeneity analysis of health-related quality of life in early adults born very preterm or very low birthweight across the sociodemographic spectrum . Soc Sci Med 380 , 118181 ( 2025 ). 29. ↵ Gonen , E. , et al. Wealth Among Adults Aged 26 to 34 Years Born Very Preterm and Full Term . JAMA Netw Open 8 , e2510093 ( 2025 ). OpenUrl PubMed 30. ↵ Black , R.E. , et al. Health and development from preconception to 20 years of age and human capital . Lancet 399 , 1730 – 1740 ( 2022 ). OpenUrl PubMed View the discussion thread. Back to top Previous Next Posted November 17, 2025. Download PDF Supplementary Material Data/Code Email Thank you for your interest in spreading the word about medRxiv. NOTE: Your email address is requested solely to identify you as the sender of this article. Your Email * Your Name * Send To * Enter multiple addresses on separate lines or separate them with commas. You are going to email the following Health and socioeconomic characteristics underlying educational attainment of children born preterm in England: a population cohort study using linked data Message Subject (Your Name) has forwarded a page to you from medRxiv Message Body (Your Name) thought you would like to see this page from the medRxiv website. Your Personal Message CAPTCHA This question is for testing whether or not you are a human visitor and to prevent automated spam submissions. Share Health and socioeconomic characteristics underlying educational attainment of children born preterm in England: a population cohort study using linked data Sadia Haider , Athanasios Tsanas , G. David Batty , Rebecca M Reynolds , Melvyn Roffe , Heather C Whalley , Riccardo E Marioni , Hilary Richardson , Cheryl Battersby , James P Boardman medRxiv 2025.11.13.25340148; doi: https://doi.org/10.1101/2025.11.13.25340148 Share This Article: Copy Citation Tools Health and socioeconomic characteristics underlying educational attainment of children born preterm in England: a population cohort study using linked data Sadia Haider , Athanasios Tsanas , G. David Batty , Rebecca M Reynolds , Melvyn Roffe , Heather C Whalley , Riccardo E Marioni , Hilary Richardson , Cheryl Battersby , James P Boardman medRxiv 2025.11.13.25340148; doi: https://doi.org/10.1101/2025.11.13.25340148 Citation Manager Formats BibTeX Bookends EasyBib EndNote (tagged) EndNote 8 (xml) Medlars Mendeley Papers RefWorks Tagged Ref Manager RIS Zotero Tweet Widget Facebook Like Google Plus One Subject Area Pediatrics Subject Areas All Articles Addiction Medicine (570) Allergy and Immunology (864) Anesthesia (302) Cardiovascular Medicine (4445) Dentistry and Oral Medicine (444) Dermatology (383) Emergency Medicine (609) Endocrinology (including Diabetes Mellitus and Metabolic Disease) (1515) Epidemiology (15236) Forensic Medicine (30) Gastroenterology (1127) Genetic and Genomic Medicine (6610) Geriatric Medicine (669) Health Economics (1000) Health Informatics (4549) Health Policy (1370) Health Systems and Quality Improvement (1613) Hematology (543) HIV/AIDS (1266) Infectious Diseases (except HIV/AIDS) (15926) Intensive Care and Critical Care Medicine (1104) Medical Education (623) Medical Ethics (147) Nephrology (668) Neurology (6613) Nursing (346) Nutrition (999) Obstetrics and Gynecology (1147) Occupational and Environmental Health (957) Oncology (3341) Ophthalmology (975) Orthopedics (369) Otolaryngology (420) Pain Medicine (436) Palliative Medicine (130) Pathology (665) Pediatrics (1694) Pharmacology and Therapeutics (693) Primary Care Research (714) Psychiatry and Clinical Psychology (5458) Public and Global Health (9244) Radiology and Imaging (2205) Rehabilitation Medicine and Physical Therapy (1370) Respiratory Medicine (1197) Rheumatology (596) Sexual and Reproductive Health (715) Sports Medicine (530) Surgery (713) Toxicology (99) Transplantation (289) Urology (265) (function(){function c(){var b=a.contentDocument||a.contentWindow.document;if(b){var d=b.createElement('script');d.innerHTML="window.__CF$cv$params={r:'a0254e68dcbc67d4',t:'MTc3OTg4NzkxNA=='};var a=document.createElement('script');a.src='/cdn-cgi/challenge-platform/scripts/jsd/main.js';document.getElementsByTagName('head')[0].appendChild(a);";b.getElementsByTagName('head')[0].appendChild(d)}}if(document.body){var a=document.createElement('iframe');a.height=1;a.width=1;a.style.position='absolute';a.style.top=0;a.style.left=0;a.style.border='none';a.style.visibility='hidden';document.body.appendChild(a);if('loading'!==document.readyState)c();else if(window.addEventListener)document.addEventListener('DOMContentLoaded',c);else{var e=document.onreadystatechange||function(){};document.onreadystatechange=function(b){e(b);'loading'!==document.readyState&&(document.onreadystatechange=e,c())}}}})();
Text is read by the "Ask this paper" AI Q&A widget below.
Extraction quality varies by source — PMC NXML preserves structure
cleanly, OA-HTML may include some navigation residue, and OA-PDF can
have broken hyphenation. The publisher copy
(via DOI)
is the canonical version.