Full text
38,767 characters
· extracted from
preprint-html
· click to expand
Evaluation of post-acute COVID-19 health outcomes (ECHOES) in England: The development of national surveillance system for long- term health outcomes following COVID-19 | medRxiv /* */ /* */ <!-- <!-- /*! * yepnope1.5.4 * (c) WTFPL, GPLv2 */ (function(a,b,c){function d(a){return"[object Function]"==o.call(a)}function e(a){return"string"==typeof a}function f(){}function g(a){return!a||"loaded"==a||"complete"==a||"uninitialized"==a}function h(){var a=p.shift();q=1,a?a.t?m(function(){("c"==a.t?B.injectCss:B.injectJs)(a.s,0,a.a,a.x,a.e,1)},0):(a(),h()):q=0}function i(a,c,d,e,f,i,j){function k(b){if(!o&&g(l.readyState)&&(u.r=o=1,!q&&h(),l.onload=l.onreadystatechange=null,b)){"img"!=a&&m(function(){t.removeChild(l)},50);for(var d in y[c])y[c].hasOwnProperty(d)&&y[c][d].onload()}}var j=j||B.errorTimeout,l=b.createElement(a),o=0,r=0,u={t:d,s:c,e:f,a:i,x:j};1===y[c]&&(r=1,y[c]=[]),"object"==a?l.data=c:(l.src=c,l.type=a),l.width=l.height="0",l.onerror=l.onload=l.onreadystatechange=function(){k.call(this,r)},p.splice(e,0,u),"img"!=a&&(r||2===y[c]?(t.insertBefore(l,s?null:n),m(k,j)):y[c].push(l))}function j(a,b,c,d,f){return q=0,b=b||"j",e(a)?i("c"==b?v:u,a,b,this.i++,c,d,f):(p.splice(this.i++,0,a),1==p.length&&h()),this}function k(){var a=B;return a.loader={load:j,i:0},a}var l=b.documentElement,m=a.setTimeout,n=b.getElementsByTagName("script")[0],o={}.toString,p=[],q=0,r="MozAppearance"in l.style,s=r&&!!b.createRange().compareNode,t=s?l:n.parentNode,l=a.opera&&"[object Opera]"==o.call(a.opera),l=!!b.attachEvent&&!l,u=r?"object":l?"script":"img",v=l?"script":u,w=Array.isArray||function(a){return"[object Array]"==o.call(a)},x=[],y={},z={timeout:function(a,b){return b.length&&(a.timeout=b[0]),a}},A,B;B=function(a){function b(a){var a=a.split("!"),b=x.length,c=a.pop(),d=a.length,c={url:c,origUrl:c,prefixes:a},e,f,g;for(f=0;f<d;f++)g=a[f].split("="),(e=z[g.shift()])&&(c=e(c,g));for(f=0;f<b;f++)c=x[f](c);return c}function g(a,e,f,g,h){var i=b(a),j=i.autoCallback;i.url.split(".").pop().split("?").shift(),i.bypass||(e&&(e=d(e)?e:e[a]||e[g]||e[a.split("/").pop().split("?")[0]]),i.instead?i.instead(a,e,f,g,h):(y[i.url]?i.noexec=!0:y[i.url]=1,f.load(i.url,i.forceCSS||!i.forceJS&&"css"==i.url.split(".").pop().split("?").shift()?"c":c,i.noexec,i.attrs,i.timeout),(d(e)||d(j))&&f.load(function(){k(),e&&e(i.origUrl,h,g),j&&j(i.origUrl,h,g),y[i.url]=2})))}function h(a,b){function c(a,c){if(a){if(e(a))c||(j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}),g(a,j,b,0,h);else if(Object(a)===a)for(n in m=function(){var b=0,c;for(c in a)a.hasOwnProperty(c)&&b++;return b}(),a)a.hasOwnProperty(n)&&(!c&&!--m&&(d(j)?j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}:j[n]=function(a){return function(){var b=[].slice.call(arguments);a&&a.apply(this,b),l()}}(k[n])),g(a[n],j,b,n,h))}else!c&&l()}var h=!!a.test,i=a.load||a.both,j=a.callback||f,k=j,l=a.complete||f,m,n;c(h?a.yep:a.nope,!!i),i&&c(i)}var i,j,l=this.yepnope.loader;if(e(a))g(a,0,l,0);else if(w(a))for(i=0;i (function(w,d,s,l,i){w[l]=w[l]||[];w[l].push({'gtm.start':new Date().getTime(),event:'gtm.js'});var f=d.getElementsByTagName(s)[0];var j=d.createElement(s);var dl=l!='dataLayer'?'&l='+l:'';j.src='//www.googletagmanager.com/gtm.js?id='+i+dl;j.type='text/javascript';j.async=true;f.parentNode.insertBefore(j,f);})(window,document,'script','dataLayer','GTM-P4HH5NV'); Skip to main content Home About Submit ALERTS / RSS Search for this keyword Advanced Search Evaluation of post-acute COVID-19 health outcomes (ECHOES) in England: The development of national surveillance system for long- term health outcomes following COVID-19 View ORCID Profile Hester Allen , Katie Hassell , Christopher Rawlinson , Owen Pullen , Colin Campbell , Annika M. Jödicke , Martí Català , View ORCID Profile Albert Prats Uribe , View ORCID Profile Gavin Dabrera , View ORCID Profile Daniel Prieto-Alhambra , View ORCID Profile Ines Campos-Matos doi: https://doi.org/10.1101/2024.10.18.24315744 Hester Allen 1 Immunisation and Vaccine Preventable Diseases Division, UK Health Security Agency , 61 Colindale Avenue, London, vNW9 5EQ, UK 2 Health Data Sciences, Centre for Statistics in Medicine, Nuffield Department of Orthopaedics, Rheumatology and Musculoskeletal Sciences (NDORMS), University of Oxford , UK Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Hester Allen For correspondence: hester.allen{at}seh.ox.ac.uk Katie Hassell 1 Immunisation and Vaccine Preventable Diseases Division, UK Health Security Agency , 61 Colindale Avenue, London, vNW9 5EQ, UK Find this author on Google Scholar Find this author on PubMed Search for this author on this site Christopher Rawlinson 1 Immunisation and Vaccine Preventable Diseases Division, UK Health Security Agency , 61 Colindale Avenue, London, vNW9 5EQ, UK Find this author on Google Scholar Find this author on PubMed Search for this author on this site Owen Pullen 1 Immunisation and Vaccine Preventable Diseases Division, UK Health Security Agency , 61 Colindale Avenue, London, vNW9 5EQ, UK 3 Student EPSRC Centre for Doctoral Training in Health Data Science, Department of Computer Science, University of Oxford Find this author on Google Scholar Find this author on PubMed Search for this author on this site Colin Campbell 1 Immunisation and Vaccine Preventable Diseases Division, UK Health Security Agency , 61 Colindale Avenue, London, vNW9 5EQ, UK Find this author on Google Scholar Find this author on PubMed Search for this author on this site Annika M. Jödicke 2 Health Data Sciences, Centre for Statistics in Medicine, Nuffield Department of Orthopaedics, Rheumatology and Musculoskeletal Sciences (NDORMS), University of Oxford , UK Find this author on Google Scholar Find this author on PubMed Search for this author on this site Martí Català 2 Health Data Sciences, Centre for Statistics in Medicine, Nuffield Department of Orthopaedics, Rheumatology and Musculoskeletal Sciences (NDORMS), University of Oxford , UK Find this author on Google Scholar Find this author on PubMed Search for this author on this site Albert Prats Uribe 2 Health Data Sciences, Centre for Statistics in Medicine, Nuffield Department of Orthopaedics, Rheumatology and Musculoskeletal Sciences (NDORMS), University of Oxford , UK Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Albert Prats Uribe Gavin Dabrera 1 Immunisation and Vaccine Preventable Diseases Division, UK Health Security Agency , 61 Colindale Avenue, London, vNW9 5EQ, UK Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Gavin Dabrera Daniel Prieto-Alhambra 2 Health Data Sciences, Centre for Statistics in Medicine, Nuffield Department of Orthopaedics, Rheumatology and Musculoskeletal Sciences (NDORMS), University of Oxford , UK 5 Department of Medical Informatics, Erasmus Medical Centre University , Rotterdam, Netherlands Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Daniel Prieto-Alhambra Ines Campos-Matos 1 Immunisation and Vaccine Preventable Diseases Division, UK Health Security Agency , 61 Colindale Avenue, London, vNW9 5EQ, UK 2 Health Data Sciences, Centre for Statistics in Medicine, Nuffield Department of Orthopaedics, Rheumatology and Musculoskeletal Sciences (NDORMS), University of Oxford , UK Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Ines Campos-Matos Abstract Full Text Info/History Metrics Supplementary material Data/Code Preview PDF Abstract Introduction Electronic health records can be used to understand the diverse presentation of post-acute and long-term health outcomes following COVID-19 infection. In England, the UK Health Security Agency in collaboration with the University of Oxford have created the ECHOES dataset to monitor how an initial SARS-CoV-2 infection episode is associated with changes in the risk of health outcomes that are recorded in routinely collected health data. Methods The ECHOES dataset is as a national level dataset combining national level surveillance, administrative, and healthcare data. Entity resolution and data linkages methods are used to create a cohort of individuals who have tested positive and negative for SARS-CoV-2 in England throughout the COVID-19 pandemic, alongside information on a range of health outcomes including diagnosed clinical conditions and mortality, and risk factor information. Results The dataset contains comprehensive COVID-19 testing data and demographic, socio economic and health related information for 44 million individuals, who tested for SARS-CoV-2 between March 2020 and April 2022, representing 15,720,286 individuals who tested positive and 42,351,016 individuals who tested negative. Discussion With the application of epidemiological and statistical methods, this dataset allows a range of clinical outcomes to be investigated, including pre-specified health conditions and mortality. Furthermore, understanding of potential determinants of health outcomes can be gained, including pre-existing health conditions, acute disease characteristics, SARS-CoV-2 vaccination status and genomic variant. Introduction SARS-CoV-2 infection typically causes an acute respiratory syndrome, and there has been significant research into different health outcomes within the acute period following symptom onset, such as critical care admission and death. Increasingly, data driven approaches to characterise and determine the prevalence, symptoms and risk factors of post-acute COVID-19 are being developed ( 4 , 5 ). Electronic health records can be used to understand the diverse presentation of post-acute and long-term COVID-19 heath outcomes in representative populations and in routine care ( 3 ). In England, during the COVID-19 pandemic, robust, national surveillance systems were developed to collect comprehensive data to monitor trends in COVID-19. Using these data, UKHSA, in collaboration with the University of Oxford, have developed the Evaluation of Post-acute COVID-19 Health Outcomes (ECHOES) dataset. The purpose of this surveillance dataset is to monitor how an initial SARS-CoV-2 infection episode is associated with changes in the risk of health outcomes that are recorded through secondary care use, and death. To overcome limitations of other publications in the literature, of which many have focused on those with the most severe acute SARS-CoV-2 infection, we developed this dataset to include a broad range of both community based and hospitalised cases, as well as a developed control group based on negative laboratory tests. ECHOES is a dataset designed as a longitudinal cohort comprising individuals tested for SARS-CoV-2 in England throughout the COVID-19 pandemic. This dataset benefits from the use of a range of large data including, comprehensive, national level SARS-CoV-2 testing data, genomic sequencing data and vaccination records, alongside extensive demographic, socio economic and health related information. The use of routine health record datasets allows health outcomes, including those presented in secondary healthcare settings to be assessed using pre-existing methodologies, and therefore outcomes can be comparable during the exposure and follow-up periods and between persons with SARS-CoV-2 infection and test negative controls. As part of the remit to diagnose, control, prevent, and describe trends in communicable diseases and other risks to public health, UKHSA processes personal information to develop and maintain surveillance systems and conduct infection control activities( 7 ), in accordance with Regulation 3 SI 1438 Control of Healthcare Information Regulations 2002 (s251)( 8 ) as the legal basis for data processing in the absence of individual consent. Methods The ECHOES dataset is a longitudinal cohort capturing individuals who tested for SARS-CoV-2 between March 2020 and May 2022. This cohort is linked to multiple data sources to obtain information on health outcomes occurring in the post-acute phase (defined as >28 days after test), and factors associated with the COVID-19 infection and health outcomes. Building of the dataset occurs in three steps: cohort building, linkage to additional data sources, and matching. Data processing is carried out using SQL and statistical analysis is carried out using R, working within UKHSA secure servers. Data sources The data sources utilised to build the ECHOES dataset are all routinely collected national level surveillance, administrative, and healthcare data for which UKHSA are the owners or processors. This dataset is built linking: COVID-19 testing data; the National Immunisation Management system (NIMS); the Office of National statistics All-cause mortality data; and Hospital Episode statistics. COVID-19 testing data are collected through two data systems – the Second-Generation Surveillance System (SGSS) and the Unified Sample Dataset (USD). Second generation surveillance system (SGSS) collects infectious disease laboratory test information from diagnostic laboratories in England ( 4 ). SARS-CoV-2 testing data in SGSS includes polymerase chain reaction (PCR) tests from NHS settings (including NHS patients and staff) and PCR and lateral flow device (LFD) tests from community settings, submitted by individuals via an NHS website. SGSS records are validated and enhanced using the NHS spine, a database containing person identifying information (PII) for everyone who has ever had a contact with the NHS( 5 ). Positive test records are converted to cases and infection episodes, deduplicating records using the Organism-Patient-Illness Episode (OPIE) principle, whereby episodes constitute a positive organism in a defined time-period. For COVID-19, episodes are defined as 91 days from an individual’s earliest positive specimen date within a previous episode( 4 ). Where available, SARS-CoV-2 genomic information is included in SGSS( 6 ). In England, during the pandemic, genomic investigation and variant assignment was coordinated by the COVID-19 Genomics UK consortium (COG UK). A sample of eligible SARS-CoV-2 PCR samples underwent genomic investigation via: i) whole genome sequencing ii) reflex (genotyping) assays to detect key mutations, and iii) S-gene target status of PCR tests carried out on the TaqPath assay. The Unified sample dataset (USD) is a repository for positive and negative COVID-19 testing data in England, including all PCR and LFD tests ( 7 ). Testing data are sourced from SGSS, Respiratory Datamart (a laboratory reporting system designed for influenza test data collection)( 8 ) and the National Pathology Exchange (NPEX). Test records are enriched with patient information from the NHS spine ( 9 ). The national immunisation management system (NIMS) collects information on individuals eligible for SARS-CoV-2 vaccination and on administered vaccinations across a range of settings. It was commissioned in 2020 as part of the national influenza and COVID-19 vaccination programmes ( 13 , 14 ). NIMS contains two data views: person records for all individuals issued with an NHS number in England (the NIMS population denominator) who were alive when the vaccination programme began in December 2020, identifying those eligible for vaccination; and detailed vaccination records for all individuals who have received at least one dose of SARS-CoV-2 vaccination. Patient information is obtained from the NHS spine and undergoes validation to improve accuracy and completeness. All-cause mortality data are obtained from death registrations for England and Wales collated by the Office for National Statistics (ONS)( 15 ). Data are reported at person level and contain information about the death and the deceased individual. Causes of death, including underlying and primary cause of death are provided as International Classification of Diseases (ICD-10) codes, obtained through using automatic coding software to convert text terms from the death certificate. Primary cause of death refers to the disease or condition directly leading to death and underlying cause is the significant conditions contributing to the death (16). Hospital Episode Statistics collects information about all NHS hospital admissions, Accident and Emergency (A&E) attendances and outpatient visits in England (17). Standardised codes for procedures (Office of Population Censuses and Surveys (OPCS) codes) and diagnoses and medical conditions (ICD-10 codes), are captured for each episode, including information on primary diagnosis, treatment, co-morbidities and complications (20). Supplementary Table 1 describes the features of the datasets used in the production of these data. Cohort building methods To create a cohort of individuals who tested positive and negative for SARS-CoV-2 we identify unique individuals who have tested positive and negative within the COVID-19 testing datasets. This is done by applying entity resolution methods, which utilise PII and demographic information to create a dataset containing key identifiers for linkage to other data sources. Entity resolution involves SGSS, USD, the NIMS denominator and death registration data. Individuals can be captured in both the SGSS and USD testing data multiple times. The entity resolution methods use linkage methods between these data and the NIMS and death registration data to identity unique individuals within the testing data. To date, COVID-19 test and death registration records from January 2020 to December 2023, and NIMS records for those eligible for vaccination from December 2020 to May 2022 are included in the entity resolution process. To maximise uniformity, datasets are initially cleaned, removing all non-alphanumeric characters and additional spaces present in name, NHS number and postcode variables, and NHS numbers and postcodes are validated ( 9 ). The NIMS denominator acts as the gold-standard for PII as information is obtained from the NHS spine, and death registration data provides validated PII for deceased individuals. The entity resolution process runs, firstly between SGSS, USD and NIMS and secondly between SGSS, USD and death registration data. Each stage consists of 5 sequential iterations ( Table 1 ) and nine sub-iterations ( Table 2 ). Once linked, individuals are excluded from following iterations. All iterations include deterministic matching of at least three person identifiers (of NHS number, sex, residential postcode and date of birth) and deterministic matching and probabilistic matching (using the LIKE and DIFF SQL functions) of forename and surname. View this table: View inline View popup Download powerpoint Table 1: Description of entity resolution iterations 1.1 to 5.9 used in ECHOES cohort creation View this table: View inline View popup Table 2: Description of entity resolution sub iterations 1 to 9 used in ECHOES cohort creation Iteration one includes all identifiers (NHS number, forename, surname, DOB, sex and postcode). Subsequent iterations exclude postcode, NHS number and sex and consider alternative formatting of person identifiers. This account for where people may have changed residence over the time-period captured, where different formatting of names have been used across datasets (eg. Anne-Marie vs Anne Marie) and where key fields are missing, such as NHS number and erroneously entered, such as sex. These iterations are carried out between the two testing data sources and NIMS denominator data, then for records not successfully linked, between testing data and ONS death registration data. Following entity resolution, all PII except NHS number which is required for linkage to other data sources are removed from the dataset. 2.3 Censoring and exclusion criteria Exclusion criteria and censoring rules are then applied. All records require a valid NHS number which has been verified against or obtained from NIMS or death registration data, therefore testing records not linked during the entity resolution process were excluded. To investigate post-acute outcomes, individuals are required to have survived beyond the acute phase of infection, with follow-up starting 28 days after individuals’ earliest positive and negative tests dates. Data are at individual and test result level, as individuals can contribute both positive and negative follow-up time. If an individual tests negative before their first positive, both tests are included, however, if the positive test is within 28 days of the negative test, the negative test is negated, and the positive test retained. Positive test records are not negated if a negative test is recorded within 28 days. To assess time at risk, follow-up time is calculated. For negatives, follow-up time is calculated from 28 days after their negative test, and whichever comes first of a) date of death, b) a positive test or, c) the health outcome of interest occurs. For positives, between earliest test date and date of death or outcome occurrence ( Figure 2 ). Linkage to other data sources The ECHOES cohort is linked (using NHS number) to other data sources to obtain information a range of health outcomes and factors associated with the SARS-CoV-2 infection and health outcomes. These include cause of death, pre-existing health conditions, comorbidities, and acute phase hospitalisation (Supplementary Table 1). All-cause mortality provides date and cause of death. Time to death is calculated and cause of death ICD-10 codes are categorised into disease groups( 13 ). Vaccination status at time of test is obtained from NIMS and is defined in several ways: i) as fully vaccinated (having two or more vaccine doses) or unvaccinated, ii) by time since last vaccine dose received. Linkage of the ECHOES cohort to HES allows a range of health indicators including acute disease characteristics and pre-existing health conditions to be developed, as well as post-acute health outcomes to be defined. Hospital admission information at the time of test can be used to indicate hospitalisation during the acute phase of COVID-19 as well as whether an individual’s SARS-CoV-2 test was carried out in a hospital setting. Diagnosis ICD-10 codes captured in HES can be used to indicate pre-existing conditions and comorbidities if recorded prior individual’s test. Specific pre-existing conditions can be defined and categorised using the standard ICD-10 chapter categorisations or through clinical phenotyping of diagnosis codes, and comorbidities scores can be assigned using tools such as the Charlson Comorbidity index( 14 ). Furthermore, information on hospital admissions and procedures occurring during the post-acute phase can indicate healthcare usage, and by applying using similar disease area and condition categorisation methods, diagnosis codes during this phase can be used to define post-acute health outcomes within varying time periods after an individual’s initial SARS-CoV-2 test. Following data linkage, all PII are removed from the dataset. Analytical method The aim of analyses using these data is to compare the risk of post-acute health outcomes between those who tested positive and negative for SARS-CoV-2. Using this cohort, a range of study designs can be used to assess different outcomes within individual’s follow-up time. A matched cohort design can be applied, matching individuals who test positive and negative on a range of characteristics, depending on the objectives of the study. Results The entity resolution process using 16,598,060 positive episodes and 421,875,882 negative tests recorded at the time of dataset development result in 92.8% of positive records and 85.7% of negative records who tested between March 2020 and May 2022 being linked to a person record. Following censoring and exclusion, 44,234,762 unique individuals who have tested for COVID-19 are included. As individuals can be included in the positive and negative groups, this represents 15,720,286 positive individuals and 42,351,016 negative individuals ( Figure 1 ). Download figure Open in new tab Download figure Open in new tab Discussion The development of ECHOES the dataset will facilitate the investigation of a range of post-acute health outcomes, including pre-specified health conditions and mortality. These investigations will allow greater understanding of how a SARS-CoV-2 infection episode is associated with changes in the risk of health outcomes, and the long-term impacts of COVID-19 more generally. Further, these data allow potential determinants of these outcomes to be accounted for in any analyses. The inclusion of national level COVID-19 testing data in the ECHOES dataset creates a representative dataset, mirroring the overall population in England. The use of these data also allows the ECHOES dataset to capture those testing with asymptomatic infection and those with more severe disease testing in hospital settings. A major strength of ECHOES is its large size. This facilitates the investigation of rare outcomes and for research questions unanswerable by smaller datasets to be answered. Using person level data from multiple data sources allows comprehensive linkage methods to be developed to create an accurate testing record for each individual. Furthermore, it facilitates the creation of a robust control group. This adds validity to the results produced, allows multiple study designs to be applied and means the findings are more generalisable to the general population. Additionally, using multiple data sources means a range of health outcomes and risk factors can be investigated. Demographic factors such as age, sex, residential location, ethnicity and IMD can be considered, alongside vaccination status, comorbidities, pre-existing health conditions, acute disease severity and SARS-CoV-2 variant. Moreover, outcomes identified will not have to be considered independently and can be considered as indicators of future health outcomes. Despite capturing all COVID-19 tests in England, certain individuals are excluded from the ECHOES dataset. Including only those with a valid NHS number may exclude specific population groups such as those who do not engage in healthcare. However, as ECHOES aims to compare outcomes between positive and negative groups rather than providing robust prevalence estimates for outcomes, this is unlikely to significantly impact the results produced. Additionally, certain population groups that did not self-report their home test results may be excluded. How not being entitled to sick pay and other barriers to testing impacted different population groups needs to be considered when generalising results. Early in the pandemic, prior to self-administered test availability, testing was limited to PCR tests in healthcare settings (March to June 2020) and non-hospitalised COVID-19 cases had limited access to testing. This may introduce inaccuracies in the results, however, these can by overcome by analysis by different time-periods. Changes in test availability may lead to underrepresentation of population groups and misclassification of individuals. For example, individual’s earliest recorded positive tests could be a reinfection and individuals who tested negative may have also tested positive but never reported the result. Lastly, the dataset is designed for long term follow-up individuals, with periodic linkage to updated health outcome data. As widescale community testing was ceased in England in April 2022 but COVID-19 has continued to circulate in the population, if individuals are infected with SARS-CoV-2 after this date, this may not be captured, therefore resulting in potential misclassification of the negative group over time, causing a reduction in risk difference between the two testing groups for certain outcomes. Furthermore, by not including individuals who’s first COVID-19 infection was after community testing was ceased may result in some under-estimation of the post-acute health outcomes of these of these later COVID-19 infections that may be distinct from those in the earlier time periods. Despite these limitations, the ECHOES dataset offers a robust and comprehensive tool for investigating the post-acute health outcomes of COVID-19 in England. The dataset’s strengths will significantly enhance our understanding of the long-term impacts of SARS-CoV-2 infection. Data Availability Any research conducted using the ECHOES dataset must be done as a formal collaboration with UKHSA. Proposals for collaboration will be considered by the Immunisation and Vaccine Preventable Diseases team to evaluate the scientific quality and feasibility of the proposal. Data resource access Any research conducted using the ECHOES dataset must be done as a formal collaboration with UKHSA. Proposals for collaboration will be considered by the Immunisation and Vaccine Preventable Diseases team to evaluate the scientific quality and feasibility of the proposal. Ethics, Caldicott and Data protection approvals The production and analysis of this dataset has been approved by the UKHSA Caldicott Advisory Pane( 15 )l (Application reference CAP-2022-13) and the UKHSA Research & Public Health Practice Ethics and Governance Group (SUKHS REGG-Application reference NR0312). A Data Protection Impact Assessment was approved by DHSC Office of the Data Protection Officer in June 2023. Conflict of Interest DPA’s department has received grant/s from Amgen, Chiesi-Taylor, Lilly, Janssen, Novartis, and UCB Biopharma. His research group has received consultancy fees from Astra Zeneca and UCB Biopharma. Amgen, Astellas, Janssen, Synapse Management Partners and UCB Biopharma have funded or supported training programmes organised by DPA’s department. Author Contributions All authors were involved in the design of the ECHOES database and have contributed to the drafting of the manuscript. HA wrote the manuscript and lead on the design of the ECHOES database with oversight from ICM. KH led on the development of the database and development of entity resolution methods with support from CR and OP, APU, AJ, MCS have provided academic input into the design of the dataset. CC provided oversight specially for areas relating to vaccination data and GD and DPA have provided overall oversight. Funding Routine work undertaken by UK Health Security Agency as part of public health response. No external funding received. Acknowledgments We thank the Data Operations team at UKHSA for coordinating data flows and the IT infrastructure to build the ECHOES dataset, the ECHOES steering group including Russell Hope, Guy Harling and Daniel Ayoubkhani and all colleagues working on COVID-19 Vaccine and Epidemiology at UKHSA who have inputted to discussions regarding the development of ECHOES. References 1. Zhang H , Zang C , Xu Z , Zhang Y , Xu J , Bian J , et al. Data-driven identification of post-acute SARS-CoV-2 infection subphenotypes . Nat Med [Internet] . 2023 Jan [cited 2023 Aug 14 ]; 29 ( 1 ): 226 – 35 . Available from: https://www.nature.com/articles/s41591-022-02116-3 OpenUrl 2. Symptom clusters in COVID-19: A potential clinical prediction tool from the COVID Symptom Study app . SCIENCE ADVANCES . 2021 ; 3. ↵ Pfaff ER , Girvin AT , Bennett TD , Bhatia A , Brooks IM , Deer RR , et al. Identifying who has long COVID in the USA: a machine learning approach using N3C data . The Lancet Digital Health [Internet] . 2022 Jul [cited 2023 Aug 14 ]; 4 ( 7 ): e532 – 41 . Available from: https://linkinghub.elsevier.com/retrieve/pii/S2589750022000486 OpenUrl 4. ↵ UK Health Security Agency . Laboratory reporting to UKHSA: Guide for diagnostic laboratories [Internet] . 2022 Jan . Available from: https://assets.publishing.service.gov.uk/government/uploads/system/uploads/attachment_data/file/1108438/UKHSA_Laboratory_reporting_guidelines1_.pdf 5. ↵ NHS Digital [Internet] . [cited 2023 Mar 17 ]. Spine . Available from: https://digital.nhs.uk/services/spine 6. ↵ Twohig KA , Harman K , Zaidi A , Aliabadi S , Nash SG , Sinnathamby M , et al. Representativeness of whole-genome sequencing approaches in England: the importance for understanding inequalities associated with SARS-CoV-2 infection . Epidemiol Infect [Internet] . 2023 [cited 2024 Jul 26 ]; 151 : e169 . Available from: https://www.cambridge.org/core/product/identifier/S0950268823001541/type/journal_article OpenUrl 7. ↵ Covid-19 Unified Sample Dataset (USD ). 8. ↵ GOV.UK [Internet] . [cited 2023 Mar 17 ]. Sources of surveillance data for influenza, COVID-19 and other respiratory viruses . Available from: https://www.gov.uk/government/publications/sources-of-surveillance-data-for-influenza-covid-19-and-other-respiratory-viruses/sources-of-surveillance-data-for-influenza-covid-19-and-other-respiratory-viruses 9. ↵ MikeRayMSFT . int, bigint, smallint, and tinyint (Transact-SQL) - SQL Server [Internet] . 2023 [cited 2023 Mar 24 ]. Available from: https://learn.microsoft.com/en-us/sql/t-sql/data-types/int-bigint-smallint-and-tinyint-transact-sql 10. rwestMSFT . LIKE (Transact-SQL) - SQL Server [Internet] . 2023 [cited 2023 Mar 17 ]. Available from: https://learn.microsoft.com/en-us/sql/t-sql/language-elements/like-transact-sql 11. DIFFERENCE (Transact-SQL) - SQL Server | Microsoft Learn [Internet] . [cited 2023 Mar 17 ]. Available from: https://learn.microsoft.com/en-us/sql/t-sql/functions/difference-transact-sql?view=sql-server-ver16 12. MikeRayMSFT . SOUNDEX (Transact-SQL) - SQL Server [Internet] . 2023 [cited 2023 Mar 17 ]. Available from: https://learn.microsoft.com/en-us/sql/t-sql/functions/soundex-transact-sql 13. ↵ Seghezzo G , Allen H , Griffiths C , Pooley J , Beardsmore L , Caul S , et al. Comparison of two COVID-19 mortality measures used during the pandemic response in England . International Journal of Epidemiology [Internet] . 2024 Feb 1 [cited 2024 Jul 26 ]; 53 ( 1 ): dyad116 . Available from : doi: 10.1093/ije/dyad116/7249287 OpenUrl CrossRef 14. ↵ NCI Comorbidity Index Overview [Internet] . [cited 2023 Aug 10 ]. Available from: https://healthcaredelivery.cancer.gov/seermedicare/considerations/comorbidity.html 15. ↵ GOV.UK [Internet] . [cited 2023 Nov 9 ]. The Caldicott Principles . Available from: https://www.gov.uk/government/publications/the-caldicott-principles View the discussion thread. Back to top Previous Next Posted October 21, 2024. Download PDF Supplementary Material Data/Code Email Thank you for your interest in spreading the word about medRxiv. NOTE: Your email address is requested solely to identify you as the sender of this article. Your Email * Your Name * Send To * Enter multiple addresses on separate lines or separate them with commas. You are going to email the following Evaluation of post-acute COVID-19 health outcomes (ECHOES) in England: The development of national surveillance system for long- term health outcomes following COVID-19 Message Subject (Your Name) has forwarded a page to you from medRxiv Message Body (Your Name) thought you would like to see this page from the medRxiv website. Your Personal Message CAPTCHA This question is for testing whether or not you are a human visitor and to prevent automated spam submissions. Share Evaluation of post-acute COVID-19 health outcomes (ECHOES) in England: The development of national surveillance system for long- term health outcomes following COVID-19 Hester Allen , Katie Hassell , Christopher Rawlinson , Owen Pullen , Colin Campbell , Annika M. Jödicke , Martí Català , Albert Prats Uribe , Gavin Dabrera , Daniel Prieto-Alhambra , Ines Campos-Matos medRxiv 2024.10.18.24315744; doi: https://doi.org/10.1101/2024.10.18.24315744 Share This Article: Copy Citation Tools Evaluation of post-acute COVID-19 health outcomes (ECHOES) in England: The development of national surveillance system for long- term health outcomes following COVID-19 Hester Allen , Katie Hassell , Christopher Rawlinson , Owen Pullen , Colin Campbell , Annika M. Jödicke , Martí Català , Albert Prats Uribe , Gavin Dabrera , Daniel Prieto-Alhambra , Ines Campos-Matos medRxiv 2024.10.18.24315744; doi: https://doi.org/10.1101/2024.10.18.24315744 Citation Manager Formats BibTeX Bookends EasyBib EndNote (tagged) EndNote 8 (xml) Medlars Mendeley Papers RefWorks Tagged Ref Manager RIS Zotero Tweet Widget Facebook Like Google Plus One Subject Area Epidemiology Subject Areas All Articles Addiction Medicine (573) Allergy and Immunology (865) Anesthesia (302) Cardiovascular Medicine (4453) Dentistry and Oral Medicine (444) Dermatology (383) Emergency Medicine (609) Endocrinology (including Diabetes Mellitus and Metabolic Disease) (1515) Epidemiology (15242) Forensic Medicine (30) Gastroenterology (1131) Genetic and Genomic Medicine (6615) Geriatric Medicine (669) Health Economics (1001) Health Informatics (4552) Health Policy (1372) Health Systems and Quality Improvement (1614) Hematology (543) HIV/AIDS (1270) Infectious Diseases (except HIV/AIDS) (15929) Intensive Care and Critical Care Medicine (1106) Medical Education (624) Medical Ethics (147) Nephrology (670) Neurology (6625) Nursing (346) Nutrition (999) Obstetrics and Gynecology (1148) Occupational and Environmental Health (957) Oncology (3344) Ophthalmology (979) Orthopedics (369) Otolaryngology (421) Pain Medicine (436) Palliative Medicine (130) Pathology (665) Pediatrics (1696) Pharmacology and Therapeutics (693) Primary Care Research (714) Psychiatry and Clinical Psychology (5461) Public and Global Health (9252) Radiology and Imaging (2207) Rehabilitation Medicine and Physical Therapy (1371) Respiratory Medicine (1197) Rheumatology (597) Sexual and Reproductive Health (715) Sports Medicine (530) Surgery (714) Toxicology (99) Transplantation (289) Urology (265) (function(){function c(){var b=a.contentDocument||a.contentWindow.document;if(b){var d=b.createElement('script');d.innerHTML="window.__CF$cv$params={r:'a02bf9c74b491640',t:'MTc3OTk1Nzg0OA=='};var a=document.createElement('script');a.src='/cdn-cgi/challenge-platform/scripts/jsd/main.js';document.getElementsByTagName('head')[0].appendChild(a);";b.getElementsByTagName('head')[0].appendChild(d)}}if(document.body){var a=document.createElement('iframe');a.height=1;a.width=1;a.style.position='absolute';a.style.top=0;a.style.left=0;a.style.border='none';a.style.visibility='hidden';document.body.appendChild(a);if('loading'!==document.readyState)c();else if(window.addEventListener)document.addEventListener('DOMContentLoaded',c);else{var e=document.onreadystatechange||function(){};document.onreadystatechange=function(b){e(b);'loading'!==document.readyState&&(document.onreadystatechange=e,c())}}}})();
Text is read by the "Ask this paper" AI Q&A widget below.
Extraction quality varies by source — PMC NXML preserves structure
cleanly, OA-HTML may include some navigation residue, and OA-PDF can
have broken hyphenation. The publisher copy
(via DOI)
is the canonical version.