Health Information Exchanges (HIEs) as Novel Sources for Population-Based Post Marketing Surveillance of Medical Products: A Pilot Study from the FDA Sentinel Innovation Center

preprint OA: closed
📄 Open PDF Full text JSON View at publisher
Full text 43,646 characters · extracted from preprint-html · click to expand
Health Information Exchanges (HIEs) as Novel Sources for Population-Based Post Marketing Surveillance of Medical Products: A Pilot Study from the FDA Sentinel Innovation Center | medRxiv /* */ /* */ <!-- <!-- /*! * yepnope1.5.4 * (c) WTFPL, GPLv2 */ (function(a,b,c){function d(a){return"[object Function]"==o.call(a)}function e(a){return"string"==typeof a}function f(){}function g(a){return!a||"loaded"==a||"complete"==a||"uninitialized"==a}function h(){var a=p.shift();q=1,a?a.t?m(function(){("c"==a.t?B.injectCss:B.injectJs)(a.s,0,a.a,a.x,a.e,1)},0):(a(),h()):q=0}function i(a,c,d,e,f,i,j){function k(b){if(!o&&g(l.readyState)&&(u.r=o=1,!q&&h(),l.onload=l.onreadystatechange=null,b)){"img"!=a&&m(function(){t.removeChild(l)},50);for(var d in y[c])y[c].hasOwnProperty(d)&&y[c][d].onload()}}var j=j||B.errorTimeout,l=b.createElement(a),o=0,r=0,u={t:d,s:c,e:f,a:i,x:j};1===y[c]&&(r=1,y[c]=[]),"object"==a?l.data=c:(l.src=c,l.type=a),l.width=l.height="0",l.onerror=l.onload=l.onreadystatechange=function(){k.call(this,r)},p.splice(e,0,u),"img"!=a&&(r||2===y[c]?(t.insertBefore(l,s?null:n),m(k,j)):y[c].push(l))}function j(a,b,c,d,f){return q=0,b=b||"j",e(a)?i("c"==b?v:u,a,b,this.i++,c,d,f):(p.splice(this.i++,0,a),1==p.length&&h()),this}function k(){var a=B;return a.loader={load:j,i:0},a}var l=b.documentElement,m=a.setTimeout,n=b.getElementsByTagName("script")[0],o={}.toString,p=[],q=0,r="MozAppearance"in l.style,s=r&&!!b.createRange().compareNode,t=s?l:n.parentNode,l=a.opera&&"[object Opera]"==o.call(a.opera),l=!!b.attachEvent&&!l,u=r?"object":l?"script":"img",v=l?"script":u,w=Array.isArray||function(a){return"[object Array]"==o.call(a)},x=[],y={},z={timeout:function(a,b){return b.length&&(a.timeout=b[0]),a}},A,B;B=function(a){function b(a){var a=a.split("!"),b=x.length,c=a.pop(),d=a.length,c={url:c,origUrl:c,prefixes:a},e,f,g;for(f=0;f<d;f++)g=a[f].split("="),(e=z[g.shift()])&&(c=e(c,g));for(f=0;f<b;f++)c=x[f](c);return c}function g(a,e,f,g,h){var i=b(a),j=i.autoCallback;i.url.split(".").pop().split("?").shift(),i.bypass||(e&&(e=d(e)?e:e[a]||e[g]||e[a.split("/").pop().split("?")[0]]),i.instead?i.instead(a,e,f,g,h):(y[i.url]?i.noexec=!0:y[i.url]=1,f.load(i.url,i.forceCSS||!i.forceJS&&"css"==i.url.split(".").pop().split("?").shift()?"c":c,i.noexec,i.attrs,i.timeout),(d(e)||d(j))&&f.load(function(){k(),e&&e(i.origUrl,h,g),j&&j(i.origUrl,h,g),y[i.url]=2})))}function h(a,b){function c(a,c){if(a){if(e(a))c||(j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}),g(a,j,b,0,h);else if(Object(a)===a)for(n in m=function(){var b=0,c;for(c in a)a.hasOwnProperty(c)&&b++;return b}(),a)a.hasOwnProperty(n)&&(!c&&!--m&&(d(j)?j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}:j[n]=function(a){return function(){var b=[].slice.call(arguments);a&&a.apply(this,b),l()}}(k[n])),g(a[n],j,b,n,h))}else!c&&l()}var h=!!a.test,i=a.load||a.both,j=a.callback||f,k=j,l=a.complete||f,m,n;c(h?a.yep:a.nope,!!i),i&&c(i)}var i,j,l=this.yepnope.loader;if(e(a))g(a,0,l,0);else if(w(a))for(i=0;i (function(w,d,s,l,i){w[l]=w[l]||[];w[l].push({'gtm.start':new Date().getTime(),event:'gtm.js'});var f=d.getElementsByTagName(s)[0];var j=d.createElement(s);var dl=l!='dataLayer'?'&l='+l:'';j.src='//www.googletagmanager.com/gtm.js?id='+i+dl;j.type='text/javascript';j.async=true;f.parentNode.insertBefore(j,f);})(window,document,'script','dataLayer','GTM-P4HH5NV'); Skip to main content Home About Submit ALERTS / RSS Search for this keyword Advanced Search Health Information Exchanges (HIEs) as Novel Sources for Population-Based Post Marketing Surveillance of Medical Products: A Pilot Study from the FDA Sentinel Innovation Center Anjum Khurshid , David Kendrick , View ORCID Profile Haritha S. Pillai , Jenny Sun , Eliel Oliveira , Alexis Jaquish , Sarah K. Dutcher , Patricia Bright , Youjin Wang , Jie Li , Tiffany Austin , Patrick J. Heagerty , View ORCID Profile Michael E. Matheny , Sebastian Schneeweiss , Rishi J. Desai doi: https://doi.org/10.1101/2025.08.13.25333515 Anjum Khurshid 1 Department of Population Medicine, Harvard Pilgrim Health Care Institute and Harvard Medical School , Boston, MA MD, PhD Find this author on Google Scholar Find this author on PubMed Search for this author on this site David Kendrick 2 MyHealth Access Network , Tulsa, OK, USA MD, MPH, FACP Find this author on Google Scholar Find this author on PubMed Search for this author on this site Haritha S. Pillai 3 Division of Pharmacoepidemiology and Pharmacoeconomics, Department of Medicine, Brigham and Women’s Hospital and Harvard Medical School , Boston, MA, USA MPH Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Haritha S. Pillai Jenny Sun 2 MyHealth Access Network , Tulsa, OK, USA PhD Find this author on Google Scholar Find this author on PubMed Search for this author on this site Eliel Oliveira 4 Connxus , Austin, TX, USA MBA, MSc, FAMIA Find this author on Google Scholar Find this author on PubMed Search for this author on this site Alexis Jaquish 1 Department of Population Medicine, Harvard Pilgrim Health Care Institute and Harvard Medical School , Boston, MA Find this author on Google Scholar Find this author on PubMed Search for this author on this site Sarah K. Dutcher 5 Office of Surveillance and Epidemiology, Center for Drug Evaluation and Research, United States Food and Drug Administration , Silver Spring, MD, USA MS, PhD Find this author on Google Scholar Find this author on PubMed Search for this author on this site Patricia Bright 5 Office of Surveillance and Epidemiology, Center for Drug Evaluation and Research, United States Food and Drug Administration , Silver Spring, MD, USA PhD Find this author on Google Scholar Find this author on PubMed Search for this author on this site Youjin Wang 5 Office of Surveillance and Epidemiology, Center for Drug Evaluation and Research, United States Food and Drug Administration , Silver Spring, MD, USA PhD Find this author on Google Scholar Find this author on PubMed Search for this author on this site Jie Li 5 Office of Surveillance and Epidemiology, Center for Drug Evaluation and Research, United States Food and Drug Administration , Silver Spring, MD, USA PhD Find this author on Google Scholar Find this author on PubMed Search for this author on this site Tiffany Austin 5 Office of Surveillance and Epidemiology, Center for Drug Evaluation and Research, United States Food and Drug Administration , Silver Spring, MD, USA MPH Find this author on Google Scholar Find this author on PubMed Search for this author on this site Patrick J. Heagerty 6 Department of Biostatistics, University of Washington , Seattle, WA, USA MS, PhD Find this author on Google Scholar Find this author on PubMed Search for this author on this site Michael E. Matheny 7 Department of Biomedical Informatics, Vanderbilt University Medical Center , Nashville, TN, USA MD, MS, MPH Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Michael E. Matheny Sebastian Schneeweiss 3 Division of Pharmacoepidemiology and Pharmacoeconomics, Department of Medicine, Brigham and Women’s Hospital and Harvard Medical School , Boston, MA, USA MD, ScD Find this author on Google Scholar Find this author on PubMed Search for this author on this site Rishi J. Desai 3 Division of Pharmacoepidemiology and Pharmacoeconomics, Department of Medicine, Brigham and Women’s Hospital and Harvard Medical School , Boston, MA, USA MS, PhD Find this author on Google Scholar Find this author on PubMed Search for this author on this site Abstract Full Text Info/History Metrics Data/Code Preview PDF Abstract Introduction Health information exchanges (HIEs) provide the capability to electronically move health care information among different health care information systems and store these data for downstream use cases. However, use of data from HIEs for postmarketing surveillance of medical products is not previously explored. Objectives To conduct a pilot descriptive study characterizing data from MyHealth Access Network - a statewide HIE for Oklahoma, to understand its utility for conducting pharmacoepidemiology studies. Materials and methods MyHealth Access Network connects 95% of all hospital activity, 100% of federally qualified health center activity, and most community behavioral health clinics, tribal health systems, and independent providers in the state. As a use case to understand data in MyHealth Access Network, we characterized patients with Type 2 Diabetes Mellitus (T2DM), aged 18 years or older and treated with one of two common antidiabetic drug classes: Sodium-Glucose Co-Transporter 2 inhibitors (SGLT-2i) and Dipeptidyl Peptidase 4 inhibitors (DPP-4i) in a new user cohort design. A cohort entry date was defined based on records of medication initiation for either of the two drug classes, using dispensing data from insurance claims (when available) or prescribing data from electronic health records (EHRs) when claims were not available. Patient characteristics including demographics, comorbidities, comedications, clinical and lifestyle related factors, and healthcare utilization factors were summarized for the two exposure groups. Results A total of 76,018 DPP-4i initiators and 101,599 SGLT-2i initiators met our inclusion criteria. The mean age was 59 years and nearly half were women in both the groups. While there was a large proportion of those with missing race information (32% DPP-4i, 24% SGLT-2i), a majority were White (47% DPP-4i, 57% SGLT-2i). The second most reported race category was American Indian or Alaskan Natives (13% DPP-4i, 9.9% SGLT-2i), which is in line with their representation in the 2024 US Census for Oklahoma. Hemoglobin A1c (HbA1c) results were available for 63% and 66% of the DPP-4i and SGLT-2i groups with mean + SD of 8.1+ 1.9% and 8.2 + 1.9%, respectively. Serum creatinine was recorded for 67% DPP-4i and 70% SGLT-2i initiators with mean + SD of 1.30 + 1.01 mg/dL and 1.14 + 0.64 mg/dL, respectively. Discussion HIEs may offer a promising resource for population-based postmarketing surveillance of medical products owing to their comprehensive capture of information across various healthcare settings. 1. Introduction Fragmentation in the U.S. healthcare system poses critical challenges for both patient level care coordination and population level research. A 2007 analysis of Medicare data reported that patients visited, on average, more than 7 different healthcare providers annually, and that, on average, primary care providers serving a panel of patients found themselves coordinating care among 225 other providers in 117 other organizations.[ 1 ] As the adoption of electronic health records (EHR) by eligible providers and hospitals in the U.S. healthcare system surged following significant investments through the Health Information Technology for Economic and Clinical Health (HITECH) Act, the need to facilitate seamless exchange of clinical data securely across disparate competing EHR systems and provider organizations was clearly recognized.[ 2 ] As described in the Office of the National Coordinator for Health IT (ONC) Roadmap for Nationwide Interoperability (2015)[ 3 ], “every patient deserves to have their complete, longitudinal health record available where and when they need it for decisions about their care”. As a result, approximately 3% of HITECH funding supported the dramatic expansion of state and regional health information exchanges (HIEs) throughout the country.[ 4 ] The primary purposes of HIEs is to promote interoperability and coordination of care. Implementing and operationalizing this mission has been done by creating trusted regional networks where the silos of data, existing due to the fragmented nature of healthcare delivery, are connected through a governed, secure, central exchange platform. Since many of these exchanges also maintain the exchanged clinical documents and patient records in a centralized clinical data repository, over the years, these HIEs have become a comprehensive source of longitudinal, population level, linked EHR data in the country.[ 5 ] Almost all states in the U.S. have a statewide HIE or multiple regional HIEs. A recent survey funded by the ONC has reported about 80 fully operational HIEs in the country with an average data repository comprising more than four million unique patients with data going back to around 15 years in some cases. [ 6 , 7 ] These HIEs are mostly non-profit entities with a multistakeholder community governance. They maintain a robust technical infrastructure to create bidirectional data interfaces with large and small hospitals, federally qualified health clinics, physician practices, Emergency Medical Services (EMS), behavioral health providers, pharmacies, laboratories, and public health clinics among other types of organizations that are sources of health-related data. These interfaces allow for exchange of detailed clinical data through secure connections using FHIR APIs (Fast Health Interoperability Resources Application Programming Interfaces), HL7 (Health Level 7) interfaces, CCD (Continuity of Care Documents), or even flat files (.csv).[ 8 ] Importantly, HIEs maintain governance and compliance required to build trust in the privacy and confidentiality of sensitive clinical data. The HIEs store and use this data as Business Associate Agreement (BAA) partners for all providers connected to them and fully comply with HIPAA (Health Insurance Portability and Accountability Act, 1996) and other federal, state and local laws.[ 9 ] There are also continuous data quality and data integrity assurance processes[ 10 ] implemented in all major HIEs. This broad technical infrastructure has matured over the last decade, making HIEs an attractive source of large-scale EHR data that is ready to be leveraged for multiple important use cases. However, historically HIEs have been underutilized for conducting public health surveillance, pharmacoepidemiologic studies, and population outcomes research.[ 11 ] The Sentinel Initiative is a key component of the U.S. Food and Drug Administration’s (FDA) postmarket surveillance for approved medical products. Results from Sentinel investigations are routinely used to support the FDA in regulatory decision making.[ 12 ] The Sentinel System, a national medical product safety surveillance system within the Sentinel Initiative, has historically relied on large volumes of insurance claims data but more recently has developed an infrastructure linking EHRs with insurance claims to address questions related to medical product use and associated outcomes using more granular clinical information captured in EHRs.[ 13 , 14 ] The new infrastructure, the Real World Evidence Data Enterprise (RWE-DE), comprises linked claims-EHR data for 26 million individuals from six data sources involving four academic partner institutions (three tertiary care centers-Mass General Brigham, Vanderbilt University Medical Center, Duke University Health Systems, and an integrated care delivery network-Kaiser Permanente-Washington) collectively termed the Development Network and two commercial data networks (HealthVerity, TriNetX) collectively termed the Commercial Network.[ 14 ] While a major step forward, the RWE-DE may benefit from inclusion of additional data sources to increase the total population covered and availability of near-real time information. Additionally, all current sources face challenges in EHR data continuity due to the fragmentation of care described above. To explore the potential of HIEs for addressing some of these challenges, we initiated a pilot study with MyHealth Access Network-a statewide HIE from Oklahoma, to implement a descriptive analysis of initiators of two antidiabetic medications to reflect a typical Sentinel query. In this article, we describe the learnings from the pilot and discuss considerations for future use of HIEs as novel sources for population-based pharmacoepidemiology research and postmarketing surveillance of medical products. 2. Methods 2.1 Data source MyHealth Access Network is a non-profit organization and Oklahoma’s State Designated Entity for Health Information Exchange that connects 95% of all hospital activity, 100% of federally qualified health center activity, and most community behavioral health clinics, tribal health systems, and independent providers in the state.[ 15 ] It connects to more than 500 unique healthcare entities including independent pharmacies, emergency medical services (EMS), social services organizations, organ procurement organizations, Oklahoma Office of the Chief Medical Examiner, and health plans in the area. The HIE has a clinical data repository that goes back to encounters captured since 2011 and provides the most complete and near real-time access to population-level healthcare and social needs data for the over 4 million residents of Oklahoma. These data are standardized and linked across all providers into a unique unduplicated record for each patient. We used data from January 2016 to December 2023 available in MyHealth Access Network, which also included linked EHR data to claims data from three of the health plans. 2.2 Study design We conducted a descriptive medical product utilization query (similar to a ‘Type 5’ query in the Sentinel Routine Querying tools)[ 16 ]-to identify and characterize patients with Type 2 Diabetes Mellitus (T2DM) treated with two common antidiabetic drug classes: Sodium-Glucose Co-Transporter 2 inhibitors (SGLT-2i) and Dipeptidyl Peptidase 4 inhibitors (DPP-4i) in a new user cohort design. Patients entered the cohort on a cohort entry date (CED) based on records of medication initiation for either of the two drug classes, using dispensing data from insurance claims (when available) or prescribing data from EHRs when claims were not available. Patients were required to be aged 18 years or older, have a diagnosis of type 2 diabetes mellitus, and have some EHR activity (operationalized as having any data available from EHRs any time prior to index date) to ensure adequate contact with the healthcare system and capture of clinical codes to measure baseline characteristics. Since the focus of this query was on patients with type 2 diabetes mellitus, we excluded patients with a diagnosis of type 1 diabetes mellitus. 2.3. Variables We assessed demographic characteristics (age, sex, race, ethnicity and year of cohort entry); diabetes-related factors including duration of diabetes (operationalized as the time between the first diagnosis codes found in the data and cohort entry) and use of other antihyperglycemic medications; a range of comedications and comorbid conditions; laboratory test results and other clinical parameters including serum creatinine, hemoglobin A1c (HbA1c), total cholesterol, high density lipoprotein (HDL), low density lipoprotein (LDL), and left ventricular ejection fraction (LVEF); vital signs (heart rate, blood pressure), body mass index (BMI), and lifestyle factors (any smoking status, alcohol use, drug misuse or abuse). All variables were assessed in a 365-day baseline period prior to the cohort entry date, unless otherwise specified. For laboratory tests, clinical parameters, and vital signs, values closest to the cohort entry were used for patients with multiple recordings in the baseline period. Standardized coding terminology including national drug codes (NDCs) and RxNorm Concept Unique Identifier (RxCUI) for medications with drug mechanism classifications determined by manual mapping, Logical Observational Identifiers Names and Codes (LOINC) for laboratory tests, international classification of diseases (ICD)-10-CM codes for diagnoses, and current procedural terminology (CPT) codes (with modifiers) to assess in-person healthcare utilization were used to identify relevant information in each domain. 2.4 Statistical analysis We used basic descriptive statistics to summarize all characteristics for each of the two exposure groups using percentages for categorical variables and means (standard deviations) for quantitative measures. We also reported the proportion of individuals in each group who had at least one in-person EHR encounter in 30, 90, 180, and 365 days prior to the cohort entry to contextualize routine flow of information in the HIE. 2.5 Ethics review This Sentinel project is a public health surveillance activity conducted under the authority of the Food and Drug Administration and, accordingly, is not subject to Institutional Review Board oversight.[ 17 - 19 ] Additionally, the HIE governance committee comprising local stakeholders and data contributors, reviewed and approved the secondary use of the data for this query. 3. Results Figure 1 . shows the total number of DPP-4i and SGLT-2i initiators with type 2 diabetes mellitus along with source of the prescription information on their cohort entry date. A total of 76,018 DPP-4i initiators and 101,599 SGLT-2i initiators met our inclusion criteria, a majority of whom were included based on prescription orders found in EHRs. Figure 2 outlines information sources for the two exposure groups during the study period. A large majority (63.0% and 60.1% for DPP-4i and SGLT-2i groups, respectively) were identified from EHR data alone and did not appear in any of the three claims datasets. A total of 15.7% and 20.1% for DPP-4i and SGLT-2i, respectively had information in both EHRs and claims from one or more of the three payers. Notably, a small subset of patients (0.003% and 0.01% for DPP-4i and SGLT-2i) existed in all three payer datasets and EHR at some point of time for both DPP-4i and SGLT-2i initiators, which highlights the issue of frequent changes in individuals’ insurance coverage over time with claims data sources. Download figure Open in new tab Figure 1. Final cohort of DPP-4i and SGLT-2i initiators with type 2 diabetes mellitus along with data source (EHR versus claims) Download figure Open in new tab Figure 2. Claims versus EHR overlap of DPP-4i and SGLT-2i initiators with type 2 diabetes mellitus Patient demographics, medication use, and comorbid diagnoses Table 1 summarizes the demographic characteristics of the DPP-4i and SGLT-2i initiators. The mean age was 59 years in each of the cohorts with the largest group of patients falling within the age category of 55-64 years (30%, 32% respectively). About half of the patients were female in both the cohorts (49%, 45% respectively). Less than 0.05% of patients had missing data for age and sex. While information on race was unknown or missing for 32% of the DPP-4i initiators and 24% of SGLT-2i initiators, a majority of patients were White in both the cohorts (47%, 57% respectively); the second most reported race category was American Indian or Alaskan Natives, representing 13% and 9.9%, respectively. A total of 8.5% of the DPP-4i initiators and 7.5% of the SGLT-2i initiators were of Hispanic origin. View this table: View inline View popup Download powerpoint Table 1. Demographic characteristics of the DPP-4i and SGLT-2i initiators with type 2 diabetes mellitus Table 2 provides information on diabetes duration, comedications, and comorbid conditions. Most patients had a diagnosis of Type 2 DM for 1-5 years at the time of cohort entry across both DPP-4i initiators and SGLT-2i initiators (39%, 48%). Among other antidiabetic medications, metformin was most common, followed by sulfonylureas. GLP1 agonists were much more frequently used by SGLT-2i initiators (19% vs 6.3%). Angiotensin converting enzyme inhibitors and angiotensin receptor blockers were the most common co-medications in both the groups (42%, 52%) and hypertension was the most frequent comorbid diagnosis (32%, 45%). View this table: View inline View popup Table 2. Diabetes duration, comedications, and comorbidities observed in the DPP-4i and SGLT-2i initiators with type 2 diabetes mellitus Table 3 summarizes information on laboratory test results, lifestyle factors and vital signs. HbA1c results were available for 63% and 66% of the DPP-4i and SGLT-2i groups, respectively with mean + SD of 8.1+ 1.9% and 8.2 + 1.9%. Serum creatinine was recorded for 67% of DPP-4i and 70% of SGLT-2i initiators. The mean serum creatinine values were 1.30 + 1.0 mg/dL and 1.14 + 0.6 mg/dL for DPP-4i and SGLT-2i initiators respectively. Substance use including smoking status, alcohol use, and drug misuse/abuse was recorded for 5-23% of the patients across both DPP-4i and SGLT-2i initiators. BMI was recorded for 28.4% of the DPP-4i initiators (mean = 33.4 + 8.0 kg/m 2 ) and 46% of the SGLT-2i initiators (mean = 34.1 + 8.0 kg/m 2 ). Heart rate and blood pressure had similar mean values across both groups, with measurements recorded for 25-35% of DPP-4i initiators, and a higher proportion (45-50%) of SGLT-2i initiators. View this table: View inline View popup Table 3. Clinical characteristics, lifestyle factors, and vital signs of the DPP-4i and SGLT-2i initiators with type 2 diabetes mellitus Table 4 summarizes healthcare utilization-related information. We observed that 64% of the DPP-4i initiators and 76 % of the SGLT-2i initiators had at least 1 in-person encounter in the 365 days prior to the cohort entry. This proportion was consistent when restricting to past 180 days (62 %, 74 %), 90 days (60 %, 72 %), and 30 days (55 %, 67 %). View this table: View inline View popup Download powerpoint Table 4. Healthcare utilization features of the DPP-4i and SGLT-2i initiators with type 2 diabetes mellitus 4. Discussion In this study, we observed that it was feasible to create patient cohorts using near real-time EHR data to describe initiators of medications using data from an HIE. We noted that capture of important clinical data elements such as HbA1c was comparable or more complete than diabetic cohorts from other EHR sources from the US.[ 20 - 22 ] Importantly, traditionally underrepresented racial groups such as American Indians were represented in line with their representation in the 2024 US Census for Oklahoma (10-13% in this study, 9.5% in the US Census)[ 23 ], which highlights the truly population-based nature of HIEs. HIEs offer certain benefits that make them a promising resource for future use in national medical product surveillance systems like Sentinel for pharmacoepidemiology evaluations. First, since most HIEs are community-governed with a not-for-profit status and funding from public sources (state and federal health departments), they are quite efficient in terms of cost to acquire data for surveillance and research. As the source of almost real-time data on an entire population, HIEs may help to study emergent infections, adverse events for newly used treatments, and geographical coverage within the covered regions in a timely and comprehensive manner. Many HIEs also store unstructured data, like clinical notes, creating a valuable resource to develop and test natural language processing algorithms and large language models.[ 24 ] Increasingly, HIEs are expanding their role to collect nonmedical data such as social needs assessments, social services referrals, and criminal justice, environmental, and housing data to become health data utilities (HDUs) for their state or region, much like the energy or public transportation utilities that provide the service for multiple uses by consumers.[ 25 ] Some states have also passed legislation to mandate contribution of health and social services data to their HDUs to help state-level public health and Medicaid better coordinate, monitor, and evaluate care for its population. This rich and comprehensive data under a community-governed entity, which has high levels of technical expertise to curate representative population level data of clinical and non-clinical factors, is primed to help study health equity issues in much better detail than in any other dataset of this size and coverage.[ 26 ] One of the most important requirements for conducting causal inference studies with longitudinal health records is the availability of EHR data without ‘information leakage’ that is common in traditional EHR sources from a single healthcare system because patients frequently seek care outside of the system.[ 27 ] A key service provided by HIEs is that of maintaining a master patient index that links all the various medical records across the fragmented health delivery system into one master record, thus saving a huge effort in deduplicating and linking clinical records for subsequent analysis. The ability to maintain a truly longitudinal patient record across healthcare systems makes HIEs an attractive data resource to conduct studies that require long term follow-up and consistent data availability over the course of a treatment or a disease. In the analysis of healthcare utilization, we observed that about 60-70% patients included in the current study had an in-person EHR visit in 365 days, 180 days, and 30 days prior to the medication initiation date, which suggests that HIEs have a stable pool of patients with consistent flow of EHR information. Some governance related aspects of HIE data merit a discussion. While a single patient-level record can be shared across the network for treatment, payment, and operations for authorized users with an established relationship with that patient, the secondary use of these data for research and surveillance has established policies that vary across HIEs. These policies are largely focused on patient privacy and agreed upon governance policies with data contributors. Secondary use data sharing for public health, epidemiological studies, and population health research is determined on a case-by-case basis. Most HIEs will allow use of data for public health surveillance activities, but in many cases, use of data for research requires appropriate IRB supervision and may require patient consent for sharing any protected health information. We also acknowledge some important limitations of our current work. First, we only explored a single HIE in Oklahoma which is a relatively mature and sophisticated HIE with a legislative mandate from the state. HIEs across the country differ in significant ways in terms of their geographical and clinical data capture as well as their ability to link to other sources like insurance claims. However, many of the features described for MyHealth Access are likely to be representative of larger state level and regional HIEs, some with much larger populations such as in New York, California, Michigan, and Texas. Second, we only focused on a descriptive study of relatively commonly used medication classes, which precludes generalizable conclusions regarding completeness of information for more rare conditions or medications. However, it is reasonable to hypothesize that if there is a method of connecting a consortium of HIEs from across the country to act as a distributed network with a common data model and quality assurance, as established in the Sentinel Distributed Network, this limitation may be adequately addressed through a geographically and socioeconomically representative cohort from across the country. A preliminary feasibility study for such a consortium of HIEs to support pharmacoepidemiology and population health studies is already underway and showing encouraging results.[ 28 ] In conclusion, the HIE network has grown over the last decade at the local, regional, and national level. Our pilot study conducted in partnership with MyHealth Access Network suggests that data from HIEs may offer a promising resource for conducting population-based postmarketing surveillance of medical products with EHR data. Data Availability The data that support the findings of this study are not publicly available due to privacy restrictions. Statements and Declarations Funding Acknowledgements This project was supported by Master Agreement 75F40119D10037 from the US Food and Drug Administration (FDA). FDA coauthors reviewed the study protocol, statistical analysis plan, and the manuscript for scientific accuracy and clarity of presentation. Representatives of the FDA reviewed a draft of the manuscript for presence of confidential information and accuracy regarding statement of any FDA policy. The views expressed are those of the authors and not necessarily those of the U.S. FDA. Competing Interests Dr. Khurshid and Eliel Oliveira are co-founders of Pulsar Health, a software IT company. Dr. Desai reports serving as Principal Investigator on investigator-initiated grants to the Brigham and Women’s Hospital from Novartis, Vertex, and Bayer on unrelated projects. Dr. Schneeweiss is co-principal investigator of an investigator-initiated grant to the Brigham and Women’s Hospital from Boehringer Ingelheim unrelated to the topic of this study. He is a consultant to Aetion Inc., a software manufacturer of which he owns equity. His interests were declared, reviewed, and approved by the Brigham and Women’s Hospital and MGB HealthCare System in accordance with their institutional compliance policies. All other authors have no conflicts of interest to disclose relative to this work. References 1. ↵ Pham HH , Schrag D , O’Malley AS , Wu B , Bach PB . Care Patterns in Medicare and Their Implications for Pay for Performance . New England Journal of Medicine . 2007 -03-15; 356 ( 11 ) doi: 10.1056/NEJMsa063979 OpenUrl CrossRef PubMed Web of Science 2. ↵ What is the HITECH Act? The HIPAA Journal . https://www.hipaajournal.com/what-is-the-hitech-act/ 3. ↵ Office of the National Coordinator for Health Information Technology. Connecting Health and Care for the Nation: A Shared Nationwide Interoperability Roadmap . https://www.healthit.gov/sites/default/files/ONC2015-Interop-Roadmap.pdf 4. ↵ State Health Information Exchange Cooperative Agreement Program . https://www.healthit.gov/topic/onc-hitech-programs/state-health-information-exchange 5. ↵ Holmgren AJ , Esdar M , Hüsers J , Coutinho-Almeida J. Health Information Exchange: Understanding the Policy Landscape and Future of Data Interoperability . Yearbook of Medical Informatics . 2023 /08; 32 ( 01 ) doi: 10.1055/s-0043-1768719 OpenUrl CrossRef 6. ↵ Civitas Networks for Health . Key Learnings from the National Health Information Organization Survey Resultsl] https://www.civitasforhealth.org/learnings-from-national-hio-survey-results/ 7. ↵ Everson J , Chang W , Patel V , Adler-Milstein J. The state of health information organizations and plans to participate in the federal exchange framework . Health Affairs Scholar . 2024 /08/02; 2 ( 8 ) doi: 10.1093/haschl/qxae098 OpenUrl CrossRef 8. ↵ The Office of the National Coordinator for Health Information Technology . What Is HL7 FHIR? https://www.healthit.gov/ 9. ↵ U.S. Department of Health and Human Services . HIPAA, Health Information Exchanges, and Disclosures of Protected Health Information for Public Health Purposes . https://www.hhs.gov/sites/default/files/hie-faqs.pdf 10. ↵ Garg N , Kuperman G , Onyile A , et al. Validating Health Information Exchange (HIE) Data For Quality Measurement Across Four Hospitals . AMIA Annual Symposium . 2014 ; 2014 : 573 – 579 OpenUrl 11. ↵ Yeager VA , Vest JR , Walker D , Diana ML , Menachemi N. Challenges to Conducting Health Information Exchange Research and Evaluation: Reflections and Recommendations for Examining the Value of HIE . eGEMs . 2017 Sep 4; 5 ( 1 ) doi: 10.5334/egems.217 OpenUrl CrossRef 12. ↵ Maro JC , Nguyen MD , Kolonoski J , et al. Six Years of the US Food and Drug Administration’s Postmarket Active Risk Identification and Analysis System in the Sentinel Initiative: Implications for Real World Evidence Generation . Clinical Pharmacology & Therapeutics . 2023 /10/01; 114 ( 4 ) doi: 10.1002/cpt.2979 OpenUrl CrossRef 13. ↵ Brown JS , Mendelsohn AB , Nam YH , et al. The US Food and Drug Administration Sentinel System: a national resource for a learning health system . Journal of the American Medical Informatics Association . 2022 /11/14; 29 ( 12 ) doi: 10.1093/jamia/ocac153 OpenUrl CrossRef 14. ↵ Desai RJ , Marsolo K , Smith J , et al. The FDA Sentinel Real World Evidence Data Enterprise (RWE-DE) . Pharmacoepidemiology and Drug Safety . 2024 /10/01; 33 ( 10 ) doi: 10.1002/pds.7002815 . OpenUrl CrossRef 15. ↵ MyHealth Access Network . https://myhealthaccess.net/ 16. ↵ Sentinel . Sentinel Routine Querying System Overview . https://dev.sentinelsystem.org/projects/SENTINEL/repos/sentinel-routine-querying-tool-documentation/browse/files/file160-type05-medprodutil.md 17. ↵ Basic HHS Policy for Protection of Human Research Subjects, 45 CFR §46.102(l)(2) . Accessed April 14, 2025 , 2025 . https://www.ecfr.gov/current/title-45/subtitle-A/subchapter-A/part-46/subpart-A#46.102 18. U.S. Department of Health and Human Services. Federal Policy for the Protection of Human Subjects. 82 Fed Reg 7149. January 19 , 2017 ; 19. ↵ Rosati K , Jorgensen NS , Melissa, Evans BJ . Sentinel Initiative Principles and Policies: HIPAA and Common Rule Compliance in the Sentinel Initiative . February 01, 2018 ; 20. ↵ Nanna MG , Kolkailah AA , Page C , Peterson ED , Navar AM . SGLT2i and GLP-1 RA in Patients With Diabetes and Cardiovascular Disease . JAMA Cardiology . 2023 /01/01; 8 ( 1 ) doi: 10.1001/jamacardio.2022.3839 OpenUrl CrossRef 21. Kukhareva PV , Facelli JC , O’Brien MJ , et al. Racial and Ethnic Disparities in Prescribing of GLP-1 Receptor Agonists in the United States: A Retrospective Cohort Analysis -PubMed . medRxiv : the preprint server for health sciences . 11/01/ 2024 ; doi: 10.1101/2024.10.28.24316312 OpenUrl Abstract / FREE Full Text 22. ↵ Li Y , Hu H , Zheng Y , et al. Impact of Contextual-Level Social Determinants of Health on Newer Antidiabetic Drug Adoption in Patients with Type 2 Diabetes . International Journal of Environmental Research and Public Health 2023, Vol 20, Page 4036 . 2023 -02-24; 20 ( 5 ) doi: 10.3390/ijerph2005403623 . OpenUrl CrossRef 23. ↵ United States Census Bureau . https://www.census.gov/quickfacts/fact/table/OK 24. ↵ Alkasir A , Seidman G , Ritzo J , Bari L , Khurshid A. The Role of Health Data Utilities in Supporting Health AI . NEJM AI . 2024 ; 1 ( 10 ) doi: 10.1056/AIpc2400401 OpenUrl CrossRef 25. ↵ Civitas Networks for Health . Health Data Utility Framework – A Guide to Implementation . https://www.civitasforhealth.org/hduframework/ 26. ↵ Khurshid A , Sarkar IN . The health data utility and the resurgence of health information exchanges as a national resource - PubMed . Journal of the American Medical Informatics Association : JAMIA . 2025 ; doi: 10.1093/jamia/ocaf032 OpenUrl CrossRef 27. ↵ Schneeweiss S , Desai RJ , Ball R. Invited commentary: A future of data-rich pharmacoepidemiology studiestransitioning to large-scale linked EHR+claims data . Am J Epidemiol . Jul 16 2024 ; doi: 10.1093/aje/kwae226 OpenUrl CrossRef 28. ↵ American Medical Informatics Association-Enhancing Public Health Insights with HIE (Health Information Exchange) Data . https://amia.secure-platform.com/symposium/solicitations/102001/sessiongallery/schedule/items/94086 View the discussion thread. Back to top Previous Next Posted August 19, 2025. Download PDF Data/Code Email Thank you for your interest in spreading the word about medRxiv. NOTE: Your email address is requested solely to identify you as the sender of this article. Your Email * Your Name * Send To * Enter multiple addresses on separate lines or separate them with commas. You are going to email the following Health Information Exchanges (HIEs) as Novel Sources for Population-Based Post Marketing Surveillance of Medical Products: A Pilot Study from the FDA Sentinel Innovation Center Message Subject (Your Name) has forwarded a page to you from medRxiv Message Body (Your Name) thought you would like to see this page from the medRxiv website. Your Personal Message CAPTCHA This question is for testing whether or not you are a human visitor and to prevent automated spam submissions. Share Health Information Exchanges (HIEs) as Novel Sources for Population-Based Post Marketing Surveillance of Medical Products: A Pilot Study from the FDA Sentinel Innovation Center Anjum Khurshid , David Kendrick , Haritha S. Pillai , Jenny Sun , Eliel Oliveira , Alexis Jaquish , Sarah K. Dutcher , Patricia Bright , Youjin Wang , Jie Li , Tiffany Austin , Patrick J. Heagerty , Michael E. Matheny , Sebastian Schneeweiss , Rishi J. Desai medRxiv 2025.08.13.25333515; doi: https://doi.org/10.1101/2025.08.13.25333515 Share This Article: Copy Citation Tools Health Information Exchanges (HIEs) as Novel Sources for Population-Based Post Marketing Surveillance of Medical Products: A Pilot Study from the FDA Sentinel Innovation Center Anjum Khurshid , David Kendrick , Haritha S. Pillai , Jenny Sun , Eliel Oliveira , Alexis Jaquish , Sarah K. Dutcher , Patricia Bright , Youjin Wang , Jie Li , Tiffany Austin , Patrick J. Heagerty , Michael E. Matheny , Sebastian Schneeweiss , Rishi J. Desai medRxiv 2025.08.13.25333515; doi: https://doi.org/10.1101/2025.08.13.25333515 Citation Manager Formats BibTeX Bookends EasyBib EndNote (tagged) EndNote 8 (xml) Medlars Mendeley Papers RefWorks Tagged Ref Manager RIS Zotero Tweet Widget Facebook Like Google Plus One Subject Area Pharmacology and Therapeutics Subject Areas All Articles Addiction Medicine (569) Allergy and Immunology (863) Anesthesia (300) Cardiovascular Medicine (4442) Dentistry and Oral Medicine (444) Dermatology (383) Emergency Medicine (609) Endocrinology (including Diabetes Mellitus and Metabolic Disease) (1511) Epidemiology (15230) Forensic Medicine (30) Gastroenterology (1126) Genetic and Genomic Medicine (6610) Geriatric Medicine (668) Health Economics (998) Health Informatics (4542) Health Policy (1370) Health Systems and Quality Improvement (1613) Hematology (543) HIV/AIDS (1266) Infectious Diseases (except HIV/AIDS) (15923) Intensive Care and Critical Care Medicine (1103) Medical Education (623) Medical Ethics (147) Nephrology (668) Neurology (6607) Nursing (346) Nutrition (999) Obstetrics and Gynecology (1146) Occupational and Environmental Health (957) Oncology (3338) Ophthalmology (974) Orthopedics (369) Otolaryngology (420) Pain Medicine (436) Palliative Medicine (130) Pathology (665) Pediatrics (1693) Pharmacology and Therapeutics (692) Primary Care Research (712) Psychiatry and Clinical Psychology (5448) Public and Global Health (9239) Radiology and Imaging (2202) Rehabilitation Medicine and Physical Therapy (1370) Respiratory Medicine (1196) Rheumatology (596) Sexual and Reproductive Health (714) Sports Medicine (530) Surgery (712) Toxicology (99) Transplantation (289) Urology (265) (function(){function c(){var b=a.contentDocument||a.contentWindow.document;if(b){var d=b.createElement('script');d.innerHTML="window.__CF$cv$params={r:'a01fc53f19d5197c',t:'MTc3OTgyOTg2Nw=='};var a=document.createElement('script');a.src='/cdn-cgi/challenge-platform/scripts/jsd/main.js';document.getElementsByTagName('head')[0].appendChild(a);";b.getElementsByTagName('head')[0].appendChild(d)}}if(document.body){var a=document.createElement('iframe');a.height=1;a.width=1;a.style.position='absolute';a.style.top=0;a.style.left=0;a.style.border='none';a.style.visibility='hidden';document.body.appendChild(a);if('loading'!==document.readyState)c();else if(window.addEventListener)document.addEventListener('DOMContentLoaded',c);else{var e=document.onreadystatechange||function(){};document.onreadystatechange=function(b){e(b);'loading'!==document.readyState&&(document.onreadystatechange=e,c())}}}})();

Text is read by the "Ask this paper" AI Q&A widget below. Extraction quality varies by source — PMC NXML preserves structure cleanly, OA-HTML may include some navigation residue, and OA-PDF can have broken hyphenation. The publisher copy (via DOI) is the canonical version.

My notes (saved in your browser only)

Ask this paper AI returns verbatim quotes from the full text · source: preprint-html

Answers must be backed by verbatim quotes from this paper's full text. Hallucinated quotes are dropped automatically; if no verbatim passage answers the question, we say so. How this works

Citation neighborhood (no data yet)

We don't have any in-corpus citations linked to this paper yet. This is a recent paper (2025) — citers typically take a year or two to land, and the OpenAlex reference graph may still be filling in.

Source provenance

europepmc
last seen: 2026-05-20T01:45:00.602351+00:00