Simulated sample splitting approach to address biases due to instrument selection and participant overlap in two-sample Mendelian Randomization studies

doi:10.1101/2025.11.04.686460

Simulated sample splitting approach to address biases due to instrument selection and participant overlap in two-sample Mendelian Randomization studies

2025 · doi:10.1101/2025.11.04.686460

preprint OA: closed

📄 Open PDF Full text JSON View at publisher

Full text 58,865 characters · extracted from preprint-html · click to expand

Simulated sample splitting approach to address biases due to instrument selection and participant overlap in two-sample Mendelian Randomization studies | bioRxiv /* */ /* */ <!-- <!-- /*! * yepnope1.5.4 * (c) WTFPL, GPLv2 */ (function(a,b,c){function d(a){return"[object Function]"==o.call(a)}function e(a){return"string"==typeof a}function f(){}function g(a){return!a||"loaded"==a||"complete"==a||"uninitialized"==a}function h(){var a=p.shift();q=1,a?a.t?m(function(){("c"==a.t?B.injectCss:B.injectJs)(a.s,0,a.a,a.x,a.e,1)},0):(a(),h()):q=0}function i(a,c,d,e,f,i,j){function k(b){if(!o&&g(l.readyState)&&(u.r=o=1,!q&&h(),l.onload=l.onreadystatechange=null,b)){"img"!=a&&m(function(){t.removeChild(l)},50);for(var d in y[c])y[c].hasOwnProperty(d)&&y[c][d].onload()}}var j=j||B.errorTimeout,l=b.createElement(a),o=0,r=0,u={t:d,s:c,e:f,a:i,x:j};1===y[c]&&(r=1,y[c]=[]),"object"==a?l.data=c:(l.src=c,l.type=a),l.width=l.height="0",l.onerror=l.onload=l.onreadystatechange=function(){k.call(this,r)},p.splice(e,0,u),"img"!=a&&(r||2===y[c]?(t.insertBefore(l,s?null:n),m(k,j)):y[c].push(l))}function j(a,b,c,d,f){return q=0,b=b||"j",e(a)?i("c"==b?v:u,a,b,this.i++,c,d,f):(p.splice(this.i++,0,a),1==p.length&&h()),this}function k(){var a=B;return a.loader={load:j,i:0},a}var l=b.documentElement,m=a.setTimeout,n=b.getElementsByTagName("script")[0],o={}.toString,p=[],q=0,r="MozAppearance"in l.style,s=r&&!!b.createRange().compareNode,t=s?l:n.parentNode,l=a.opera&&"[object Opera]"==o.call(a.opera),l=!!b.attachEvent&&!l,u=r?"object":l?"script":"img",v=l?"script":u,w=Array.isArray||function(a){return"[object Array]"==o.call(a)},x=[],y={},z={timeout:function(a,b){return b.length&&(a.timeout=b[0]),a}},A,B;B=function(a){function b(a){var a=a.split("!"),b=x.length,c=a.pop(),d=a.length,c={url:c,origUrl:c,prefixes:a},e,f,g;for(f=0;f<d;f++)g=a[f].split("="),(e=z[g.shift()])&&(c=e(c,g));for(f=0;f<b;f++)c=x[f](c);return c}function g(a,e,f,g,h){var i=b(a),j=i.autoCallback;i.url.split(".").pop().split("?").shift(),i.bypass||(e&&(e=d(e)?e:e[a]||e[g]||e[a.split("/").pop().split("?")[0]]),i.instead?i.instead(a,e,f,g,h):(y[i.url]?i.noexec=!0:y[i.url]=1,f.load(i.url,i.forceCSS||!i.forceJS&&"css"==i.url.split(".").pop().split("?").shift()?"c":c,i.noexec,i.attrs,i.timeout),(d(e)||d(j))&&f.load(function(){k(),e&&e(i.origUrl,h,g),j&&j(i.origUrl,h,g),y[i.url]=2})))}function h(a,b){function c(a,c){if(a){if(e(a))c||(j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}),g(a,j,b,0,h);else if(Object(a)===a)for(n in m=function(){var b=0,c;for(c in a)a.hasOwnProperty(c)&&b++;return b}(),a)a.hasOwnProperty(n)&&(!c&&!--m&&(d(j)?j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}:j[n]=function(a){return function(){var b=[].slice.call(arguments);a&&a.apply(this,b),l()}}(k[n])),g(a[n],j,b,n,h))}else!c&&l()}var h=!!a.test,i=a.load||a.both,j=a.callback||f,k=j,l=a.complete||f,m,n;c(h?a.yep:a.nope,!!i),i&&c(i)}var i,j,l=this.yepnope.loader;if(e(a))g(a,0,l,0);else if(w(a))for(i=0;i (function(w,d,s,l,i){w[l]=w[l]||[];w[l].push({'gtm.start':new Date().getTime(),event:'gtm.js'});var f=d.getElementsByTagName(s)[0];var j=d.createElement(s);var dl=l!='dataLayer'?'&l='+l:'';j.src='//www.googletagmanager.com/gtm.js?id='+i+dl;j.type='text/javascript';j.async=true;f.parentNode.insertBefore(j,f);})(window,document,'script','dataLayer','GTM-M677548'); Skip to main content Home About Submit ALERTS / RSS Search for this keyword Advanced Search New Results Simulated sample splitting approach to address biases due to instrument selection and participant overlap in two-sample Mendelian Randomization studies View ORCID Profile Amanda Forde , View ORCID Profile Gibran Hemani , John Ferguson doi: https://doi.org/10.1101/2025.11.04.686460 Amanda Forde 1 School of Mathematical and Statistical Sciences, University of Galway , Galway, Ireland Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Amanda Forde For correspondence: amanda.forde{at}universityofgalway.ie Gibran Hemani 2 NIHR Bristol Biomedical Research Centre, University Hospitals Bristol and Weston NHS Foundation Trust and University of Bristol , Bristol, UK 3 MRC Integrative Epidemiology Unit (IEU), Bristol Medical School, University of Bristol , Bristol, UK Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Gibran Hemani John Ferguson 1 School of Mathematical and Statistical Sciences, University of Galway , Galway, Ireland Find this author on Google Scholar Find this author on PubMed Search for this author on this site Abstract Full Text Info/History Metrics Preview PDF Abstract Mendelian randomization (MR) is a popular statistical technique that uses genetic variants to explore causal relationships in observational epidemiology. Summary-level MR, the most common form, relies on published GWAS summary statistics to estimate causal effects between exposures and outcomes. However, empirical analyses tend to ignore issues relating to Winner’s Curse of instrument effects, weak instrument bias and sample overlap. Our simulations and empirical examinations using the UK Biobank indicate that such mechanisms can induce substantial bias in routine MR approaches. We propose MR Simulated Sample Splitting (MR-SimSS), a novel method that corrects this bias requiring no additional data beyond the exposure and outcome GWAS summary statistics under examination. It operates by simulating statistically independent sets of summary statistics, analogous to what would be produced by splitting the individual-level data into independent subsets, which can then be plugged into existing pleiotropy-robust MR methods. With sufficient instrument variants, MR-SimSS is robust to a range of sample overlap scenarios, providing a practical and modular solution to Winner’s Curse and weak instrument bias. Author summary A central challenge in epidemiology is determining whether an observed association reflects a true cause- and-effect relationship. Mendelian randomization (MR) addresses this by using genetic variants as natural experiments to test whether a particular trait or exposure genuinely influences disease risk. However, when the same genetic data are used both to select and to estimate genetic instruments, MR results can become biased due to a phenomenon known as the Winner’s Curse. This problem, along with weak instruments and sample overlap between datasets, can distort causal estimates even in large studies. We introduce MR Simulated Sample Splitting (MR-SimSS), a new framework that overcomes these issues using only publicly available genome-wide association study (GWAS) summary statistics. MR-SimSS works by statistically simulating independent subsets of the data, without requiring access to individual-level information, allowing existing MR methods to be applied without bias. Through extensive simulations and analyses using UK Biobank data, we show that MR-SimSS provides more accurate and reliable causal estimates, offering a practical tool for robust causal inference in modern genetic epidemiology. Introduction Mendelian randomization (MR) is a statistical framework that uses genetic variation to assess whether a modifiable exposure causally influences an outcome of interest, and to estimate the magnitude of this effect [ 1 ]. Since its advent, the use of MR in epidemiological research has grown exponentially, largely due to the limitations of traditional observational studies, such as unmeasured confounding and reverse causation [ 2 ]. MR capitalises on the principle that genetic variants are fixed at conception and randomly inherited, rendering MR analyses approximately analogous to ‘naturally occurring randomized trials’ [ 3 ]. It relies on instrumental variable (IV) estimation, where genetic variants serve as instruments. For a variant to be a valid IV, it must be associated with the exposure, independent of confounders and influence the outcome only through the exposure pathway [ 4 ]. With the widespread availability of large-scale GWAS summary data, most MR analyses now use a two-sample, or summary-level, design. This involves performing the MR analysis using publicly available estimates of variant-exposure and variant-outcome associations, along with their standard errors, typically derived from two non-overlapping, or partially overlapping, GWAS datasets [ 5 ]. Provided certain conditions hold and a valid genetic instrument is used, a consistent estimate of the causal effect can be obtained by dividing the variant-outcome association by the variant-exposure association [ 6 ]. To increase statistical power, ratio estimates across multiple genetic variants are often aggregated using meta-analytic methods such as the inverse variance weighted (IVW) estimator [ 7 ]. However, IVW is known to be sensitive to weak instruments and violations of the IV assumptions [ 8 ]. To address these issues, alternative summary-level methods, such as MR-Egger [ 9 ] and MR-RAPS [ 10 ], have been proposed. A key focus of this work is the mitigation of Winner’s Curse bias in summary-level MR. To satisfy the IV relevance condition, genetic variants are usually selected by applying a genome-wide significance threshold, e.g. p-value < 5 × 10 -8 , to exposure GWAS summary data. However, using the same dataset for both instrument selection and estimation introduces Winner’s Curse, where variant-exposure associations of selected variants are overestimated due to selection bias [ 11 ]. Provided that the variant-outcome associations are estimated independently, this results in downward bias in the MR causal effect estimate, pulling it toward the null. To date, the only widely adopted solution to this problem has been the use of a third, independent dataset for instrument selection in a so-called ‘three-sample’ design [ 10 ]. While this avoids the overlap that causes Winner’s Curse, it is often impractical, requiring access to three large, non-overlapping GWAS datasets of similar ancestry, which is a challenge for many traits, particularly in understudied populations. Alternatively, a single dataset could be split into separate parts, but this sacrifices statistical power and efficiency, and also is only an option if individual-level data are available. Weak instruments pose a further source of bias. A genetic variant is considered a weak instrument if it explains only a small proportion of variation in the exposure [ 12 ]. The magnitude and direction of the bias this introduces depends on the degree of sample overlap between the exposure and outcome GWASs. In a complete overlap (one-sample) setting, causal estimates are biased toward the observational association, increasing the risk of Type I error. In contrast, using two non-overlapping samples biases results toward the null. While most summary-level MR methods have been designed under the assumption of complete independence between exposure and outcome GWAS samples, substantial participant overlap is common in practice as the largest outcome and exposure GWAS often come from the same consortia [ 13 ]. Restricting analyses to non-overlapping GWASs again leads to inefficient data use. To address these challenges, we propose a novel summary-level MR method, MR Simulated Sample Splitting (MR-SimSS). MR-SimSS extends the benefits of the ‘three-sample’ design to single sample settings, by imitating the process of splitting an individual-level dataset into three parts: one for instrument selection and two for independent estimation of the variant-exposure and variant-outcome associations. Importantly, this is achieved using only GWAS summary statistics. MR-SimSS leverages asymptotic conditional distributions to repetitively simulate association estimates in each of the three parts, or data-subsets, conditional on the known full dataset estimates. On each iteration, instrument variants are selected based on the simulated variant-exposure associations for the first subsample, and a two-sample MR method, such as IVW or MR-RAPS, is then applied to the exposure and outcome associations that are simulated for that set of instruments in the second and third subsets. MR estimates from each iteration are averaged to reduce variance. This approach allows use of the full dataset while avoiding biases introduced by sample overlap and Winner’s Curse. We assessed MR-SimSS under varying levels of sample overlap and exposure-outcome correlation, using pairs of simulated exposure and outcome GWAS summary statistics. Several existing MR methods were included for comparison. Same-trait analyses were also conducted using UK Biobank [ 15 ] body mass index (BMI) data, where the true causal effect is known to be 1, providing a useful benchmark. All methods were evaluated across three key metrics: average bias, root mean square error (RMSE) and empirical coverage probability of 95% confidence intervals. These evaluations showed that many MR methods are adversely affected by biases arising due to sample overlap, be it using the same samples for instrument selection and estimating variant-exposure associations or using overlapping datasets to estimate both variant-exposure and variant-outcome associations. MR-SimSS illustrated a strong ability to mitigate these biases, especially those arising from Winner’s Curse. However, the simulated sample splitting process can increase susceptibility to weak instrument bias. To address this, we recommend incorporating a robust two-sample method, such as MR-RAPS [ 10 ], within MR-SimSS. Our results show that the 3-split version of MR-SimSS, when combined with MR-RAPS, consistently outperforms all other evaluated methods across key performance metrics. Finally, we demonstrate the practical utility of MR-SimSS in a real-world example assessing the causal effect of BMI on risk of Type 2 diabetes (T2D), highlighting the method’s value in applied epidemiological research. Methods Overview of MR-SimSS MR-SimSS reconstructs the statistical conditions of a three-sample Mendelian Randomization (MR) design using only GWAS summary statistics for variant-exposure and variant-outcome associations, even when these originate from overlapping samples. This enables unbiased causal inference in the presence of Winner’s Curse and weak instrument bias. The method operates under the assumption that marginal variant effect estimates follow an asymptotic multivariate normal distribution. Based on this, we have derived an analytical expression (see Equation (1)) that allows simulation of marginally independent variant effect estimates from hypothetical non-overlapping subsamples, without requiring access to individual-level genotypes or phenotypes. The core procedure comprises three steps. First, MR-SimSS defines a hypothetical partition of the original dataset, allocating a fraction (e.g. π ) to a synthetic discovery subset. Conditional on the observed summary statistics, variant-exposure and variant-outcome association estimates are simulated for this subset and used to select instruments based on a genome-wide significance threshold. Second, to mitigate Winner’s Curse, MR-SimSS generates variant-exposure and variant-outcome association estimates from the remaining pseudo-subsample. These are derived according to the asymptotic linearity of maximum likelihood estimators under data partitioning (see Equation (2)), and are marginally independent of the selection step. As a result, they can be supplied directly to any standard two-sample MR estimator, such as IVW, MR-Egger or MR-RAPS, without inducing selection bias. However, in the presence of sample overlap between exposure and outcome GWASs, a residual correlation between and may remain, reintroducing weak instrument bias in the direction of the confounded observational association. To address this, MR-SimSS incorporates a three-split extension, where the 1 ― π data fraction is further subdivided into two non-overlapping fractions. Independent variant-exposure and variant-outcome association estimates are then generated for splits two and three using a similar conditional Gaussian framework, this time conditioning on the simulated summary statistics and from the first step. This removes residual covariance and restores the assumption of independence between numerator and denominator that is made by many two-sample MR estimators, like IVW and MR-RAPS. This step is especially important when exposure and outcome GWASs exhibit substantial sample overlap, ensuring that any remaining bias, if not corrected by the chosen MR method, is toward the null. To improve stability, the entire procedure is repeated over multiple random simulated splits, and causal effect estimates are averaged across iterations. MR-SimSS is compatible with both continuous and binary traits and generalizes to a wide range of GWAS settings, including full or partial sample overlap. Importantly, it permits valid use of robust MR methods, such as MR-RAPS, in settings where standard assumptions of independence are violated. Unbiased and efficient estimation of causal effects using commonly available summary-level data is therefore enabled as MR-SimSS reconstructs the independence structure of a three-sample MR design via conditional simulation. Technical Details For each genetic variant j = 1,…, N , we assume availability of variant-exposure and variant-outcome association estimates together with their respective standard errors, i.e. from an exposure GWAS with sample size n x and from an outcome GWAS with sample size n y . Summary statistics are assumed to arise from linear or logistic regression models applied to standardized genotypes, following standard GWAS practice. We allow for possible sample overlap ( n overlap ≤ min( n x , n y )) between the exposure and outcome studies, and assume that linkage disequilibrium (LD) pruning or clumping has already been applied, resulting in a set of uncorrelated variants with summary statistics available in both GWASs. If this individual-level data were available, Winner’s Curse could be eliminated by randomly splitting the data into two fractions π and 1 ― π , conducting GWASs on each, and then selecting instruments in one part and estimating causal effects in the other. Since only summary-level data are available, we simulate this splitting process by drawing from our derived asymptotic conditional distribution of the GWAS estimates in the π -fraction, conditional on the full-sample GWAS statistics. Therefore, for each variant j , association estimates and are simulated according to: Where and ρ = cor( X,Y ) denotes the correlation between the exposure and outcome, potentially non-zero due to confounding. A proof that this is the correct conditional distribution to use for the simulation is given in the Supplementary Note. In practice, n overlap and ρ may not be known; we propose a data-driven estimator of the parameter , as detailed in Supplementary Note. Unconditional standard errors in the π -fraction are approximated by and . Instruments are selected using z-statistics , and a genome-wide significance threshold of 5 × 10 -8 . To ensure independence between instrument selection and estimation, association estimates in the remaining (1 ― π )-fraction can be reconstructed as follows, using asymptotic linearity of maximum likelihood estimates: with corresponding standard errors scaled by . In the simplest (2-split) implementation of MR-SimSS, the selected genetic variants and their corresponding association estimates in the (1 ― π )-fraction are inputted into a summary-level MR method, such as IVW. However, this approach may still incur weak instrument bias in the direction of confounding if the exposure and outcome GWASs overlap. To address this, we extend the approach to a 3-split framework. In this version, the (1 ― π )-fraction is further conceptually split into sub-fractions of sizes p and 1 ― P, with simulated exposure estimates derived from the P-subset and outcome estimates from the remaining (1 ― P)-subset. These are simulated using a second conditional distribution, analogous to the form above. For each variant j , this yields independent association estimates and associated standard errors, , which are then used as input into the 2-sample MR method being used with MR-SimSS at each iteration. Again, standard errors are scaled appropriately with and . This simulated sample splitting procedure is repeated multiple times to reduce variability, and the final causal effect estimate, , is computed by averaging across iterations k = 1,…, N iter : in which is the causal effect estimate supplied by the summary-level MR method of choice on the k th iteration. To quantify uncertainty, we derive the standard error of the average estimate using the following decomposition: The first term captures the average estimation variance across iterations, while the second adjusts for between-iteration variation, analogous to a Monte Carlo error correction. This formulation follows from the identity Var( X ) = 𝔼[ X 2 ] ― (𝔼[ X ]) 2 , and is shown more thoroughly in the Supplementary Note. We refer to this method as MR-SimSS (Mendelian Randomization via Simulated Sample Splitting). The default implementation sets N iter = 1000 to ensure stable convergence of the mean and variance estimates, and fixes π = p = 0.5, following empirical guidance from Sadreev et al. [ 18 ], who found equal splits to offer the most flexibility when designing two-sample MR with sample splitting. Because the 3-split procedure may increase weak instrument bias towards the null due to reduced effective sample sizes, we also consider MR-SimSS in combination with MR-RAPS [ 10 ], which is designed to account for weak instruments when using independent samples. Our framework facilitates the application of MR-RAPS even when the underlying GWASs are partially overlapping, by producing independent summary statistics through simulation. While MR-SimSS is designed to improve causal inference accuracy, it can be computationally demanding when applied to large GWAS datasets due to the need to repeatedly simulate and evaluate many variants. To mitigate this, we introduce a probabilistic variant pre-selection strategy that retains computational efficiency while preserving instrument coverage with high probability. For each variant j , we compute the probability that it will be selected in any iteration based on the simulated z-statistic probability of variant j passing the significance threshold Φ ―1 (1 ― α /2), for the standard normal cumulative distribution function Φ(·) and chosen α , which by default corresponds to genome-wide significance α =5 × 10 -8 , is given by: in which . Derivation of this expression is provided in Supplementary Note. To construct a reduced variant subset, we rank variants by f j and compute the cumulative sum of these probabilities. We retain the smallest set of variants whose cumulative inclusion probability exceeds 0.95. This guarantees that the reduced and full variant sets will produce identical instruments on any iteration with at least 95% probability. Equivalently, the expected difference in the number of instruments selected by the full and reduced procedures is bounded by 5%. This subsetting procedure provides a principled and efficient means to scale MR-SimSS to large-scale genomic subsets. Simulation study We conducted simulations to assess the performance of MR-SimSS in reducing Winner’s Curse bias in MR and to compare it against established MR methods. A factorial design was implemented, varying the following parameters: Exposure heritability: h 2 ∈ {0.3, 0.7} Proportion of causal SNPs: π ∈ {0.01, 0.001} Sample overlap: n overlap ∈ {0, 0.25, 0.5, 0.75, 1} Exposure-outcome correlation: ρ ∈ {― 0.1, 0.1, 0.3, 0.5} Each scenario assumed equal exposure and outcome GWAS sample sizes, n X = n Y = 200,000, and a true causal effect β = 0.3. For each replicate, we simulated GWAS summary statistics for N = 1,000,000 independent genetic variants. True variant-exposure effects were sampled such that a proportion π had non-zero effects drawn from a normal distribution, calibrated to yield the specified heritability h 2 . True variant-outcome effects were defined as . Estimated summary statistics were drawn from a bivariate normal distribution: with variant minor allele frequencies (maf j ) simulated uniformly over [0.01, 0.5], an expression that is justified as an appropriate asymptotic distribution in the supplementary material, when both exposure and outcome have variance 1. Standard errors were assumed to be known. For each of the 80 parameter combinations, we simulated 100 independent datasets. To assess robustness to sample size, the simulations were repeated for n X = n Y = {50,000, 500,000}. Simulations under the null, in which the true causal effect was fixed at β = 0, with complete sample overlap, were also conducted. Each dataset was analysed using MR-SimSS (2-split and 3-split) with IVW and MR-RAPS, standard MR methods such as IVW and MR-RAPS using genome-wide significant instruments ( p < 5 × 10 -8 ), and debiased IVW (dIVW), a bias-corrected estimator that uses all variants and does not rely on SNP selection [ 22 ]. Each of these methods was evaluated using: Here, β = 0.3 is the true causal effect, and are the estimate and standard error in replicate k , and 𝕀 is the indicator function. We additionally report the average causal effect estimate, average standard error, and the empirical standard deviation across replicates. Real data processing For the empirical same-trait BMI-BMI analyses, the large-scale UK Biobank [ 15 ] BMI dataset was randomly split in half 10 times to generate 10 pairs of non-overlapping samples. In each of the 20 resulting subsets, quality control and GWAS were performed using PLINK 2.0 [ 17 ], following the same procedures as outlined in Forde et al. [ 14 ]. This yielded 10 pairs of independent GWAS summary statistics datasets. A set of approximately independent variants was obtained via LD pruning using the PLINK 2.0 [ 17 ] command ‘indep-pairwise 50 5 0.5’. Instrument variants were selected based on the conventional genome-wide significance threshold of p < 5 × 10 -8 . Results Simulation study We conducted a comprehensive simulation study to evaluate the finite-sample performance of MR-SimSS relative to existing summary-level MR methods. The simulations assumed equal exposure and outcome GWAS sample sizes of 200,000, and explored 80 distinct configurations defined by varying the proportion of causal variants, heritability of the exposure, fraction of sample overlap, and exposure-outcome correlation. Throughout, it was assumed that overlap and correlation parameters were unknown to the analyst. For each simulation, MR-SimSS in both two-split and three-split variants using MR methods; IVW and MR-RAPS, was used to estimate the causal effect of the exposure on the outcome. The implementation of MR-SimSS also incorporated estimation of the parameter λ, representing the correlation between variant-exposure and variant-outcome association estimates (see Methods). Table 1 summarizes mean performance metrics - bias, root mean squared error (RMSE), empirical standard deviation, and 95% coverage probability - averaged across all parameter settings. Supplementary Fig. 4 provides disaggregated boxplots of causal effect estimates stratified by overlap and correlation, collapsed across heritability and proportion of true effects. Notably, SimSS-3-RAPS, the three-split implementation using MR-RAPS, achieved uniformly superior performance. Across all simulations, it attained the lowest average bias (∼0), lowest RMSE (∼0.0009), and highest empirical coverage (93.9%). While successfully mitigating bias due to Winner’s Curse, MR-SimSS’s sample splitting procedure does reduce the effective sample size used for estimation, thus increasing susceptibility to weak instrument bias. This is particularly evident when IVW is implemented within MR-SimSS. For example, SimSS-3-IVW, which uses simulated non-overlapping splits for the generation of variant-exposure and variant-outcome association estimates, consistently exhibited downward weak instrument bias regardless of actual overlap, with an average bias of -0.0121 across settings (Supplementary Fig. 4). This pattern is visible in the boxplots, where the causal effect estimates provided by SimSS-3-IVW remain below 0.3 in all cases. In contrast, SimSS-2-IVW shows bias that varies with overlap, due to incomplete independence between the simulated subsamples used for estimation. View this table: View inline View popup Download powerpoint Table 1. Summarized simulation results for each method, averaged over all parameter combinations, including fraction of overlap, for sample sizes of 200,000. Using MR-RAPS with MR-SimSS, in three-split form, mitigates this weakness. When the GWAS datasets are independent or exhibit low overlap, both SimSS-2-RAPS and SimSS-3-RAPS yield nearly unbiased estimates. This is to be expected as MR-SimSS is designed to address weak instrument bias under independence of variant-exposure and variant-outcome estimates [ 10 ]. However, when this independence condition is not met, for example in the setting where the exposure-outcome correlation is equal to 0.5 and there is high overlap in the two GWAS databases, SimSS-2-RAPS leads to inflated bias, as evidenced in Supplementary Fig. 4. The variant of MR-SimSS using MR-RAPS with three splits does not suffer from this defect as the simulated exposure and outcome associations used in the estimation step are independent, even when the associations in the real data are correlated. Among all methods, SimSS-3-RAPS provides the most accurate causal effect estimates on average. Notably, it remains robust in the extreme case of full sample overlap and high correlation, where all other methods (except the negatively biased SimSS-3-IVW) yield upward-biased estimates toward the observational association. However, a consistent feature of all MR-SimSS methods, including SimSS-3-RAPS, is their slightly higher standard errors relative to competing approaches due to the variance inflation induced by simulated sample splitting. The standard IVW and MR-RAPS estimators display average negative bias and low empirical coverage, confirming susceptibility to Winner’s Curse. The dIVW method performs poorly across all overlapping sample settings, with estimates often exceeding the plausible range of 0.2-0.4, as illustrated in Supplementary Fig. 4. These findings indicate that dIVW is highly sensitive to sample overlap and cautions against its use when shared individuals are suspected between GWASs. Fig. 1 and Supplementary Table 1 report performance under strictly non-overlapping samples. In this setting, both SimSS-2-RAPS and SimSS-3-RAPS achieved near-zero bias (<0.0005), low RMSE, and empirical coverage between 94% and 97%. Due to the unnecessary inflation of variance introduced by three splits in the absence of overlap, SimSS-2-RAPS achieves slightly better RMSE. Conversely, standard IVW and MR-RAPS are substantially biased in settings with low proportions of causal variants. dIVW, while unbiased in this setting, suffered from large standard errors, resulting in elevated RMSE and variability. Download figure Open in new tab Fig. 1: Causal effect estimates for simulation settings with zero overlap. Estimated causal effect for each method and simulation setting with sample sizes of 200,000 and zero overlap, averaged over 100 simulated pairs of exposure and outcome GWAS summary statistics for each setting. Methods are abbreviated as: SimSS-2-IVW = 2-split version of MR-SimSS using IVW, SimSS-2-RAPS = 2-split version of MR-SimSS using MR-RAPS, SimSS-3-IVW = 3-split version of MR-SimSS using IVW, SimSS-3-RAPS = 3-split version of MR-SimSS using MR-RAPS, IVW = Inverse variance weighted method, RAPS = Robust Adjusted Profile Score of Zhao et al. [ 10 ], and dIVW = debiased IVW method of Ye et al. [ 22 ]. In the opposite extreme of complete sample overlap, Fig. 2 and Supplementary Table 2 illustrate that SimSS-3-RAPS again attained the most favourable balance of bias, RMSE, and coverage. Its estimates remained unbiased even under strong exposure-outcome correlation, while all other estimators—except SimSS-3-IVW—exhibited substantial upward bias toward the confounded observational association. Other estimators, including IVW and MR-RAPS, failed to correct for this bias. Performance under intermediate overlap fractions (25%, 50%, 75%) is reported in Supplementary Figs. 1-3 and reveals consistent trends favouring SimSS-3-RAPS. Download figure Open in new tab Fig. 2: Causal effect estimates for simulation settings with full overlap. Estimated causal effect for each method and simulation setting with sample sizes of 200,000 and full overlap, averaged over 100 simulated pairs of exposure and outcome GWAS summary statistics for each setting. Methods are abbreviated as: SimSS-2-IVW = 2-split version of MR-SimSS using IVW, SimSS-2-RAPS = 2-split version of MR-SimSS using MR-RAPS, SimSS-3-IVW = 3-split version of MR-SimSS using IVW, SimSS-3-RAPS = 3-split version of MR-SimSS using MR-RAPS, IVW = Inverse variance weighted method, RAPS = Robust Adjusted Profile Score of Zhao et al. [ 10 ], and dIVW = debiased IVW method of Ye et al. [ 22 ]. Supplementary Fig. 5 and Supplementary Table 3 show the results of simulations conducted with fully overlapping samples and a true causal effect of zero. The impact that biases due to instrument selection and participant overlap can have when two-sample MR methods are naively implemented is highlighted as IVW and MR-RAPS are seen to have poor empirical coverage probabilities and highly elevated false positive rates. Importantly, these results show roughly 95% coverage for both SimSS-3-IVW and SimSS-3-RAPS, indicating their ability to preserve type I error at ∼5%, under this simulated setting of a null causal effect. To assess sample size sensitivity, method performance was evaluated under alternative sample sizes of 500,000 and 50,000. With larger sized samples (500,000), performance of all methods improved due to increased instrument strength. Nevertheless, SimSS-3-RAPS remained the most accurate estimator, with average bias below 0.0001, RMSE of 0.0029, and empirical coverage of 94.1%. However, for smaller sample sizes of 50,000, MR-SimSS methods exhibited sensitivity to instrument sparsity. As shown in Supplementary Table 5, SimSS-3-RAPS remained the least biased estimator but incurred a markedly high standard error (∼58.29) and RMSE more than tenfold that of IVW and MR-RAPS. This instability is further illustrated in Supplementary Fig. 8, where effect estimates span a wide range (-1 to 1), attributable to the limited number of genome-wide significant variants in the simulated settings included in this figure. For instance, under 30% heritability and a 1% true effect proportion, only ∼10 variants exceeded genome-wide significance, yielding an average of ∼3 instruments per iteration, and thus, severely impairing causal effect estimation with MR-SimSS. To see whether the performance of SimSS-3-RAPS could be improved under such low-power conditions, we examined the impact of relaxing the instrument selection threshold. As shown in Supplementary Fig. 11 and Supplementary Table 6, increasing the significance threshold from 5 × 10 -8 to 5 × 10 -4 led to a substantial reduction in RMSE, from 1.008 to 0.032, while maintaining minimal bias (0.0066). This suggests that relaxing the selection criterion applied in MR-SimSS can substantially improve estimator stability when few variants are genome-wide significant (p < 5 × 10 -8 ). However, such adjustments to the MR-SimSS selection step inherently introduce weak instrument bias and as such, it is essential that robust MR methods, such as MR-RAPS, are used within the MR-SimSS framework to ensure valid inference. Same-trait empirical analysis To assess the empirical performance of MR-SimSS, we conducted same-trait MR analyses, estimating the causal effect of BMI on itself, using independent GWASs from the UK Biobank [ 15 ]. These analyses provide a realistic validation setting in which the true causal effect is known to be 1. 10 pairs of non-overlapping samples of ∼166,000 individuals were used to generate BMI GWAS summary statistics for ∼1.6 million LD-pruned variants using PLINK 2.0 [ 17 ]. Same-trait MR analyses were performed bidirectionally for each pair of summary statistics, yielding 20 causal effect estimates per evaluated method. All MR-SimSS variants and conventional methods, including MR-Egger and weighted median [ 6 ], were assessed using bias, RMSE and 95% coverage probability. Table 2 and Fig. 3 summarize the results of the repeated BMI-BMI analyses using pruned instruments. IVW, MR-RAPS and weighted median methods exhibited substantial downward bias, with mean causal estimates of 0.838, 0.865, and 0.807, respectively. All three methods yielded 0% empirical coverage, confirming susceptibility to Winner’s Curse. MR-Egger was less biased with an average causal effect estimate of 0.989, but its coverage was moderate (0.65) and its estimate variance nearly 4 times that of SimSS-2-RAPS, reflecting instability. In contrast, SimSS-2-RAPS and SimSS-3-RAPS outperformed all methods, delivering near-unbiased estimates (bias = 0.0015, 0.0017) and full 95% coverage. While dIVW had the lowest RMSE (0.0146), its poor coverage (0.30) reflects incorrect standard error estimation. View this table: View inline View popup Table 2. Summarized results for the sets of 20 same-trait BMI-BMI analyses for each method. Download figure Open in new tab Fig. 3: Causal effect estimates for 20 same-trait BMI-BMI analyses. Boxplots of the estimated causal effects for each method resulting from the 20 same-trait BMI-BMI analyses. Methods are abbreviated as: SimSS-2-IVW = 2-split version of MR-SimSS using IVW, SimSS-2-RAPS = 2-split version of MR-SimSS using MR-RAPS, SimSS-3-IVW = 3-split version of MR-SimSS using IVW, SimSS-3-RAPS = 3-split version of MR-SimSS using MR-RAPS, IVW = Inverse variance weighted method, RAPS = Robust Adjusted Profile Score of Zhao et al. [ 10 ], Egger = Egger regression of Bowden et al. [ 9 ], Weighted median = Weighted median approach of Bowden et al. [ 6 ], and dIVW = debiased IVW method of Ye et al. [ 22 ]. The black horizontal line represents the true causal effect of 1. SimSS-2-IVW and SimSS-3-IVW produced estimates free from Winner’s Curse but suffered from downward weak instrument bias, with mean biases of -0.0247 and -0.0503, and reduced coverage. These empirical results reinforce simulation findings: MR-SimSS, particularly SimSS-3-RAPS, reliably corrects for Winner’s Curse, providing accurate and well-calibrated estimates even in real-world data. Effect of body mass index on type 2 diabetes The four MR-SimSS variants, together with other MR methods, were also used to estimate the causal effect of BMI on type 2 diabetes (T2D), under varying degrees of sample overlap. First, a sample of 166,266 individuals with outcome information was randomly selected from the entire UKBB [ 15 ] T2D data set and used to generate a set of outcome GWAS summary statistics with PLINK 2.0 [ 17 ]. For the exposure, BMI, 5 different sets of GWAS summary statistics were generated using similarly-sized sets of individuals, all with different percentages of sample overlap with the outcome data set (0%, 25%, 50%, 75%, 100%). The results of the 5 BMI-T2D analyses are summarized in Fig. 4 and Table 3 . In line with previous MR studies [ 23 ], higher BMI was confirmed to be a causal risk factor for T2D. All methods yield statistically significant causal effect estimates, with all 95% confidence intervals lying above 1. The traditional IVW approach yielded estimated effects ranging from 1.171, for non-overlapping samples, to 1.298, for fully overlapping samples. In contrast, the range of causal effect estimates provided by SimSS-3-RAPS is ∼35% smaller, from 1.29 to 1.372. The difference between SimSS-3-RAPS and IVW estimates was greatest in the zero overlap setting, with our results suggesting that IVW underestimated the causal effect by ∼9% due to downward bias caused by both Winner’s Curse and weak instruments. These results illustrate MR-SimSS’s ability to provide more consistent effect estimates across different degrees of sample overlap between exposure and outcome data sets. View this table: View inline View popup Table 3. Summarized results for the BMI-T2D analyses across varying sample overlap. Download figure Open in new tab Fig. 4: Causal effect estimates for BMI-T2D analyses, with varying sample overlap. Estimated causal effects for each method resulting from BMI-T2D analyses with various percentages of sample overlap. Methods are abbreviated as: SimSS-2-IVW = 2-split version of MR-SimSS using IVW, SimSS-2-RAPS = 2-split version of MR-SimSS using MR-RAPS, SimSS-3-IVW = 3-split version of MR-SimSS using IVW, SimSS-3-RAPS = 3-split version of MR-SimSS using MR-RAPS, IVW = Inverse variance weighted method, RAPS = Robust Adjusted Profile Score of Zhao et al. [ 10 ], Egger = Egger regression of Bowden et al. [ 9 ], Weighted median = Weighted median approach of Bowden et al. [ 6 ], and dIVW = debiased IVW method of Ye et al. [ 22 ]. Discussion We introduce MR Simulated Sample Splitting (MR-SimSS), a novel summary-level MR method designed to correct Winner’s Curse bias. Winner’s Curse arises when the same GWAS dataset is used for both instrument selection and variant-exposure association estimation, often producing deflated causal effect estimates. In recent years, summary-level MR, or two-sample MR - has become the dominant MR approach, driven by its ease of use and the broad availability of complete summary data. This has spurred the development of numerous summary-level MR methods aimed at accurate causal effect estimation [ 16 ]. However, methods explicitly addressing Winner’s Curse bias remain underdeveloped. While using an independent sample for instrument selection is a commonly accepted solution [ 10 ], we consider such an approach suboptimal due to reduced statistical power from dataset partitioning and potential heterogeneity introduced by dissimilar populations. Accordingly, MR-SimSS requires no such independent dataset to be available. MR-SimSS addresses Winner’s Curse by employing asymptotic conditional distributions to emulate repetitive splitting of a large individual-level dataset into distinct fractions. Instrument selection is based on association estimates from one fraction, while the remaining fraction is used for estimation. At each iteration, causal effect estimates are obtained via the integration of a summary-level MR method. We investigated the use of both the IVW [ 7 ] and MR-RAPS [ 10 ] methods within the context of our simulated sample splitting procedure. Furthermore, the MR-SimSS framework accommodates both partial and full sample overlap between exposure and outcome GWASs, a frequent scenario in large biobank datasets such as UK Biobank. In a factorial simulation study, varying sample overlap and exposure-outcome correlation, SimSS-3-RAPS - the 3-split version of MR-SimSS integrating MR-RAPS - consistently demonstrated superior performance, yielding unbiased causal estimates across all scenarios. It achieved the highest empirical coverage (0.939), minimal average bias (0.0001) and lowest RMSE, illustrating its capacity to overcome both Winner’s Curse and weak instrument bias. As shown in Supplementary Fig. 4, SimSS-3-RAPS remains unbiased irrespective of exposure-outcome correlation, even in the presence of fully overlapping samples. When independent GWASs are available, SimSS-2-RAPS performs comparably well. Although SimSS-2-IVW and SimSS-3-IVW are susceptible to weak instrument bias, both outperform naïve IVW, underscoring MR-SimSS’s utility even when paired with simpler estimators. Our simulations reaffirm the vulnerability of standard methods, such as IVW and MR-RAPS, to Winner’s Curse. For example, Supplementary Table 1, shows coverage below 0.51 for these methods under zero-overlap conditions when selection and estimation utilize the same exposure data. Our simulation results with smaller sample sizes, e.g. 50,000, underscore the importance of sufficient instrument strength and quantity for stable estimation using MR-SimSS. When the average number of instruments per iteration is low, fewer than ∼20, the method exhibits increased variability and reduced precision. However, we find that performance improves substantially when the instrument selection threshold is relaxed. Specifically, our findings demonstrate that in low-power settings, employing a less stringent selection threshold offers a practical strategy to recover estimator stability within the MR-SimSS framework (Supplementary Fig. 11), provided that weak instrument bias is appropriately mitigated through the use of robust MR estimators. Our simulations also demonstrate that MR-SimSS in its three-split variety, when paired with MR-RAPS has roughly 95% coverage, and consequentially 5% Type I error, under the null hypothesis of no causal effect (Supplementary Fig. 5). It is well known that the combination of sample overlap and weak instrument bias typically leads to inflated Type I error, even for methods that are robust to weak instrument bias under no sample overlap, such as MR-RAPS as we show in our simulations. Given what has been referred to as a ‘credibility crisis’ in Mendelian Randomization [ 25 ], it is essential that MR methods have preserved Type I error under general conditions, and the MR-SimSS framework is an important development in this regard. Same-trait empirical analyses (e.g. BMI-BMI) corroborate the simulation findings, particularly under independent sample conditions ( Fig. 3 ). Across 20 BMI-BMI analyses, IVW, MR-RAPS, and the weighted median method displayed pronounced Winner’s Curse bias, with coverage probabilities of zero and average bias ranging from -0.2 to -0.13. In contrast, SimSS-2-RAPS and SimSS-3-RAPS yielded unbiased estimates with coverage of 0.95 and negligible bias (<0.002), demonstrating robustness to both Winner’s Curse and weak instrument bias. Admittedly, the current formulation of MR-SimSS has certain limitations. Throughout our investigation, the splitting fractions, π and p , were both fixed at 0.5. Determining universally optimal values for these fractions is inherently challenging as they likely depend on the underlying genetic architectures of both the exposure and outcome traits, as well as the sample sizes of the source GWAS datasets. Our selection of π = 0.5 was partly informed by Sadreev et al. [ 17 ]. A higher value of π increases the number of instruments per iteration; thus, π = 0.5 balances the fractions used for instrument generation and for estimation of associations in the 3-split setting. With both splitting fractions set to 0.5, only 25% of the total sample informs each variant-exposure and variant-outcome association estimate, increasing variance in the resulting causal effect estimates. This variance inflation can be largely mitigated by using a sufficiently large number of iterations, e.g. 1000, ensuring stability and precision in the final estimate. Adaptive tuning of these parameters merits future exploration. An additional avenue for future research is the integration of MR-SimSS with alternative summary-level MR methods. We anticipate optimal performance when paired with approaches robust to weak instruments and pleiotropy, whereas more vulnerable methods may yield less reliable estimates. Although pleiotropy was not explicitly modeled in simulations, MR-SimSS inherits the properties of the embedded MR method. For example, SimSS-3-RAP’s strong resistance to weak instrument bias is derived from MR-RAPS itself. Therefore, combining MR-SimSS with pleiotropy-robust methods is expected to be suitable for analyses affected by directional or horizontal pleiotropy. Conceptually, MR-SimSS functions not as a standalone MR estimator, but as a general framework for mitigating bias due to Winner’s Curse and sample overlap in summary-level MR. It complements existing MR methods, enabling researchers to utilize the largest available GWAS datasets, even with overlapping samples, without requiring a third, independent dataset. Due to the lack of accessible software, we were unable to include the recently proposed rerandomized IVW (RIVW) estimator [ 24 ] in our method evaluations. The RIVW estimator may be regarded as conceptually similar to MR-SimSS, as both approaches were designed to facilitate independent instrument selection and unbiased estimation of variant-exposure associations using a single exposure dataset. By introducing pseudo variant-exposure associations into the selection step and then using Rao-Blackwellization to produce a consistent estimator for the causal effect, RIVW successfully breaks the Winner’s Curse in the classical two-sample IVW estimator [ 24 ]. For settings with non-overlapping exposure and outcome samples, this Rao-Blackwellization result could be viewed as the theoretical expectation of what would be obtained if MR-SimSS was applied with an IVW estimate adapted to handle weak instrument bias. As RIVW is a non-simulation based approach, it is likely to be more computationally efficient than MR-SimSS. However, it requires that the exposure and outcome GWASs have been performed with non-overlapping samples and is vulnerable to unbalanced pleiotropy. In contrast, we have demonstrated here how MR-SimSS can mitigate Winner’s Curse bias irrespective of sample overlap and can also be used with existing MR methods that are resistant to weak instrument bias and certain types of pleiotropy. In conclusion, MR-SimSS provides a principled and practical solution to two pervasive issues in MR analysis, Winner’s Curse and weak instrument bias, when only GWAS summary statistics are accessible. By enabling the use of maximal GWAS data, MR-SimSS substantially improves the reliability of causal effect estimates, thus offering a certain valuable contribution to the MR methodological toolkit. Data Availability The real-data analysis has been conducted using the UK Biobank Resource under Application Number 23739 ( https://www.ukbiobank.ac.uk/enable-your-research/approved-research/exploring-the-shared-genetic-aetiology-between-schizophrenia-and-cognition ). Code Availability The code used for both the simulation study and the real-data analysis in the manuscript is available at https://github.com/amandaforde/mrsimss-paper . Code to implement MR-SimSS is available in the ‘mr.simss’ R package ( https://github.com/amandaforde/mr.simss ). Supplementary Information S1 File. Text Supplement . This file contains supplementary figures, tables as well as important derivations. References 1. ↵ Davey Smith G , Ebrahim S. ‘Mendelian randomization’: can genetic epidemiology contribute to understanding environmental determinants of disease? Int J Epidemiol . 2003 ; 32 ( 1 ): 1 – 22 . OpenUrl CrossRef PubMed Web of Science 2. ↵ Smith GD , Ebrahim S. Data dredging, bias, or confounding: they can all get you into the BMJ and the Friday papers . BMJ . 2002 ; 325 ( 7378 ): 1437 . OpenUrl FREE Full Text 3. ↵ Swanson SA , Tiemeier H , Ikram MA , Hernán MA. Nature as a trialist? Deconstructing the analogy between Mendelian randomization and randomized trials . Epidemiology . 2017 ; 28 ( 5 ): 653 – 9 . OpenUrl CrossRef PubMed 4. ↵ Sanderson E , Davey Smith G , Windmeijer F , Bowden J. Mendelian randomization . Nat Rev Methods Primers . 2022 ; 2 : 6 . OpenUrl PubMed 5. ↵ Burgess S , Scott RA , Timpson NJ , Davey Smith G , Thompson SG . Using published data in Mendelian randomization: a blueprint for efficient identification of causal risk factors . Eur J Epidemiol . 2015 ; 30 ( 7 ): 543 – 52 . OpenUrl CrossRef PubMed 6. ↵ Bowden J , Davey Smith G , Haycock PC , Burgess S. Consistent estimation in Mendelian randomization with some invalid instruments using a weighted median estimator . Genet Epidemiol . 2016 ; 40 ( 4 ): 304 – 14 . OpenUrl CrossRef PubMed 7. ↵ Burgess S , Dudbridge F , Thompson SG . Combining information on multiple instrumental variables in Mendelian randomization: comparison of allele score and summarized data methods . Stat Med . 2016 ; 35 ( 11 ): 1880 – 906 . OpenUrl CrossRef PubMed 8. ↵ Bowden J , Del Greco MF , Minelli C , Davey Smith G , Sheehan NA , Thompson JR . Assessing the suitability of summary data for two-sample Mendelian randomization analyses using MR-Egger regression: the role of the I2statistic . Int J Epidemiol . 2016 ; 45 ( 6 ): 1961 – 74 . OpenUrl CrossRef PubMed 9. ↵ Bowden J , Davey Smith G , Burgess S. Mendelian randomization with invalid instruments: effect estimation and bias detection through Egger regression . Int J Epidemiol . 2015 ; 44 ( 2 ): 512 – 25 . OpenUrl CrossRef PubMed 10. ↵ Zhao Q , Wang J , Hemani G , Bowden J , Small DS . Statistical inference in two-sample summary-data Mendelian randomization using robust adjusted profile score . Ann Stat . 2020 ; 48 ( 3 ): 1742 – 69 . OpenUrl CrossRef 11. ↵ Jiang T , Gill D , Butterworth AS , Burgess S. An empirical investigation into the impact of winner’s curse on estimates from Mendelian randomization . Int J Epidemiol . 2022 ; 52 ( 5 ): 1209 – 19 . OpenUrl 12. ↵ Burgess S , Thompson SG . Bias in causal estimates from Mendelian randomization studies with weak instruments . Stat Med . 2011 ; 30 ( 11 ): 1312 – 23 . OpenUrl CrossRef PubMed 13. ↵ Burgess S , Davies NM , Thompson SG . Bias due to participant overlap in two-sample Mendelian randomization . Genet Epidemiol . 2016 ; 40 ( 7 ): 597 – 608 . OpenUrl CrossRef PubMed 14. ↵ Forde A , Hemani G , Ferguson J. Review and further developments in statistical corrections for winner’s curse in genetic association studies . PLoS Genet . 2023 ; 19 ( 7 ): e1010546 . OpenUrl CrossRef PubMed 15. ↵ Bycroft C , Freeman C , Petkova D , Band G , Elliott LT , Sharp K , et al. The UK Biobank resource with deep phenotyping and genomic data . Nature . 2018 ; 562 ( 7726 ): 203 – 9 . OpenUrl CrossRef PubMed 16. ↵ Boehm FJ , Zhou X. Statistical methods for Mendelian randomization in genome-wide association studies: a review . Comput Struct Biotechnol J . 2022 ; 20 : 2338 – 51 . OpenUrl CrossRef PubMed 17. ↵ Purcell S , Neale B , Todd-Brown K , Thomas L , Ferreira MAR , Bender D , et al. PLINK: a tool set for whole-genome association and population-based linkage analyses . Am J Hum Genet . 2007 ; 81 ( 3 ): 559 – 75 . OpenUrl CrossRef PubMed 18. ↵ Sadreev II , Lepik K , Richmond RC , Palmer TM , Davey Smith G , Holmes MV , et al. Navigating sample overlap, winner’s curse and weak instrument bias in Mendelian randomization studies using the UK Biobank . medRxiv . 2021 . doi: 10.1101/2021.09.17.21263612 . OpenUrl Abstract / FREE Full Text 19. Thomas DC , Lawlor DA , Thompson JR . Re: Estimation of bias in nongenetic observational studies using “Mendelian triangulation” by Bautista et al . Ann Epidemiol . 2007 ; 17 ( 7 ): 511 – 3 . OpenUrl CrossRef PubMed Web of Science 20. Burgess S , Butterworth A , Thompson SG . Mendelian randomization analysis with multiple genetic variants using summarized data . Genet Epidemiol . 2013 ; 37 ( 7 ): 658 – 65 . OpenUrl CrossRef PubMed 21. Pierce BL , Burgess S. Efficient design for Mendelian randomization studies: subsample and 2-sample instrumental variable estimators . Am J Epidemiol . 2013 ; 178 ( 7 ): 1177 – 84 . OpenUrl CrossRef PubMed Web of Science 22. ↵ Ye T , Shao J , Kang H. Debiased inverse-variance weighted estimator in two-sample summary-data Mendelian randomization . Ann Stat . 2021 ; 49 ( 4 ): 2079 – 110 . OpenUrl 23. ↵ Corbin LJ , Richmond RC , Wade KH , Burgess S , Bowden J , Davey Smith G , et al. BMI as a modifiable risk factor for type 2 diabetes: refining and understanding causal estimates using Mendelian randomization . Diabetes . 2016 ; 65 ( 10 ): 3002 – 7 . OpenUrl Abstract / FREE Full Text 24. ↵ Ma X , Wang J , Wu C. Breaking the winner’s curse in Mendelian randomization: rerandomized inverse variance weighted estimator . Ann Stat . 2023 ; 51 ( 1 ): 211 – 32 . OpenUrl 25. ↵ Burgess S , Woolf B , Mason AM , Gill D , Davey Smith G , Lawlor DA , et al. Addressing the credibility crisis in Mendelian randomization . BMC Med . 2024 ; 22 ( 1 ): 374 . OpenUrl CrossRef PubMed View the discussion thread. Back to top Previous Next Posted November 05, 2025. Download PDF Email Thank you for your interest in spreading the word about bioRxiv. NOTE: Your email address is requested solely to identify you as the sender of this article. Your Email * Your Name * Send To * Enter multiple addresses on separate lines or separate them with commas. You are going to email the following Simulated sample splitting approach to address biases due to instrument selection and participant overlap in two-sample Mendelian Randomization studies Message Subject (Your Name) has forwarded a page to you from bioRxiv Message Body (Your Name) thought you would like to see this page from the bioRxiv website. Your Personal Message CAPTCHA This question is for testing whether or not you are a human visitor and to prevent automated spam submissions. Share Simulated sample splitting approach to address biases due to instrument selection and participant overlap in two-sample Mendelian Randomization studies Amanda Forde , Gibran Hemani , John Ferguson bioRxiv 2025.11.04.686460; doi: https://doi.org/10.1101/2025.11.04.686460 Share This Article: Copy Citation Tools Simulated sample splitting approach to address biases due to instrument selection and participant overlap in two-sample Mendelian Randomization studies Amanda Forde , Gibran Hemani , John Ferguson bioRxiv 2025.11.04.686460; doi: https://doi.org/10.1101/2025.11.04.686460 Citation Manager Formats BibTeX Bookends EasyBib EndNote (tagged) EndNote 8 (xml) Medlars Mendeley Papers RefWorks Tagged Ref Manager RIS Zotero Tweet Widget Facebook Like Google Plus One Subject Area Genetics Subject Areas All Articles Animal Behavior and Cognition (7624) Biochemistry (17650) Bioengineering (13871) Bioinformatics (41882) Biophysics (21424) Cancer Biology (18566) Cell Biology (25461) Clinical Trials (138) Developmental Biology (13365) Ecology (19867) Epidemiology (2067) Evolutionary Biology (24290) Genetics (15590) Genomics (22476) Immunology (17713) Microbiology (40331) Molecular Biology (17148) Neuroscience (88477) Paleontology (666) Pathology (2828) Pharmacology and Toxicology (4816) Physiology (7635) Plant Biology (15114) Scientific Communication and Education (2044) Synthetic Biology (4286) Systems Biology (9815) Zoology (2268)

Text is read by the "Ask this paper" AI Q&A widget below. Extraction quality varies by source — PMC NXML preserves structure cleanly, OA-HTML may include some navigation residue, and OA-PDF can have broken hyphenation. The publisher copy (via DOI) is the canonical version.

My notes (saved in your browser only)

⚙ Ask this paper AI returns verbatim quotes from the full text · source: preprint-html ⓘ

Answers must be backed by verbatim quotes from this paper's full text. Hallucinated quotes are dropped automatically; if no verbatim passage answers the question, we say so. How this works

Citation neighborhood (no data yet)

We don't have any in-corpus citations linked to this paper yet. This is a recent paper (2025) — citers typically take a year or two to land, and the OpenAlex reference graph may still be filling in.

Source provenance

europepmc: last seen: 2026-05-20T01:45:00.602351+00:00