<?xml version="1.0" encoding="utf-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD v1.1d3 20150301//EN" "http://jats.nlm.nih.gov/publishing/1.1d3/JATS-journalpublishing1.dtd">
<article article-type="research-article" dtd-version="1.1d3" xml:lang="en" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink">
<front>
<journal-meta>
<journal-id journal-id-type="nlm-ta">PLoS Genet</journal-id>
<journal-id journal-id-type="publisher-id">plos</journal-id>
<journal-id journal-id-type="pmc">plosgen</journal-id>
<journal-title-group>
<journal-title>PLOS Genetics</journal-title>
</journal-title-group>
<issn pub-type="ppub">1553-7390</issn>
<issn pub-type="epub">1553-7404</issn>
<publisher>
<publisher-name>Public Library of Science</publisher-name>
<publisher-loc>San Francisco, CA USA</publisher-loc>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="publisher-id">PGENETICS-D-20-00907</article-id>
<article-id pub-id-type="doi">10.1371/journal.pgen.1009575</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Research Article</subject>
</subj-group>
<subj-group subj-group-type="Discipline-v3">
<subject>Medicine and health sciences</subject><subj-group><subject>Epidemiology</subject><subj-group><subject>Medical risk factors</subject></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3">
<subject>Biology and life sciences</subject><subj-group><subject>Computational biology</subject><subj-group><subject>Genome analysis</subject><subj-group><subject>Genome-wide association studies</subject></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3">
<subject>Biology and life sciences</subject><subj-group><subject>Genetics</subject><subj-group><subject>Genomics</subject><subj-group><subject>Genome analysis</subject><subj-group><subject>Genome-wide association studies</subject></subj-group></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3">
<subject>Biology and life sciences</subject><subj-group><subject>Genetics</subject><subj-group><subject>Human genetics</subject><subj-group><subject>Genome-wide association studies</subject></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3">
<subject>Medicine and health sciences</subject><subj-group><subject>Medical conditions</subject><subj-group><subject>Cardiovascular diseases</subject><subj-group><subject>Cardiovascular disease risk</subject></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3">
<subject>Medicine and health sciences</subject><subj-group><subject>Cardiology</subject><subj-group><subject>Cardiovascular medicine</subject><subj-group><subject>Cardiovascular diseases</subject><subj-group><subject>Cardiovascular disease risk</subject></subj-group></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3">
<subject>Biology and life sciences</subject><subj-group><subject>Biochemistry</subject><subj-group><subject>Proteins</subject><subj-group><subject>C-reactive proteins</subject></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3">
<subject>Biology and life sciences</subject><subj-group><subject>Genetics</subject><subj-group><subject>Genetics of disease</subject></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3">
<subject>Medicine and health sciences</subject><subj-group><subject>Epidemiology</subject><subj-group><subject>Medical risk factors</subject><subj-group><subject>Cancer risk factors</subject></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3">
<subject>Medicine and health sciences</subject><subj-group><subject>Oncology</subject><subj-group><subject>Cancer risk factors</subject></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3">
<subject>Biology and life sciences</subject><subj-group><subject>Genetics</subject><subj-group><subject>Genetics of disease</subject><subj-group><subject>Genetic predisposition</subject></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3">
<subject>Biology and life sciences</subject><subj-group><subject>Genetics</subject></subj-group></subj-group></article-categories>
<title-group>
<article-title>Causal inference for heritable phenotypic risk factors using heterogeneous genetic instruments</article-title>
<alt-title alt-title-type="running-head">Causal inference for heritable phenotypic risk factors using heterogeneous genetic instruments</alt-title>
</title-group>
<contrib-group>
<contrib contrib-type="author" corresp="yes" xlink:type="simple">
<contrib-id authenticated="true" contrib-id-type="orcid">https://orcid.org/0000-0002-1968-6888</contrib-id>
<name name-style="western">
<surname>Wang</surname> <given-names>Jingshu</given-names></name>
<role content-type="https://casrai.org/credit/">Conceptualization</role>
<role content-type="https://casrai.org/credit/">Data curation</role>
<role content-type="https://casrai.org/credit/">Formal analysis</role>
<role content-type="https://casrai.org/credit/">Methodology</role>
<role content-type="https://casrai.org/credit/">Software</role>
<role content-type="https://casrai.org/credit/">Validation</role>
<role content-type="https://casrai.org/credit/">Visualization</role>
<role content-type="https://casrai.org/credit/">Writing – original draft</role>
<role content-type="https://casrai.org/credit/">Writing – review &amp; editing</role>
<xref ref-type="aff" rid="aff001"><sup>1</sup></xref>
<xref ref-type="corresp" rid="cor001">*</xref>
</contrib>
<contrib contrib-type="author" xlink:type="simple">
<contrib-id authenticated="true" contrib-id-type="orcid">https://orcid.org/0000-0001-9902-2768</contrib-id>
<name name-style="western">
<surname>Zhao</surname> <given-names>Qingyuan</given-names></name>
<role content-type="https://casrai.org/credit/">Conceptualization</role>
<role content-type="https://casrai.org/credit/">Methodology</role>
<role content-type="https://casrai.org/credit/">Writing – review &amp; editing</role>
<xref ref-type="aff" rid="aff002"><sup>2</sup></xref>
</contrib>
<contrib contrib-type="author" xlink:type="simple">
<contrib-id authenticated="true" contrib-id-type="orcid">https://orcid.org/0000-0003-2628-3304</contrib-id>
<name name-style="western">
<surname>Bowden</surname> <given-names>Jack</given-names></name>
<role content-type="https://casrai.org/credit/">Methodology</role>
<role content-type="https://casrai.org/credit/">Writing – review &amp; editing</role>
<xref ref-type="aff" rid="aff003"><sup>3</sup></xref>
</contrib>
<contrib contrib-type="author" xlink:type="simple">
<contrib-id authenticated="true" contrib-id-type="orcid">https://orcid.org/0000-0003-0920-1055</contrib-id>
<name name-style="western">
<surname>Hemani</surname> <given-names>Gibran</given-names></name>
<role content-type="https://casrai.org/credit/">Resources</role>
<role content-type="https://casrai.org/credit/">Writing – review &amp; editing</role>
<xref ref-type="aff" rid="aff004"><sup>4</sup></xref>
</contrib>
<contrib contrib-type="author" xlink:type="simple">
<contrib-id authenticated="true" contrib-id-type="orcid">https://orcid.org/0000-0002-1407-8314</contrib-id>
<name name-style="western">
<surname>Davey Smith</surname> <given-names>George</given-names></name>
<role content-type="https://casrai.org/credit/">Methodology</role>
<role content-type="https://casrai.org/credit/">Validation</role>
<role content-type="https://casrai.org/credit/">Writing – review &amp; editing</role>
<xref ref-type="aff" rid="aff004"><sup>4</sup></xref>
</contrib>
<contrib contrib-type="author" xlink:type="simple">
<name name-style="western">
<surname>Small</surname> <given-names>Dylan S.</given-names></name>
<role content-type="https://casrai.org/credit/">Methodology</role>
<role content-type="https://casrai.org/credit/">Writing – review &amp; editing</role>
<xref ref-type="aff" rid="aff005"><sup>5</sup></xref>
</contrib>
<contrib contrib-type="author" xlink:type="simple">
<contrib-id authenticated="true" contrib-id-type="orcid">https://orcid.org/0000-0002-0880-5749</contrib-id>
<name name-style="western">
<surname>Zhang</surname> <given-names>Nancy R.</given-names></name>
<role content-type="https://casrai.org/credit/">Conceptualization</role>
<role content-type="https://casrai.org/credit/">Writing – original draft</role>
<role content-type="https://casrai.org/credit/">Writing – review &amp; editing</role>
<xref ref-type="aff" rid="aff005"><sup>5</sup></xref>
</contrib>
</contrib-group>
<aff id="aff001">
<label>1</label>
<addr-line>Department of Statistics, University of Chicago, Chicago, Illinois, United States of America</addr-line>
</aff>
<aff id="aff002">
<label>2</label>
<addr-line>Department of Pure Mathematics and Mathematical Statistics, University of Cambridge, Cambridge, United Kingdom</addr-line>
</aff>
<aff id="aff003">
<label>3</label>
<addr-line>College of Medicine and Health, University of Exeter, Exeter, United Kingdom</addr-line>
</aff>
<aff id="aff004">
<label>4</label>
<addr-line>MRC Integrative Epidemiology Unit, University of Bristol, Bristol, United Kingdom</addr-line>
</aff>
<aff id="aff005">
<label>5</label>
<addr-line>Department of Statistics, University of Pennsylvania, Philadelphia, Pennsylvania, United States of America</addr-line>
</aff>
<contrib-group>
<contrib contrib-type="editor" xlink:type="simple">
<name name-style="western">
<surname>Zhu</surname> <given-names>Xiaofeng</given-names></name>
<role>Editor</role>
<xref ref-type="aff" rid="edit1"/>
</contrib>
</contrib-group>
<aff id="edit1">
<addr-line>Case Western Reserve University, UNITED STATES</addr-line>
</aff>
<author-notes>
<fn fn-type="conflict" id="coi001">
<p>The authors have declared that no competing interests exist.</p>
</fn>
<corresp id="cor001">* E-mail: <email xlink:type="simple">jingshuw@uchicago.edu</email></corresp>
</author-notes>
<pub-date pub-type="collection">
<month>6</month>
<year>2021</year>
</pub-date>
<pub-date pub-type="epub">
<day>22</day>
<month>6</month>
<year>2021</year>
</pub-date>
<volume>17</volume>
<issue>6</issue>
<elocation-id>e1009575</elocation-id>
<history>
<date date-type="received">
<day>7</day>
<month>6</month>
<year>2020</year>
</date>
<date date-type="accepted">
<day>4</day>
<month>5</month>
<year>2021</year>
</date>
</history>
<permissions>
<copyright-year>2021</copyright-year>
<copyright-holder>Wang et al</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/" xlink:type="simple">
<license-p>This is an open access article distributed under the terms of the <ext-link ext-link-type="uri" xlink:href="http://creativecommons.org/licenses/by/4.0/" xlink:type="simple">Creative Commons Attribution License</ext-link>, which permits unrestricted use, distribution, and reproduction in any medium, provided the original author and source are credited.</license-p>
</license>
</permissions>
<self-uri content-type="pdf" xlink:href="info:doi/10.1371/journal.pgen.1009575"/>
<abstract>
<p>Over a decade of genome-wide association studies (GWAS) have led to the finding of extreme polygenicity of complex traits. The phenomenon that “all genes affect every complex trait” complicates Mendelian Randomization (MR) studies, where natural genetic variations are used as instruments to infer the causal effect of heritable risk factors. We reexamine the assumptions of existing MR methods and show how they need to be clarified to allow for pervasive horizontal pleiotropy and heterogeneous effect sizes. We propose a comprehensive framework GRAPPLE to analyze the causal effect of target risk factors with heterogeneous genetic instruments and identify possible pleiotropic patterns from data. By using GWAS summary statistics, GRAPPLE can efficiently use both strong and weak genetic instruments, detect the existence of multiple pleiotropic pathways, determine the causal direction and perform multivariable MR to adjust for confounding risk factors. With GRAPPLE, we analyze the effect of blood lipids, body mass index, and systolic blood pressure on 25 disease outcomes, gaining new information on their causal relationships and potential pleiotropic pathways involved.</p>
</abstract>
<abstract abstract-type="summary">
<title>Author summary</title>
<p>Mendelian randomization uses genetic variants related to a modifiable risk factor to obtain evidence regarding its causal influence on disease from observational studies. However, the highly polygenic nature of complex traits where almost all genes contribute to every complex trait challenges the reliability of the causal inference from these genetic variants. In this paper, we give a thorough reexamination of the assumptions that can be reasonably made for Mendelian randomization and propose a framework, GRAPPLE, to gain power by using both strongly and weakly associated SNPs and to identify confounding pleiotropic pathways from hidden risk factors. With GRAPPLE, we analyze the effect of blood lipids, body mass index, and systolic blood pressure on 25 diseases, gaining an improved understanding of these risk factors.</p>
</abstract>
<funding-group>
<funding-statement>GDS/GH work in the Medical Research Council Integrative Epidemiology Unit at the University of Bristol MC_UU_00011/1. DSS is supported by NIH grant 1R01AG065276-01. The funders had no role in study design, data collection and analysis, decision to publish, or preparation of the manuscript.</funding-statement>
</funding-group>
<counts>
<fig-count count="3"/>
<table-count count="0"/>
<page-count count="24"/>
</counts>
<custom-meta-group>
<custom-meta>
<meta-name>PLOS Publication Stage</meta-name>
<meta-value>vor-update-to-uncorrected-proof</meta-value>
</custom-meta>
<custom-meta>
<meta-name>Publication Update</meta-name>
<meta-value>2021-07-23</meta-value>
</custom-meta>
<custom-meta id="data-availability">
<meta-name>Data Availability</meta-name>
<meta-value>All data used are publicly available and details of the data sources are listed in the <xref ref-type="supplementary-material" rid="pgen.1009575.s009">S3 Text</xref>.</meta-value>
</custom-meta>
</custom-meta-group>
</article-meta>
</front>
<body>
<sec id="sec001" sec-type="intro">
<title>Introduction</title>
<p>Understanding the pathogenic mechanism of common diseases is a fundamental goal in clinical research. As randomized controlled experiments are not always feasible, researchers are looking towards Mendelian Randomization (MR) as an alternative method for probing the causal mechanisms of common diseases [<xref ref-type="bibr" rid="pgen.1009575.ref001">1</xref>]. MR uses inherited genetic variations as instrumental variables (IV) to interrogate the causal effect of heritable risk factor(s) on the disease of interest. The basic idea is that at these variant loci, the inherited alleles are randomly transmitted from the parents to their offsprings according to Mendel’s laws. Thus, the genotypes are independent from non-heritable confounding variables which may obfuscate causal estimation in parent-offspring studies. More generally, such independence also approximately holds for population data such as those collected in genome-wide association studies (GWAS) when individuals share the same ancestry [<xref ref-type="bibr" rid="pgen.1009575.ref002">2</xref>]. With the accumulation of data from GWAS, there is increasing interest in MR approaches, especially in approaches that only rely on GWAS summary statistics that are publicly available [<xref ref-type="bibr" rid="pgen.1009575.ref002">2</xref>, <xref ref-type="bibr" rid="pgen.1009575.ref003">3</xref>].</p>
<p>How well Mendelian Randomization works depends on how well the genetic variant loci used as instruments abide by the rules of IV. These rules dictate that, if the genetic locus has an effect on the disease outcome, it should be only through pathways mediated by the risk factor(s) of interest. This rule, termed exclusion restriction, is violated when there is horizontal pleiotropy, defined as the case where the genetic variant can influence the disease through pathways other than the given risk factor(s) [<xref ref-type="bibr" rid="pgen.1009575.ref004">4</xref>]. There has been much recent attention on this issue [<xref ref-type="bibr" rid="pgen.1009575.ref005">5</xref>–<xref ref-type="bibr" rid="pgen.1009575.ref016">16</xref>] in MR, yet our understanding is far from complete. Current methods rely on different assumptions on the pattern of horizontal pleiotropy, often driven by statistical convenience rather than what geneticists have learned from real data. What assumptions on pleiotropy and genetic effects would be suitable? Would it be possible to learn the degree of pleiotropy from the data? Could we perform model diagnosis utilizing only GWAS summary statistics?</p>
<p>The pleiotropy issue that muddles Mendelian Randomization studies is, in a large part, due to the fact that complex traits are extremely polygenic [<xref ref-type="bibr" rid="pgen.1009575.ref015">15</xref>, <xref ref-type="bibr" rid="pgen.1009575.ref017">17</xref>–<xref ref-type="bibr" rid="pgen.1009575.ref024">24</xref>]. Accumulating evidence from GWAS studies indicates that many complex diseases may have an omnigenic architecture where all genes affect every complex trait [<xref ref-type="bibr" rid="pgen.1009575.ref025">25</xref>]. While a few genes might be “core” genes, a large proportion of genes may have non-zero effects on diseases and their risk factors. Thus, in an MR study, many genetic instruments, if not all, may affect the disease through their effects on other unmeasured risk factors. In other words, in an MR analysis, not only would we expect horizontal pleiotropy to be a pervasive issue across all genetic variants, any disease or complex risk factor would also be associated with a large number of SNPs across the whole genome. Many existing MR methods rely on the assumption that pleiotropic effects sparsely involve only a few SNPs, which directly counters these recent insights. Methods that don’t assume sparsity often require the instrument strength independent of direct effect (InSIDE) assumption [<xref ref-type="bibr" rid="pgen.1009575.ref006">6</xref>], which can be rather optimistic. Recently, a few new methods relaxed the InSIDE assumption to consider “correlated pleiotropy” through one pleiotropic pathway [<xref ref-type="bibr" rid="pgen.1009575.ref011">11</xref>, <xref ref-type="bibr" rid="pgen.1009575.ref012">12</xref>, <xref ref-type="bibr" rid="pgen.1009575.ref015">15</xref>, <xref ref-type="bibr" rid="pgen.1009575.ref026">26</xref>]. However, when pleiotropic pathways exist, there would often be an issue in identifying the true causal effect of the risk factor, and most methods are restricted to allow for only one pleiotropy pathway. Armed with these assumptions, most existing methods also utilize only the few SNPs that have the strongest association with the risk factor as instruments, ignoring the SNPs that are weakly associated. In this work, we will show that weakly associated SNPs are also informative, and that a model combining weak and strong SNPs can increase the accuracy and stability of our estimations in some scenarios.</p>
<p>We propose a comprehensive statistical framework for causal effect estimation under the realistic assumption that pleiotropy may be pervasive across the genome. The framework, called GRAPPLE (Genome-wide mR Analysis under Pervasive PLEiotropy), facilitates interactive identification of multiple pleiotropic pathways and incorporates all SNPs associated with the risk factor at varying p-value thresholds into the analysis. GRAPPLE builds upon a previous statistical framework we developed called MR-RAPS [<xref ref-type="bibr" rid="pgen.1009575.ref010">10</xref>] under the InSIDE assumption, but is much more comprehensive and flexible. GRAPPLE emphasizes the detection of multiple pleiotropic pathways when the InSIDE assumption is violated as well as the determination of the causal direction. GRAPPLE further addresses two common challenges: how to jointly estimate the effects with multiple risk factors to reduce correlated pleiotropy, and how to integrate cohorts with overlapping samples. The estimation accuracy of GRAPPLE is examined through validations involving both real studies and simulations.</p>
<p>We apply GRAPPLE to investigate the causal effects of 5 risk factors (three plasma lipid traits, body mass index, and systolic blood pressure) on 25 common diseases. Although there have been several causal effect screening studies [<xref ref-type="bibr" rid="pgen.1009575.ref009">9</xref>, <xref ref-type="bibr" rid="pgen.1009575.ref015">15</xref>, <xref ref-type="bibr" rid="pgen.1009575.ref026">26</xref>] for these risk factors and diseases, the multi-modality analysis enabled by GRAPPLE brings forth new insights on the pleiotropic landscape of these diseases and, thus, an improved understanding of the causal risk factors. Specifically, we will reexamine the role of lipid traits on coronary artery disease and type-II diabetes, where the results from MR studies have been under heated debate [<xref ref-type="bibr" rid="pgen.1009575.ref002">2</xref>, <xref ref-type="bibr" rid="pgen.1009575.ref027">27</xref>, <xref ref-type="bibr" rid="pgen.1009575.ref028">28</xref>]. The R package GRAPPLE is publicly available for installation at <ext-link ext-link-type="uri" xlink:href="https://github.com/jingshuw/GRAPPLE" xlink:type="simple">https://github.com/jingshuw/GRAPPLE</ext-link>.</p>
</sec>
<sec id="sec002" sec-type="results">
<title>Results</title>
<sec id="sec003">
<title>Model overview</title>
<sec id="sec004">
<title>From the causal model to GWAS summary statistics</title>
<p>Our framework starts with a set of structural equations that jointly specify the generative model on the disease <italic>Y</italic> that relies on <italic>K</italic> observed risk factors <bold><italic>X</italic></bold> = (<italic>X</italic><sub>1</sub>, ⋯, <italic>X</italic><sub><italic>K</italic></sub>) of interest, and the vector <bold><italic>Z</italic></bold> = (<italic>Z</italic><sub>1</sub>, <italic>Z</italic><sub>2</sub>, ⋯) containing all genetic information of an individual (<xref ref-type="fig" rid="pgen.1009575.g001">Fig 1a</xref>).
<disp-formula id="pgen.1009575.e001"><alternatives><graphic id="pgen.1009575.e001g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009575.e001" xlink:type="simple"/><mml:math display="block" id="M1"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="right"><mml:mi>Y</mml:mi></mml:mtd> <mml:mtd columnalign="left"><mml:mrow><mml:mo>=</mml:mo> <mml:msup><mml:mi mathvariant="bold-italic">X</mml:mi> <mml:mi>T</mml:mi></mml:msup> <mml:mi mathvariant="bold-italic">β</mml:mi> <mml:mo>+</mml:mo> <mml:mi>f</mml:mi> <mml:mrow><mml:mo>(</mml:mo> <mml:mi mathvariant="bold-italic">U</mml:mi> <mml:mo>,</mml:mo> <mml:mi mathvariant="bold-italic">Z</mml:mi> <mml:mo>,</mml:mo> <mml:msub><mml:mi>E</mml:mi> <mml:mi>Y</mml:mi></mml:msub> <mml:mo>)</mml:mo></mml:mrow> <mml:mspace width="1em"/><mml:mrow><mml:mo>(</mml:mo> <mml:mtext>if</mml:mtext> <mml:mspace width="4pt"/><mml:mi>Y</mml:mi> <mml:mspace width="4pt"/><mml:mtext>is</mml:mtext> <mml:mspace width="4pt"/><mml:mtext>a</mml:mtext> <mml:mspace width="4pt"/><mml:mtext>continuous</mml:mtext> <mml:mspace width="4pt"/><mml:mtext>trait</mml:mtext> <mml:mo>)</mml:mo></mml:mrow></mml:mrow></mml:mtd></mml:mtr> <mml:mtr><mml:mtd columnalign="right"><mml:mrow><mml:mtext>logit</mml:mtext> <mml:mo>[</mml:mo> <mml:mi>P</mml:mi> <mml:mo>(</mml:mo> <mml:mi>Y</mml:mi> <mml:mo>=</mml:mo> <mml:mn>1</mml:mn> <mml:mo>)</mml:mo> <mml:mo>]</mml:mo></mml:mrow></mml:mtd> <mml:mtd columnalign="left"><mml:mrow><mml:mo>=</mml:mo> <mml:msup><mml:mi mathvariant="bold-italic">X</mml:mi> <mml:mi>T</mml:mi></mml:msup> <mml:mi mathvariant="bold-italic">β</mml:mi> <mml:mo>+</mml:mo> <mml:mi>f</mml:mi> <mml:mrow><mml:mo>(</mml:mo> <mml:mi mathvariant="bold-italic">U</mml:mi> <mml:mo>,</mml:mo> <mml:mi mathvariant="bold-italic">Z</mml:mi> <mml:mo>,</mml:mo> <mml:msub><mml:mi>E</mml:mi> <mml:mi>Y</mml:mi></mml:msub> <mml:mo>)</mml:mo></mml:mrow> <mml:mspace width="1em"/><mml:mrow><mml:mo>(</mml:mo> <mml:mtext>if</mml:mtext> <mml:mspace width="4pt"/><mml:mi>Y</mml:mi> <mml:mspace width="4pt"/><mml:mtext>is</mml:mtext> <mml:mspace width="4pt"/><mml:mtext>a</mml:mtext> <mml:mspace width="4pt"/><mml:mtext>binary</mml:mtext> <mml:mspace width="4pt"/><mml:mtext>trait</mml:mtext> <mml:mo>)</mml:mo></mml:mrow></mml:mrow></mml:mtd></mml:mtr> <mml:mtr><mml:mtd columnalign="right"><mml:msub><mml:mi>X</mml:mi> <mml:mi>k</mml:mi></mml:msub></mml:mtd> <mml:mtd columnalign="left"><mml:mrow><mml:mo>=</mml:mo> <mml:msub><mml:mi>g</mml:mi> <mml:mi>k</mml:mi></mml:msub> <mml:mrow><mml:mo>(</mml:mo> <mml:mi mathvariant="bold-italic">U</mml:mi> <mml:mo>,</mml:mo> <mml:mi mathvariant="bold-italic">Z</mml:mi> <mml:mo>,</mml:mo> <mml:msub><mml:mi>E</mml:mi> <mml:msub><mml:mi>X</mml:mi> <mml:mi>k</mml:mi></mml:msub></mml:msub> <mml:mo>)</mml:mo></mml:mrow> <mml:mo>,</mml:mo> <mml:mspace width="1em"/><mml:mi>k</mml:mi> <mml:mo>=</mml:mo> <mml:mn>1</mml:mn> <mml:mo>,</mml:mo> <mml:mo>⋯</mml:mo> <mml:mo>,</mml:mo> <mml:mi>K</mml:mi></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives> <label>(1)</label></disp-formula>
Here <bold><italic>U</italic></bold> represents unknown non-heritable confounding factors and <inline-formula id="pgen.1009575.e002"><alternatives><graphic id="pgen.1009575.e002g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009575.e002" xlink:type="simple"/><mml:math display="inline" id="M2"><mml:msub><mml:mi>E</mml:mi> <mml:msub><mml:mi>X</mml:mi> <mml:mi>k</mml:mi></mml:msub></mml:msub></mml:math></alternatives></inline-formula> and <italic>E</italic><sub><italic>Y</italic></sub> are random noise acting on <italic>X</italic><sub><italic>k</italic></sub> and <italic>Y</italic> respectively. The parameter of interest, <bold><italic>β</italic></bold>, quantifies the causal effect of the vector of risk factors <bold><italic>X</italic></bold> on <italic>Y</italic>. Mendel’s laws of inheritance suggest that the genotypes <bold><italic>Z</italic></bold> are randomized during conception and are generally independent of the environmental factors (<inline-formula id="pgen.1009575.e028"><alternatives><graphic id="pgen.1009575.e028g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009575.e028" xlink:type="simple"/><mml:math display="inline" id="M28"><mml:mrow><mml:mi mathvariant="bold-italic">U</mml:mi> <mml:mo>,</mml:mo> <mml:msub><mml:mi>E</mml:mi> <mml:mi>Y</mml:mi></mml:msub> <mml:mo>,</mml:mo> <mml:msub><mml:mi>E</mml:mi> <mml:msub><mml:mi>X</mml:mi> <mml:mi>k</mml:mi></mml:msub></mml:msub></mml:mrow></mml:math></alternatives></inline-formula>). The function <italic>f</italic>(<bold><italic>U</italic></bold>, <bold><italic>Z</italic></bold>, <italic>E</italic><sub><italic>Y</italic></sub>) represents the causal effect of unmeasured risk factors on <italic>Y</italic>, which can be heritable (contributed by <bold><italic>Z</italic></bold>) or non-heritable (contributed by <bold><italic>U</italic></bold>). The non-parametric functions <italic>f</italic>(⋅) and <italic>g</italic><sub><italic>k</italic></sub>(⋅) allow interactions among SNPs in <bold><italic>Z</italic></bold> and variables (<inline-formula id="pgen.1009575.e003"><alternatives><graphic id="pgen.1009575.e003g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009575.e003" xlink:type="simple"/><mml:math display="inline" id="M3"><mml:mrow><mml:mi mathvariant="bold-italic">U</mml:mi> <mml:mo>,</mml:mo> <mml:msub><mml:mi>E</mml:mi> <mml:mi>Y</mml:mi></mml:msub> <mml:mo>,</mml:mo> <mml:msub><mml:mi>E</mml:mi> <mml:msub><mml:mi>X</mml:mi> <mml:mi>k</mml:mi></mml:msub></mml:msub></mml:mrow></mml:math></alternatives></inline-formula>) in their causal effects on <bold><italic>X</italic></bold> and <italic>Y</italic>. Under this model, there is horizontal pleiotropy for a SNP <italic>j</italic> if <italic>Z</italic><sub><italic>j</italic></sub> has nonzero association with <italic>f</italic>(<bold><italic>U</italic></bold>, <bold><italic>Z</italic></bold>, <italic>E</italic><sub><italic>Y</italic></sub>). This is the case, for example, when <italic>Z</italic><sub><italic>j</italic></sub> acts on <italic>Y</italic> through a pathway affecting unmeasured risk factors, or when <italic>Z</italic><sub><italic>j</italic></sub> is in linkage disequilibrium (LD) with such a locus.</p>
<fig id="pgen.1009575.g001" position="float">
<object-id pub-id-type="doi">10.1371/journal.pgen.1009575.g001</object-id>
<label>Fig 1</label>
<caption>
<title>Model overview.</title>
<p><bold>a</bold>, The causal directed graph represented by structural equations (<xref ref-type="disp-formula" rid="pgen.1009575.e001">1</xref>). <bold>b</bold>, The existence of a pleiotropic pathway 2 (purple) can result in multiple modes of the profile likelihood. <bold>c</bold>, Multi-modality of the profile likelihood can reflect causal direction. <bold>d</bold>, The work-flow with GRAPPLE.</p>
</caption>
<graphic mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pgen.1009575.g001" xlink:type="simple"/>
</fig>
<p>Now consider the case where only GWAS summary statistics, i.e. the estimated marginal associations between each SNP <italic>j</italic> and the risk factors/disease traits, are available and there are in total <italic>p</italic> SNPs selected. Let Γ<sub><italic>j</italic></sub> be the true association between SNP <italic>j</italic> and <italic>Y</italic>, and <bold>γ</bold><sub><italic>j</italic></sub> be the vector of true marginal associations between SNP <italic>j</italic> and <bold><italic>X</italic></bold>. Later, we will denote their estimated values from GWAS summary statistics as <inline-formula id="pgen.1009575.e004"><alternatives><graphic id="pgen.1009575.e004g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009575.e004" xlink:type="simple"/><mml:math display="inline" id="M4"><mml:msub><mml:mover accent="true"><mml:mo>Γ</mml:mo> <mml:mo>^</mml:mo></mml:mover> <mml:mi>j</mml:mi></mml:msub></mml:math></alternatives></inline-formula> and <inline-formula id="pgen.1009575.e005"><alternatives><graphic id="pgen.1009575.e005g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009575.e005" xlink:type="simple"/><mml:math display="inline" id="M5"><mml:msub><mml:mover accent="true"><mml:mi>γ</mml:mi> <mml:mo>^</mml:mo></mml:mover> <mml:mi>j</mml:mi></mml:msub></mml:math></alternatives></inline-formula>. Then, as shown in Materials and Methods, the model (<xref ref-type="disp-formula" rid="pgen.1009575.e001">1</xref>) results in the linear relationship
<disp-formula id="pgen.1009575.e006"><alternatives><graphic id="pgen.1009575.e006g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009575.e006" xlink:type="simple"/><mml:math display="block" id="M6"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="right"><mml:mrow><mml:msub><mml:mo>Γ</mml:mo> <mml:mi>j</mml:mi></mml:msub> <mml:mo>=</mml:mo> <mml:msubsup><mml:mi>γ</mml:mi> <mml:mi>j</mml:mi> <mml:mi>T</mml:mi></mml:msubsup> <mml:mi mathvariant="bold-italic">β</mml:mi> <mml:mo>+</mml:mo> <mml:msub><mml:mi>α</mml:mi> <mml:mi>j</mml:mi></mml:msub></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives> <label>(2)</label></disp-formula>
where for binary <italic>Y</italic>, the parameter <bold><italic>β</italic></bold> in model (<xref ref-type="disp-formula" rid="pgen.1009575.e006">2</xref>) is a conservatively biased version of <bold><italic>β</italic></bold> in model (<xref ref-type="disp-formula" rid="pgen.1009575.e001">1</xref>). This relationship holds even when the functions <italic>f</italic>(⋅) and <italic>g</italic><sub><italic>k</italic></sub>(⋅) in (<xref ref-type="disp-formula" rid="pgen.1009575.e001">1</xref>) are not linear. Here, <italic>α</italic><sub><italic>j</italic></sub> is the marginal association between <italic>Z</italic><sub><italic>j</italic></sub> and <italic>f</italic>(<bold><italic>U</italic></bold>, <bold><italic>Z</italic></bold>, <italic>E</italic><sub><italic>Y</italic></sub>), representing the unknown horizontal pleiotropy of SNP <italic>j</italic>.</p>
<p>One can immediately see that identifying <bold><italic>β</italic></bold> is impossible without further assumptions regarding <italic>α</italic><sub><italic>j</italic></sub>. Early MR methods such as IVW [<xref ref-type="bibr" rid="pgen.1009575.ref005">5</xref>] made the assumption that all instruments are valid satisfying <italic>α</italic><sub><italic>j</italic></sub> = 0. Other methods such as Weighted Median [<xref ref-type="bibr" rid="pgen.1009575.ref007">7</xref>] or MR-PRSSO [<xref ref-type="bibr" rid="pgen.1009575.ref009">9</xref>] assume that <italic>α</italic><sub><italic>j</italic></sub> is sparsely nonzero. However, the no or sparse pleiotropy assumption follows from statistical convenience rather than biological insights. As discussed in Introduction, horizontal pleiotropy is pervasive for most complex traits. One assumption that allows pervasive pleiotropy is to assume the InSIDE assumption [<xref ref-type="bibr" rid="pgen.1009575.ref006">6</xref>] where <inline-formula id="pgen.1009575.e007"><alternatives><graphic id="pgen.1009575.e007g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009575.e007" xlink:type="simple"/><mml:math display="inline" id="M7"><mml:mrow><mml:msub><mml:mi>α</mml:mi> <mml:mi>j</mml:mi></mml:msub></mml:mrow><mml:mo>⫫</mml:mo> <mml:msub><mml:mo>γ</mml:mo> <mml:mi>j</mml:mi></mml:msub></mml:math></alternatives></inline-formula>, or alternatively, the random effect model [<xref ref-type="bibr" rid="pgen.1009575.ref010">10</xref>, <xref ref-type="bibr" rid="pgen.1009575.ref016">16</xref>] where <inline-formula id="pgen.1009575.e008"><alternatives><graphic id="pgen.1009575.e008g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009575.e008" xlink:type="simple"/><mml:math display="inline" id="M8"><mml:mrow><mml:msub><mml:mi>α</mml:mi> <mml:mi>j</mml:mi></mml:msub> <mml:mo>∼</mml:mo> <mml:mi mathvariant="script">N</mml:mi> <mml:mrow><mml:mo>(</mml:mo> <mml:mn>0</mml:mn> <mml:mo>,</mml:mo> <mml:msup><mml:mi>τ</mml:mi> <mml:mn>2</mml:mn></mml:msup> <mml:mo>)</mml:mo></mml:mrow></mml:mrow></mml:math></alternatives></inline-formula> for most genetic instruments. Unfortunately, the InSIDE assumption can be easily violated if the pleiotropic effects of selected genetic variants are driven by shared pleiotropic mechanisms.</p>
<p>Some more recent MR methods such as LCV [<xref ref-type="bibr" rid="pgen.1009575.ref026">26</xref>], MRMix [<xref ref-type="bibr" rid="pgen.1009575.ref012">12</xref>], Contamination mixture [<xref ref-type="bibr" rid="pgen.1009575.ref013">13</xref>] and CAUSE [<xref ref-type="bibr" rid="pgen.1009575.ref015">15</xref>] have noticed this limitation of the InSIDE assumption and allow a subset of the genetic instruments to be associated with a common hidden pleiotropic pathway. For instance, using the above notation, both CAUSE and MRMix assumed that when for the SNPs that violate the inSIDE assumption, their pleiotropic effects satisfy <inline-formula id="pgen.1009575.e009"><alternatives><graphic id="pgen.1009575.e009g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009575.e009" xlink:type="simple"/><mml:math display="inline" id="M9"><mml:mrow><mml:msub><mml:mi>α</mml:mi> <mml:mi>j</mml:mi></mml:msub> <mml:mo>=</mml:mo> <mml:mi>a</mml:mi> <mml:msub><mml:mi>γ</mml:mi> <mml:mi>j</mml:mi></mml:msub> <mml:mo>+</mml:mo> <mml:msub><mml:mover accent="true"><mml:mi>α</mml:mi> <mml:mo>˜</mml:mo></mml:mover> <mml:mi>j</mml:mi></mml:msub></mml:mrow></mml:math></alternatives></inline-formula> (when <italic>K</italic> = 1) where <italic>aγ</italic><sub><italic>j</italic></sub> represents the correlated pleiotropic effects due to a confounding pathway and <inline-formula id="pgen.1009575.e010"><alternatives><graphic id="pgen.1009575.e010g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009575.e010" xlink:type="simple"/><mml:math display="inline" id="M10"><mml:mrow><mml:msub><mml:mover accent="true"><mml:mi>α</mml:mi> <mml:mo>˜</mml:mo></mml:mover> <mml:mi>j</mml:mi></mml:msub></mml:mrow> <mml:mo>⫫</mml:mo> <mml:msub><mml:mo>γ</mml:mo> <mml:mi>j</mml:mi></mml:msub></mml:math></alternatives></inline-formula>. This is a more realistic assumption than InSIDE, though there would then be an issue in distinguishing the true causal effect <italic>β</italic> from the pleiotropic direction <italic>β</italic> + <italic>a</italic>. Allowing for only one pleiotropic pathway also makes the model restrictive for real datasets.</p>
</sec>
<sec id="sec005">
<title>Identify multiple pleiotropic pathways and the direction of causality</title>
<p>The key idea underlying GRAPPLE is that multiple pleiotropic pathways can be detected by using the shape of the profile likelihood function under no pleiotropy assumption. This allows us to probe the underlying causal mechanism, without explicit assumptions on pleiotropic patterns (<xref ref-type="fig" rid="pgen.1009575.g001">Fig 1b</xref>). When <italic>K</italic> = 1, the GWAS summary statistics reduce to the scalar <inline-formula id="pgen.1009575.e011"><alternatives><graphic id="pgen.1009575.e011g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009575.e011" xlink:type="simple"/><mml:math display="inline" id="M11"><mml:msub><mml:mover accent="true"><mml:mi>γ</mml:mi> <mml:mo>^</mml:mo></mml:mover> <mml:mi>j</mml:mi></mml:msub></mml:math></alternatives></inline-formula> and <inline-formula id="pgen.1009575.e012"><alternatives><graphic id="pgen.1009575.e012g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009575.e012" xlink:type="simple"/><mml:math display="inline" id="M12"><mml:msub><mml:mover accent="true"><mml:mo>Γ</mml:mo> <mml:mo>^</mml:mo></mml:mover> <mml:mi>j</mml:mi></mml:msub></mml:math></alternatives></inline-formula>, with their standard errors <italic>σ</italic><sub>1<italic>j</italic></sub> and <italic>σ</italic><sub>2<italic>j</italic></sub>. From the central limit theorem, the joint distribution of <inline-formula id="pgen.1009575.e013"><alternatives><graphic id="pgen.1009575.e013g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009575.e013" xlink:type="simple"/><mml:math display="inline" id="M13"><mml:mrow><mml:mo>(</mml:mo> <mml:msub><mml:mover accent="true"><mml:mi>γ</mml:mi> <mml:mo>^</mml:mo></mml:mover> <mml:mi>j</mml:mi></mml:msub> <mml:mo>,</mml:mo> <mml:msub><mml:mover accent="true"><mml:mo>Γ</mml:mo> <mml:mo>^</mml:mo></mml:mover> <mml:mi>j</mml:mi></mml:msub> <mml:mo>)</mml:mo></mml:mrow></mml:math></alternatives></inline-formula> approximately follows a multivariate normal distribution
<disp-formula id="pgen.1009575.e014"><alternatives><graphic id="pgen.1009575.e014g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009575.e014" xlink:type="simple"/><mml:math display="block" id="M14"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="right"><mml:mrow><mml:mo>(</mml:mo> <mml:mtable><mml:mtr><mml:mtd><mml:msub><mml:mover accent="true"><mml:mi>γ</mml:mi> <mml:mo>^</mml:mo></mml:mover> <mml:mi>j</mml:mi></mml:msub></mml:mtd></mml:mtr> <mml:mtr><mml:mtd><mml:msub><mml:mover accent="true"><mml:mo>Γ</mml:mo> <mml:mo>^</mml:mo></mml:mover> <mml:mi>j</mml:mi></mml:msub></mml:mtd></mml:mtr></mml:mtable> <mml:mo>)</mml:mo> <mml:mo>∼</mml:mo> <mml:mi mathvariant="script">N</mml:mi> <mml:mo>(</mml:mo> <mml:mo>(</mml:mo> <mml:mtable><mml:mtr><mml:mtd><mml:msub><mml:mi>γ</mml:mi> <mml:mi>j</mml:mi></mml:msub></mml:mtd></mml:mtr> <mml:mtr><mml:mtd><mml:msub><mml:mo>Γ</mml:mo> <mml:mi>j</mml:mi></mml:msub></mml:mtd></mml:mtr></mml:mtable> <mml:mo>)</mml:mo> <mml:mo>,</mml:mo> <mml:mo>(</mml:mo> <mml:mtable><mml:mtr><mml:mtd><mml:msubsup><mml:mi>σ</mml:mi> <mml:mrow><mml:mn>1</mml:mn> <mml:mi>j</mml:mi></mml:mrow> <mml:mn>2</mml:mn></mml:msubsup></mml:mtd> <mml:mtd><mml:mrow><mml:msub><mml:mi>σ</mml:mi> <mml:mrow><mml:mn>1</mml:mn> <mml:mi>j</mml:mi></mml:mrow></mml:msub> <mml:msub><mml:mi>σ</mml:mi> <mml:mrow><mml:mn>2</mml:mn> <mml:mi>j</mml:mi></mml:mrow></mml:msub> <mml:mi>θ</mml:mi></mml:mrow></mml:mtd></mml:mtr> <mml:mtr><mml:mtd><mml:mrow><mml:msub><mml:mi>σ</mml:mi> <mml:mrow><mml:mn>1</mml:mn> <mml:mi>j</mml:mi></mml:mrow></mml:msub> <mml:msub><mml:mi>σ</mml:mi> <mml:mrow><mml:mn>2</mml:mn> <mml:mi>j</mml:mi></mml:mrow></mml:msub> <mml:mi>θ</mml:mi></mml:mrow></mml:mtd> <mml:mtd><mml:msubsup><mml:mi>σ</mml:mi> <mml:mrow><mml:mn>2</mml:mn> <mml:mi>j</mml:mi></mml:mrow> <mml:mn>2</mml:mn></mml:msubsup></mml:mtd></mml:mtr></mml:mtable> <mml:mo>)</mml:mo> <mml:mo>)</mml:mo></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives> <label>(3)</label></disp-formula>
where <italic>θ</italic> is a shared sample correlation that can be estimated as <inline-formula id="pgen.1009575.e015"><alternatives><graphic id="pgen.1009575.e015g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009575.e015" xlink:type="simple"/><mml:math display="inline" id="M15"><mml:mover accent="true"><mml:mi>θ</mml:mi> <mml:mo>^</mml:mo></mml:mover></mml:math></alternatives></inline-formula> (see <xref ref-type="sec" rid="sec015">Materials and methods</xref>).</p>
<p>When there is no horizontal pleiotropy in the <italic>p</italic> selected independent genetic instruments (<italic>α</italic><sub><italic>j</italic></sub> = 0 for <italic>j</italic> = 1, 2, ⋯, <italic>p</italic>), the robust profile likelihood [<xref ref-type="bibr" rid="pgen.1009575.ref010">10</xref>] is given by,
<disp-formula id="pgen.1009575.e016"><alternatives><graphic id="pgen.1009575.e016g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009575.e016" xlink:type="simple"/><mml:math display="block" id="M16"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="right"><mml:mrow><mml:mi>l</mml:mi> <mml:mrow><mml:mo>(</mml:mo> <mml:mi>b</mml:mi> <mml:mo>)</mml:mo></mml:mrow> <mml:mo>=</mml:mo> <mml:mo>-</mml:mo> <mml:munderover><mml:mo>∑</mml:mo> <mml:mrow><mml:mi>j</mml:mi> <mml:mo>=</mml:mo> <mml:mn>1</mml:mn></mml:mrow> <mml:mi>p</mml:mi></mml:munderover> <mml:mi>ρ</mml:mi> <mml:mo>(</mml:mo> <mml:mfrac><mml:mrow><mml:msub><mml:mover accent="true"><mml:mo>Γ</mml:mo> <mml:mo>^</mml:mo></mml:mover> <mml:mi>j</mml:mi></mml:msub> <mml:mo>-</mml:mo> <mml:mi>b</mml:mi> <mml:msub><mml:mover accent="true"><mml:mi>γ</mml:mi> <mml:mo>^</mml:mo></mml:mover> <mml:mi>j</mml:mi></mml:msub></mml:mrow> <mml:msqrt><mml:mrow><mml:msubsup><mml:mi>σ</mml:mi> <mml:mrow><mml:mn>1</mml:mn> <mml:mi>j</mml:mi></mml:mrow> <mml:mn>2</mml:mn></mml:msubsup> <mml:mo>+</mml:mo> <mml:msup><mml:mi>b</mml:mi> <mml:mn>2</mml:mn></mml:msup> <mml:msubsup><mml:mi>σ</mml:mi> <mml:mrow><mml:mn>2</mml:mn> <mml:mi>j</mml:mi></mml:mrow> <mml:mn>2</mml:mn></mml:msubsup> <mml:mo>+</mml:mo> <mml:mn>2</mml:mn> <mml:mi>b</mml:mi> <mml:mover accent="true"><mml:mi>θ</mml:mi> <mml:mo>^</mml:mo></mml:mover> <mml:msub><mml:mi>σ</mml:mi> <mml:mrow><mml:mn>1</mml:mn> <mml:mi>j</mml:mi></mml:mrow></mml:msub> <mml:msub><mml:mi>σ</mml:mi> <mml:mrow><mml:mn>2</mml:mn> <mml:mi>j</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:msqrt></mml:mfrac> <mml:mo>)</mml:mo></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives> <label>(4)</label></disp-formula>
where <italic>ρ</italic>(⋅) is the Tukey’s Biweight loss, or any other robust loss functions. As described with more details in Materials and Methods, the profile likelihood is obtained by profiling out nuisance parameters <italic>γ</italic><sub>1</sub>, ⋯, <italic>γ</italic><sub><italic>p</italic></sub> in the full likelihood from (<xref ref-type="disp-formula" rid="pgen.1009575.e014">3</xref>), which is further robustified by replacing the <italic>L</italic><sub>2</sub> loss with Tukey’s Biweight loss to increase the sensitivity of mode detection. Under no pleiotropy or InSIDE assumption, this function <italic>l</italic>(<italic>b</italic>) should have only one mode near the true causal effect <italic>b</italic> = <italic>β</italic>.</p>
<p>Now consider the case where a second genetic pathway (Pathway 2) also contributes substantially to the disease, and some instrument loci are also associated with Pathway 2 (<xref ref-type="fig" rid="pgen.1009575.g001">Fig 1b</xref>). In this scenario, SNPs that are associated with <italic>X</italic> only through Pathway 2 can contribute to a second mode in the profile likelihood at location <italic>β</italic> + <italic>κ</italic>/<italic>δ</italic>, where <italic>κ</italic> and <italic>δ</italic> quantifies the causal effect of Pathway 2 on <italic>Y</italic> and its marginal association with <italic>X</italic>, respectively (Materials and Methods). Similarly, multiple pleiotropic pathways generally result in multiple modes of <italic>l</italic>(<italic>b</italic>). Thus, we can use multiple modes in a plot of <italic>l</italic>(<italic>b</italic>) to diagnose the presence of horizontal pleiotropic effects that are grouped by different pleiotropic pathways.</p>
<p>The existence of pleiotropic pathways complicates MR and makes the causal effects of the risk factors potentially unidentifiable. Specifically, when Pathway 2 exists, the GWAS summary statistics alone cannot provide information to distinguish <italic>β</italic> from <italic>β</italic> + <italic>κ</italic>/<italic>δ</italic>. Instead of making further untestable assumptions such as one pathway “dominates” the other, when multiple modes are detected, we suggest that whenever multiple modes are detected, the investigator should try to find biomarkers for each mode and collect more GWAS data to adjust for confounding risk factors. Specifically, GRAPPLE facilitates this by identifying marker SNPs of each mode, as well as the mapped genes and GWAS traits of each marker SNP (see <xref ref-type="sec" rid="sec015">Materials and methods</xref>). This allows researchers to use their expert knowledge to infer possible confounding risk factors that contribute to each mode. With GWAS summary statistics of these confounding traits, GRAPPLE can perform a multivariable MR analysis assuming the InSIDE assumption applies for the remaining horizontal pleiotropic effects (Materials and Methods).</p>
<p>The detection of multiple modes can be also used to determine the causal direction (<xref ref-type="fig" rid="pgen.1009575.g001">Fig 1c</xref>). If the wrong causal direction is specified in model (<xref ref-type="disp-formula" rid="pgen.1009575.e001">1</xref>) and <italic>Y</italic> is a cause of <italic>X</italic>, the genetic variants associated with <italic>X</italic> can be classified in two groups: those associated with <italic>X</italic> through <italic>Y</italic>, and those associated with <italic>X</italic> through another pathway unrelated to <italic>Y</italic>. In the former case, <italic>γ</italic><sub><italic>j</italic></sub> = <italic>β</italic>Γ<sub><italic>j</italic></sub> where <italic>β</italic> is the causal effect of <italic>Y</italic> on <italic>X</italic>, and these SNPs should contribute to a mode around 1/<italic>β</italic>. In the latter case, a SNP <italic>j</italic> satisfies <italic>γ</italic><sub><italic>j</italic></sub> ≠ 0 but Γ<sub><italic>j</italic></sub> = 0, and would contribute to a mode of <italic>l</italic>(<italic>b</italic>) at 0. Thus, there will be two modes in the robust profile likelihood with one mode being around 0. This idea can be viewed as an extension of the bidirectional MR [<xref ref-type="bibr" rid="pgen.1009575.ref029">29</xref>, <xref ref-type="bibr" rid="pgen.1009575.ref030">30</xref>]. Bidirectional MR is based on the assumptions that when <italic>X</italic> is a cause of <italic>Y</italic>, most of the genetic instruments for <italic>Y</italic> should be unassociated with <italic>X</italic>, because they affect <italic>Y</italic> through a different pathway, thus the reserve MR would indicate a zero effect of <italic>Y</italic> on <italic>X</italic>. GRAPPLE makes this inference more robust by making use of the fundamentally different shape of the robust profile likelihood plots in different directions. In the correct causal direction, the plot should only show one mode around the true causal effect <italic>β</italic>. In the incorrect reverse direction - when the true outcome is treated as the risk factor and the true risk factor is treated as the outcome - the plot of the robust profile likelihood will have two modes, one around 0, <bold>representing the variants directly related to the true outcome</bold>, and one around 1/<italic>β</italic>, <bold>representing the variants indirectly related to the true outcome through the true risk factor</bold>.</p>
</sec>
<sec id="sec006">
<title>Weak genetic instruments: A curse or a blessing?</title>
<p>Besides the assumption of no-horizontal-pleiotropy, for a SNP to be a valid genetic instrument, it needs to have a non-zero association with the risk factor of interest. In most MR pipelines, SNPs are selected as instruments only when their p-values are below 10<sup>−8</sup>, which is required to guarantee a low family-wise error rate (FWER) for GWAS data. Using such a stringent threshold also helps to avoid weak instrument bias [<xref ref-type="bibr" rid="pgen.1009575.ref031">31</xref>], where measurement errors in <inline-formula id="pgen.1009575.e017"><alternatives><graphic id="pgen.1009575.e017g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009575.e017" xlink:type="simple"/><mml:math display="inline" id="M17"><mml:msub><mml:mover accent="true"><mml:mi>γ</mml:mi> <mml:mo>^</mml:mo></mml:mover> <mml:mrow><mml:mi>j</mml:mi> <mml:mi>k</mml:mi></mml:mrow></mml:msub></mml:math></alternatives></inline-formula> are not ignorable and lead to bias in <inline-formula id="pgen.1009575.e018"><alternatives><graphic id="pgen.1009575.e018g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009575.e018" xlink:type="simple"/><mml:math display="inline" id="M18"><mml:mover accent="true"><mml:mi>β</mml:mi> <mml:mo>^</mml:mo></mml:mover></mml:math></alternatives></inline-formula>. However, such a stringent selection threshold may result in very few, or even no instruments being selected with under-powered GWAS, and may still not be adequate to avoid weak instrument bias. Further, when our goal is to jointly model the effects of multiple risk factors (the setting where <bold><italic>X</italic></bold> as a vector), it is unrealistic to assume that all selected SNPs have strong effects on every risk factor. In addition, the high polygenecity of complex traits indicates that the weak instruments far outnumbers strong instruments, and collectively, they may substantially improve the estimation accuracy.</p>
<p>In GRAPPLE, we use a flexible p-value threshold, which can be either as stringent as 10<sup>−8</sup> or as relaxed as 10<sup>−2</sup>, for instrument selection. Based on the profile likelihood framework of MR-RAPS [<xref ref-type="bibr" rid="pgen.1009575.ref010">10</xref>], GRAPPLE can provide valid inference for <inline-formula id="pgen.1009575.e019"><alternatives><graphic id="pgen.1009575.e019g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009575.e019" xlink:type="simple"/><mml:math display="inline" id="M19"><mml:mover accent="true"><mml:mi>β</mml:mi> <mml:mo>^</mml:mo></mml:mover></mml:math></alternatives></inline-formula> that avoids weak instrument bias for multiple risk factors even when the p-value threshold is as large as 10<sup>−2</sup>. This flexible p-value threshold is beneficial for several reasons. First, including moderate and weak instruments may increase power, especially for under-powered GWAS. Second, for MR with multiple risk factors where it is inevitable to include SNPs that have weak associations with some of the risk factors, we can obtain much more accurate causal effect estimations than methods that can only deal with jointly strong SNPs. More importantly, we can investigate the stability of the estimates across a series of p-value thresholds and get a more complete picture of the underlying horizontal pleiotropy. In practice, we suggest researchers to vary the selection p-value thresholds from a stringent one (say 10<sup>−8</sup>) to a relaxed one (say 10<sup>−2</sup>), both in the detection of multiple modes and in estimating causal effects.</p>
</sec>
<sec id="sec007">
<title>The three-sample design to guard against instrument selection bias</title>
<p>The current two-sample design of MR uses one GWAS data for the risk factor and one for the disease. The selection of genetic instruments is performed with p-values reported in the GWAS data for the risk factor. However, selecting instruments from GWAS summary statistics can introduce bias, which is commonly referred to as the “winner’s curse”. Conditional on being selected, the magnitude of <inline-formula id="pgen.1009575.e020"><alternatives><graphic id="pgen.1009575.e020g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009575.e020" xlink:type="simple"/><mml:math display="inline" id="M20"><mml:msub><mml:mover accent="true"><mml:mi>γ</mml:mi> <mml:mo>^</mml:mo></mml:mover> <mml:mrow><mml:mi>j</mml:mi> <mml:mi>k</mml:mi></mml:mrow></mml:msub></mml:math></alternatives></inline-formula> is generally larger than <italic>γ</italic><sub><italic>jk</italic></sub> and introduces bias to the estimation of <bold><italic>β</italic></bold>. When <italic>K</italic> = 1 where there is only one risk factor, the estimate will be biased towards 0, but there is no guarantee on the direction of the bias when <italic>K</italic> &gt; 1. Among practitioners, a common belief is that the selection bias is negligible when only the strongly associated SNPs are selected as instruments.</p>
<p>However, this rule of thumb may not hold even when we only use that are genome-wide significant (p-value ≤10<sup>−8</sup>) (<xref ref-type="supplementary-material" rid="pgen.1009575.s001">S1(a) Fig</xref>). Thus, we strongly advocate using a three-sample GWAS summary statistics design (<xref ref-type="fig" rid="pgen.1009575.g001">Fig 1d</xref>). To avoid the selection bias, selection of genetic instruments is done on another GWAS dataset for the risk factor, whose cohort has no overlapping individuals with both the risk factor and disease cohorts. In addition, to simplify calculation and avoid bias due to different LD structure in heterogeneous populations, we use LD clumping [<xref ref-type="bibr" rid="pgen.1009575.ref032">32</xref>] to select independent SNPs in GRAPPLE (see <xref ref-type="sec" rid="sec015">Materials and methods</xref>). The three-sample design will also avoid possible selection bias introduced during clumping.</p>
<p>Summarizing the above points, a complete diagram of the GRAPPLE workflow is shown in <xref ref-type="fig" rid="pgen.1009575.g001">Fig 1d</xref>. A researcher may start with a single target risk factor of interest. The shape of the robust profile likelihood provides information on possible pleiotropic pathways. If only a single mode is detected, one can use GRAPPLE for the target risk factor. This is equivalent to using the original MR-RAPS. If multiple modes are detected, the researcher needs to seriously consider how to adjust for pleiotropic pathways. Researchers can use the marker SNP/gene/trait information that GRAPPLE provides to investigate each mode, decide on which confounding risk factors to adjust for, and collect extra GWAS data for them. GRAPPLE can then be used to jointly estimate the causal effects of the original and the additional risk factors.</p>
</sec>
</sec>
<sec id="sec008">
<title>Assessment of GRAPPLE with real studies</title>
<sec id="sec009">
<title>Combine weak and strong genetic instruments under no pleiotropy</title>
<p>We first examine whether GRAPPLE provides reliable statistical inference using instruments with different strength under an artificial setting with real GWAS summary statistics. In this setting, we make the “artificial risk factor” <italic>X</italic> and the “artificial disease” <italic>Y</italic> be the same trait from two non-overlapping cohorts, thus <italic>γ</italic><sub><italic>j</italic></sub> = Γ<sub><italic>j</italic></sub> while <inline-formula id="pgen.1009575.e021"><alternatives><graphic id="pgen.1009575.e021g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009575.e021" xlink:type="simple"/><mml:math display="inline" id="M21"><mml:mrow><mml:msub><mml:mover accent="true"><mml:mi>γ</mml:mi> <mml:mo>^</mml:mo></mml:mover> <mml:mi>j</mml:mi></mml:msub> <mml:mo>≠</mml:mo> <mml:msub><mml:mover accent="true"><mml:mo>Γ</mml:mo> <mml:mo>^</mml:mo></mml:mover> <mml:mi>j</mml:mi></mml:msub></mml:mrow></mml:math></alternatives></inline-formula> for any SNP <italic>j</italic>. Though the structural equation describing the causal effect of <italic>X</italic> on <italic>Y</italic> is not well defined., the linear relationship model (<xref ref-type="disp-formula" rid="pgen.1009575.e006">2</xref>) from which we estimate <italic>β</italic> still holds with <italic>β</italic> = 1 and <italic>α</italic><sub><italic>j</italic></sub> = 0. In other words, we are not estimating a meaningful “casual” effect, but are in a special case where the true <italic>β</italic> is known. This setup can be used to verify the validity of MR methods under no pleiotropy.</p>
<p>Specifically, we consider three traits: Body mass index (BMI), Type II diabetes (T2D) and height from the GIANT and DIAGRAM consortia where sex-specific GWAS data are available [<xref ref-type="bibr" rid="pgen.1009575.ref033">33</xref>–<xref ref-type="bibr" rid="pgen.1009575.ref035">35</xref>]. The female cohort is used to get <inline-formula id="pgen.1009575.e022"><alternatives><graphic id="pgen.1009575.e022g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009575.e022" xlink:type="simple"/><mml:math display="inline" id="M22"><mml:msub><mml:mover accent="true"><mml:mi>γ</mml:mi> <mml:mo>^</mml:mo></mml:mover> <mml:mi>j</mml:mi></mml:msub></mml:math></alternatives></inline-formula> and the male cohort is used to get <inline-formula id="pgen.1009575.e023"><alternatives><graphic id="pgen.1009575.e023g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009575.e023" xlink:type="simple"/><mml:math display="inline" id="M23"><mml:msub><mml:mover accent="true"><mml:mo>Γ</mml:mo> <mml:mo>^</mml:mo></mml:mover> <mml:mi>j</mml:mi></mml:msub></mml:math></alternatives></inline-formula>. As a three-sample design, the UK Biobank data for corresponding traits are used for SNP selection. If we assume that all selected instruments have no gender-specific association with the traits, the true <italic>β</italic> would equal 1. For benchmarking, we compare the performance of GRAPPLE with CAUSE [<xref ref-type="bibr" rid="pgen.1009575.ref015">15</xref>] and three other widely adopted MR methods: inverse-variance weighted (IVW) [<xref ref-type="bibr" rid="pgen.1009575.ref005">5</xref>], MR-Egger [<xref ref-type="bibr" rid="pgen.1009575.ref006">6</xref>] and weighted median [<xref ref-type="bibr" rid="pgen.1009575.ref007">7</xref>] with the same three-sample design.</p>
<p>We compare different p-value thresholds for instrument selection, ranging from a stringent threshold of 10<sup>−8</sup> to a relaxed threshold of 10<sup>−2</sup> (<xref ref-type="fig" rid="pgen.1009575.g002">Fig 2a</xref>). GRAPPLE provides roughly unbiased estimates of <italic>β</italic> no matter which threshold is used, showing that it does not suffer from weak instrument bias. Surprisingly, the other MR methods are biased even with a stringent p-value threshold.</p>
<fig id="pgen.1009575.g002" position="float">
<object-id pub-id-type="doi">10.1371/journal.pgen.1009575.g002</object-id>
<label>Fig 2</label>
<caption>
<title>Performance evaluation.</title>
<p><bold>a</bold>, Estimation of <italic>β</italic> across selection p-value thresholds under no pleiotropy. Error bars show 95% Confidence intervals and the numbers are the number of independent SNPs obtained at each threshold. <bold>b</bold>, Estimation of <italic>β</italic> across three non-overlapping categories of SNPs: “strong”, “moderate” and “weak”. The numbers are the number of SNPs in each category. <bold>c</bold>, Identifying causal directions by multi-modality with MR reversely performed. The selection p-value threshold is kept at 10<sup>−4</sup>. <bold>d</bold>, three modes detected in the profile likelihood with selection p-value threshold 10<sup>−4</sup> for CRP on CAD. Marker genes and GWAS traits (in parenthesis) are shown for each mode. <bold>e</bold>, estimation of the CRP effect <italic>β</italic> at different p-value selection threshold with each method. The numbers are the estimated <inline-formula id="pgen.1009575.e024"><alternatives><graphic id="pgen.1009575.e024g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009575.e024" xlink:type="simple"/><mml:math display="inline" id="M24"><mml:mover accent="true"><mml:mi>β</mml:mi> <mml:mo>^</mml:mo></mml:mover></mml:math></alternatives></inline-formula>, with * indicating p-value below 0.05 and ** indicating p-value below 0.01.</p>
</caption>
<graphic mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pgen.1009575.g002" xlink:type="simple"/>
</fig>
<p>Notice that for T2D, the confidence intervals of GRAPPLE do get narrower with increasing p-value thresholds (<xref ref-type="fig" rid="pgen.1009575.g002">Fig 2a</xref>), showing the potential power gain of including weak instruments in less powerful GWAS studies. In addition, we simulate synthetic GWAS summary statistics of the risk factor and disease (see <xref ref-type="supplementary-material" rid="pgen.1009575.s007">S1 Text</xref> for details) and confirm that the estimated <italic>β</italic> indeed gets more accurate with the inclusion of weakly associated SNPs (<xref ref-type="supplementary-material" rid="pgen.1009575.s002">S2(a) Fig</xref>). In the simulations, we also use GRAPPLE to adjust for measured confounding risk factors and compare the performance with MVMR [<xref ref-type="bibr" rid="pgen.1009575.ref036">36</xref>], a commonly used multivariable MR method. As discussed earlier, in multivariable MR, the inclusion of SNPs that are weakly associated with at least one risk factors is inevitable. As GRAPPLE does not suffer from weak instrument bias, we see that it provides accurate estimates of the causal effects as well as reliable confidence intervals with both stringent and mild p-value thresholds (<xref ref-type="supplementary-material" rid="pgen.1009575.s003">S3</xref>–<xref ref-type="supplementary-material" rid="pgen.1009575.s005">S5</xref> Figs).</p>
<p>Finally, we demonstrate that to avoid bias, the three-sample design is necessary no matter which MR method is used. As shown in <xref ref-type="supplementary-material" rid="pgen.1009575.s001">S1(a) Fig</xref>, the two-sample design where we use the same cohort of the risk factor for selection can result in biased casual effects estimation, and the bias occurs with most MR methods even when we only select the strongly associated SNPs.</p>
</sec>
<sec id="sec010">
<title>Weak SNPs provide reliable causal estimates under pleiotropy</title>
<p>Next, we examine whether or not the weak instruments are more vulnerable to pleiotropy, which can be a concern for including the weak SNPs. We compare four risk factor and disease pairs that cover eight different complex traits, including the effect of BMI on T2D, low-density cholesterol concentrations (LDL-C) on coronary artery disease (CAD), height on smoking, and systolic blood pressure (SBP) on stroke (<xref ref-type="fig" rid="pgen.1009575.g002">Fig 2b</xref>). The GWAS summary data are collected from the original study repositories [<xref ref-type="bibr" rid="pgen.1009575.ref037">37</xref>–<xref ref-type="bibr" rid="pgen.1009575.ref042">42</xref>].</p>
<p>We test whether independent sets of strongly and weakly associated SNPs can provide consistent estimates of the causal effects of the risk factors. SNPs passing the p-value threshold 10<sup>−2</sup> in the cohort for selection are divided into three non-overlapping groups after LD clumping: “strong” (<italic>p</italic><sub><italic>j</italic></sub> ≤ 10<sup>−8</sup>), “moderate” (10<sup>−8</sup> &lt; <italic>p</italic><sub><italic>j</italic></sub> ≤ 10<sup>−5</sup>), and “weak” (10<sup>−5</sup> &lt; <italic>p</italic><sub><italic>j</italic></sub> ≤ 10<sup>−2</sup>). The SNPs across groups are used separately to obtain group-specific estimates of the causal effect <italic>β</italic>. We observe that for all the four pairs, the estimates <inline-formula id="pgen.1009575.e025"><alternatives><graphic id="pgen.1009575.e025g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009575.e025" xlink:type="simple"/><mml:math display="inline" id="M25"><mml:mover accent="true"><mml:mi>β</mml:mi> <mml:mo>^</mml:mo></mml:mover></mml:math></alternatives></inline-formula> are stable across groups (<xref ref-type="fig" rid="pgen.1009575.g002">Fig 2b</xref>). Though the “weaker” SNPs provide estimates with more uncertainty due to limited power, the estimates are consistent with those from the “strong” group. Other MR methods also show some level of consistency in estimating <italic>β</italic> across different sets of instruments, but perform less well due to weak instrument bias (<xref ref-type="supplementary-material" rid="pgen.1009575.s001">S1(b) Fig</xref>). To conclude, in the analysis of these four pairs of traits, we do not see any evidence that weakly associated SNPs provide more biased estimates than strong instruments due to horizontal pleiotropy. In contrast, as with the strong instruments, the weakly associated SNPs may also provide useful information to infer the causal effects of the risk factors.</p>
</sec>
<sec id="sec011">
<title>Identify direction of causality for known causal relationships</title>
<p>We also examine the performance of GRAPPLE in identifying the causal direction with the shape of the profile likelihood. For the causal direction, we focus on the two pairs of traits with known causal relationship: BMI on T2D, and LDL-C on CAD. We switch the roles of the risk factor and disease to see if the correct direction can be revealed. Specifically, we treat T2D and CAD as the “risk factor”, and BMI and LDL-C as the corresponding “disease” (<xref ref-type="fig" rid="pgen.1009575.g002">Fig 2c</xref>). For T2D, the cohort for the other gender is used for SNP selection and for CAD, the risk factor cohort used is from [<xref ref-type="bibr" rid="pgen.1009575.ref043">43</xref>] and the selection p-values are from [<xref ref-type="bibr" rid="pgen.1009575.ref044">44</xref>]. As expected, we see that when the roles of the risk factor and disease are reversed, the robust profile likelihood shows a main mode at 0, and a weaker mode around <inline-formula id="pgen.1009575.e026"><alternatives><graphic id="pgen.1009575.e026g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009575.e026" xlink:type="simple"/><mml:math display="inline" id="M26"><mml:mrow><mml:mn>1</mml:mn> <mml:mo>/</mml:mo> <mml:mover accent="true"><mml:mi>β</mml:mi> <mml:mo>^</mml:mo></mml:mover></mml:mrow></mml:math></alternatives></inline-formula>.</p>
</sec>
<sec id="sec012">
<title>Detect multiple modes to identify pleiotropic pathways</title>
<p>Finally, we test the ability of GRAPPLE to identify multiple pleiotropic pathways with the analysis of the C-reactive protein (CRP) effect on CAD. C-reactive protein has been found to be strongly associated with the risk of heart disease while many SNPs that are associated with the C-reactive protein also seem to have pleiotropic effect on lipid traits [<xref ref-type="bibr" rid="pgen.1009575.ref045">45</xref>]. Previous MR analyses only included SNPs that are near the <italic>CRP</italic> gene to guarantee a free-of-pleiotropy analysis [<xref ref-type="bibr" rid="pgen.1009575.ref046">46</xref>, <xref ref-type="bibr" rid="pgen.1009575.ref047">47</xref>] and found that CRP has no causal effect on CAD. Now, instead of only using SNPs near the CRP gene, by using associated SNPs across the whole genome that are known to involve pleiotropy pathways, can GRAPPLE identify the existence of these pathways and still obtain the correct estimate of the C-reactive protein effect?</p>
<p>CRP GWAS data from [<xref ref-type="bibr" rid="pgen.1009575.ref048">48</xref>] are used for selection and the data from [<xref ref-type="bibr" rid="pgen.1009575.ref049">49</xref>] using a larger cohort is used for getting <inline-formula id="pgen.1009575.e027"><alternatives><graphic id="pgen.1009575.e027g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009575.e027" xlink:type="simple"/><mml:math display="inline" id="M27"><mml:msub><mml:mover accent="true"><mml:mi>γ</mml:mi> <mml:mo>^</mml:mo></mml:mover> <mml:mi>j</mml:mi></mml:msub></mml:math></alternatives></inline-formula>. Similar to a multi-modality pattern already reported in [<xref ref-type="bibr" rid="pgen.1009575.ref011">11</xref>], our robust profile likelihood shows a pattern of three modes, indicating the existence of at least three different pathways (<xref ref-type="fig" rid="pgen.1009575.g002">Fig 2d</xref>). One mode is negative, one is positive and the third is around zero. The negative mode involves a few marker genes including <italic>HNF1A</italic> and <italic>PVRL2</italic>, with a marker trait LDL-C. The positive mode has marker traits pulmonary function and the C-reactive protein, and the few markers genes (<italic>IL6R</italic>, <italic>ARHGAP10</italic>, <italic>BCL7B</italic>, <italic>PABPC4</italic>) are also involved in immune response and lung cancer progression [<xref ref-type="bibr" rid="pgen.1009575.ref050">50</xref>, <xref ref-type="bibr" rid="pgen.1009575.ref051">51</xref>]. The mode at 0 has marker genes <italic>CRP</italic> and <italic>LEPR</italic>, and only one marker trait, C-reactive protein.</p>
<p>We compare across 3 p-value thresholds (10<sup>−8</sup>, 10<sup>−5</sup>, 10<sup>−3</sup>) and check how the existence of multiple pathways affects causal estimates of the effect of C-reactive protein in MR methods using SNPs across the genome. Including C-reactive protein as the only risk factor, all bench-marking methods give a negative estimate of the CRP effect, which is possibly driven by the bias from an LDL-C induced pleiotropic pathway (<xref ref-type="fig" rid="pgen.1009575.g002">Fig 2e</xref>). MR-RAPS is the estimation method used in GRAPPLE if we only use one risk factor, and the three other bench-marking methods give incorrect inference of the CRP effect with a p-value of <italic>β</italic> below 0.01 for at least one SNP selection threshold (notice that the weak instrument bias is towards 0 as shown in <xref ref-type="fig" rid="pgen.1009575.g002">Fig 2a</xref>, thus the significance at p-value threshold 10<sup>−3</sup> for MR-Egger and IVW cannot be explained by weak instrument bias). In contrast, after using two risk factors: C-reactive protein and LDL-C, where LDL-C is an identified confounding risk factor from the marker SNPs in <xref ref-type="fig" rid="pgen.1009575.g002">Fig 2d</xref>, the estimates of CRP effect are much closer to 0 compared with that without including LDL-C. This analysis illustrates how GRAPPLE can detect pleiotropic pathways, provide information to identify the confounding risk factors to adjust for, and obtain correct inference after adjusting for these risk factors.</p>
<p>As a complement to the analysis on CRP, we also use simulations (<xref ref-type="supplementary-material" rid="pgen.1009575.s007">S1 Text</xref>) and generate synthetic disease traits to evaluate the precision and recall in the detection of multiple modes and marker SNPs when there are pleiotropic pathways. We consider scenarios with one or two pleiotropic pathways caused by hidden confounding risk factors, and vary the genetic correlations between these hidden factors and the target risk factor. A higher genetic correlation corresponds to a larger proportion of SNPs that have a correlated pleiotropic effect. We observe that the detection of multiple modes is most powerful when the genetic correlation is neither too large nor too small (<xref ref-type="supplementary-material" rid="pgen.1009575.s002">S2(b) Fig</xref>). If the genetic correlation is too high, then there are not enough SNPs to contribute to the mode of the true causal effect, while if the genetic correlation is too low there will be too few SNPs to contribute to the pleiotropic modes. Including weaker SNPs will decrease the sensitivity in mode detection but can increase the recall of true marker SNPs. In our simulations, we also observe that all univariable MR methods can perform poorly in estimating the true causal effect in the presence of pleiotropic pathways (<xref ref-type="supplementary-material" rid="pgen.1009575.s003">S3</xref>–<xref ref-type="supplementary-material" rid="pgen.1009575.s005">S5</xref> Figs).</p>
</sec>
</sec>
<sec id="sec013">
<title>A causal landscape from 5 risk factors to 25 common diseases</title>
<p>Finally, we apply GRAPPLE to interrogate the causal effects of 5 risk factors on 25 complex diseases. The five risk factors are three plasma lipid traits: LDL-C, high-density lipoprotein cholesterol (HDL-C), triglycerides (TG), BMI and SBP. The diseases include heart disease, Type II diabetes, kidney disease, common psychiatric disorders, inflammatory disease and cancer (<xref ref-type="fig" rid="pgen.1009575.g003">Fig 3a</xref>). The GWAS summary statistics are from studies [<xref ref-type="bibr" rid="pgen.1009575.ref035">35</xref>, <xref ref-type="bibr" rid="pgen.1009575.ref037">37</xref>, <xref ref-type="bibr" rid="pgen.1009575.ref038">38</xref>, <xref ref-type="bibr" rid="pgen.1009575.ref041">41</xref>, <xref ref-type="bibr" rid="pgen.1009575.ref042">42</xref>, <xref ref-type="bibr" rid="pgen.1009575.ref052">52</xref>–<xref ref-type="bibr" rid="pgen.1009575.ref070">70</xref>] and downloaded from the GWAS catalog [<xref ref-type="bibr" rid="pgen.1009575.ref071">71</xref>]. For each pair of the risk factor and disease, we compare across p-value thresholds from 10<sup>−8</sup> to 10<sup>−2</sup>. As a summary of the results, <xref ref-type="fig" rid="pgen.1009575.g003">Fig 3a</xref> illustrates the average number of modes detected across the p-value thresholds for SNP selection (for modes at each p-value threshold, see <xref ref-type="supplementary-material" rid="pgen.1009575.s006">S6 Fig</xref>). Besides the number of modes, <xref ref-type="fig" rid="pgen.1009575.g003">Fig 3a</xref> also shows the p-values for each risk factor when GRAPPLE is performed with only the single risk factor (see also <xref ref-type="supplementary-material" rid="pgen.1009575.s006">S6 Fig</xref> and <xref ref-type="sec" rid="sec015">Materials and methods</xref>). These p-values are not valid when there are pleiotropic pathways.</p>
<fig id="pgen.1009575.g003" position="float">
<object-id pub-id-type="doi">10.1371/journal.pgen.1009575.g003</object-id>
<label>Fig 3</label>
<caption>
<title>Screening with GRAPPLE.</title>
<p><bold>a</bold>, Landscape of pleiotropic pathways on 25 diseases. The colors show average number of modes across 7 different selection p-value thresholds. The “+” sign shows a positive estimated effect and “−” indicates a negative estimated effect, with the p-value for each cell a combined p-value (see <xref ref-type="sec" rid="sec015">Materials and methods</xref>) of replicability across 7 thresholds using the single risk factor. These p-values are not multiple-testing adjusted across pairs. <bold>b</bold>, Multi-modality of the profile likelihood for effect of HDL-C on CAD at 2 different selection p-value threshold. Vertical bars are positions of marker SNPs (<inline-formula id="pgen.1009575.e029"><alternatives><graphic id="pgen.1009575.e029g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009575.e029" xlink:type="simple"/><mml:math display="inline" id="M29"><mml:mrow><mml:msub><mml:mover accent="true"><mml:mo>Γ</mml:mo> <mml:mo>^</mml:mo></mml:mover> <mml:mi>j</mml:mi></mml:msub> <mml:mo>/</mml:mo> <mml:msub><mml:mover accent="true"><mml:mi>γ</mml:mi> <mml:mo>^</mml:mo></mml:mover> <mml:mi>j</mml:mi></mml:msub></mml:mrow></mml:math></alternatives></inline-formula>), labeled by their mapped genes (only unique gene names are shown). <bold>c</bold>, Multivariable MR for the effect of 5 risk factors on CAD. <bold>d</bold>, Multivariable MR for the effect of 4 risk factors on CAD. The Error bars are 95% confidence intervals.</p>
</caption>
<graphic mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pgen.1009575.g003" xlink:type="simple"/>
</fig>
<p>
<xref ref-type="fig" rid="pgen.1009575.g003">Fig 3a</xref> shows that multi-modality can be detected in many risk factor and disease pairs. Multi-modality is most easily seen using the stringent p-value threshold 10<sup>−8</sup> (<xref ref-type="supplementary-material" rid="pgen.1009575.s006">S6 Fig</xref>). However, we find that some modes are contributed by a single SNP thus is more likely an outlier than a pathway. For instance, the effect of stroke on LDL-C shows two modes when the p-value threshold is 10<sup>−8</sup> or 10<sup>−7</sup> (one mode around −2.3 and another mode near 0.08). However, the negative mode only has one marker SNP (rs3184504) which has been found strongly associated with hundreds of different traits according to GWAS Catalog while the other mode has hundreds or marker genes. After removing the SNP rs3184504, the mode disappears. Such a mode also disappears when we increase the p-value threshold to include more SNPs as instruments. Thus, the average number of modes serves as a strength of evidence for the existence of multiple pleiotropic pathways. When a risk factor and disease pair show multi-modality, the p-values from GRAPPLE using the single target risk factor are no longer valid, and the researchers need further investigations of the modes.</p>
<p>First, consider the well-studied, often-debated relationship between CAD and the lipid traits. All five risk factors show highly significant effects, though multi-modality is detected in HDL-C and SBP. In our results for HDL-C, with different p-value thresholds, three modes in total can show up, two being negative and one positive, indicating that the pathways from HDL-C to CAD is complicated (<xref ref-type="fig" rid="pgen.1009575.g003">Fig 3b</xref>). <xref ref-type="fig" rid="pgen.1009575.g003">Fig 3b</xref> shows that one negative mode is contributed by SNPs near genes <italic>LPL</italic> and <italic>BUD13</italic>, which are strongly associated with triglycerides. Another positive mode is contributed by SNPs near genes <italic>ALDH1A2</italic> and <italic>PSKH1</italic>, which is related to respiratory diseases [<xref ref-type="bibr" rid="pgen.1009575.ref072">72</xref>]. The markers of the other negative mode are mapped to genes including <italic>LIPG</italic> and <italic>CETP</italic>.</p>
<p>Since the effects of the lipid traits are generally complicated, we combine all 5 risk factors and run an MR jointly with GRAPPLE (<xref ref-type="fig" rid="pgen.1009575.g003">Fig 3c</xref>) with different p-value thresholds. After adjusting for other risk factors, the two most prominent risk factors for heart disease are LDL-C and SBP, while the protective effect of HDL-C stays negligible, as does the risk conferred by TG. So these results show that HDL-C as a single measurement does not seem to have a protective effect on heart disease with multiple complex pathways linking HDL-C and heart disease. Researchers have suggested analyzing different subgroups of HDL-C as smaller particles tend to have a stronger protective effect [<xref ref-type="bibr" rid="pgen.1009575.ref073">73</xref>].</p>
<p>Lipids are also involved in a number of biological functions including energy storage, signaling, and acting as structural components of cell membranes and have been reported to be associated with various diseases [<xref ref-type="bibr" rid="pgen.1009575.ref074">74</xref>–<xref ref-type="bibr" rid="pgen.1009575.ref077">77</xref>]. Besides CAD, another disease that most likely involves the lipid traits is the Type II diabetes (<xref ref-type="fig" rid="pgen.1009575.g003">Fig 3a</xref>). T2D is associated with dyslipidemia (i.e., higher concentrations of TG and LDL-C, and lower concentrations of HDL-C), though the causal relationship is still unclear [<xref ref-type="bibr" rid="pgen.1009575.ref078">78</xref>]. In the meantime, evidence has emerged that LDL-C reduction with statin therapy results in a modest increase in risk of T2D [<xref ref-type="bibr" rid="pgen.1009575.ref074">74</xref>]. For the MR analyzing each risk factor alone, we see potential protective effects of LDL-C and HDL-C on T2D but also multi-modality patterns. Two modes show up in the profile likelihood from HDL-C to T2D where one negative mode has a marker gene <italic>LPL</italic> and a mode near 0 with marker genes <italic>CETP</italic> and <italic>AC012181.1</italic>. Thus, we include all 3 lipid traits, along with BMI and run a joint model for these 4 risk factors using GRAPPLE (<xref ref-type="fig" rid="pgen.1009575.g003">Fig 3d</xref>). Our result indicates a mild protective effect of HDL-C and LDL-C on T2D, and close to the null but imprecise estimate for TG.</p>
</sec>
</sec>
<sec id="sec014" sec-type="conclusions">
<title>Discussion</title>
<p>We propose a comprehensive framework, GRAPPLE, that utilizes both strongly and weakly associated SNPs to understand the causal relationship between complex traits. GRAPPLE is robust to pervasive pleiotropy and can identify multiple pleiotropic pathways. The multivariable MR performed by GRAPPLE can adjust for known confounding risk factors.</p>
<p>GRAPPLE incorporates several improvements over existing MR methods. It avoids weak instrument bias by dealing with measurement errors of the SNP associations on the risk factors with profile likelihood. Our likelihood from (<xref ref-type="disp-formula" rid="pgen.1009575.e045">9</xref>) is similar to the likelihood used in [<xref ref-type="bibr" rid="pgen.1009575.ref079">79</xref>], but our likelihood allows modelling pervasive pleiotropy as long as the InSIDE assumption holds for most SNPs. The multi-modality visualization shares similarities with [<xref ref-type="bibr" rid="pgen.1009575.ref008">8</xref>], which estimates the causal effect by the global mode, but we provide a more comprehensive analysis to identify multiple pleiotropic pathways by the local modes. Our causality direction identification is related to bidirectional MR where they used the assumption that if we reverse the role of risk factor and disease, the estimated causal effect is likely to be 0. We use this idea in a more principled way and can avoid bias when SNPs affecting the disease through the target risk factors are also selected as variants for the disease in the reverse MR. Finally, as the intercept term in MR-Egger is not invariant to the arbitrary assignment of effect alleles for each SNP, indicating a deficiency of the method, GRAPPLE does not include any intercept term.</p>
<p>GRAPPLE needs a separate GWAS cohort of the exposure for SNP selection, which is necessary for valid inference with weakly associated SNPs. Actually, as shown in <xref ref-type="supplementary-material" rid="pgen.1009575.s001">S1(a) Fig</xref>, the three-sample design is needed for other MR methods as well to avoid selection bias. In some domains, it is hard to obtain multiple good-quality public GWAS summary statistics with non-overlapping cohorts. We call for the release of stage-specific or study-specific GWAS data summary statistics to the public in the future.</p>
<p>In GRAPPLE, we still require using a p-value threshold, though it can be as relaxed as 10<sup>−2</sup>, instead of requiring no p-value threshold at all. There are two main reasons for this requirement. One consideration is to increase power, as including too many SNPs with <italic>γ</italic><sub><italic>j</italic></sub> = 0 or extremely small would instead increase the variance of <inline-formula id="pgen.1009575.e030"><alternatives><graphic id="pgen.1009575.e030g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009575.e030" xlink:type="simple"/><mml:math display="inline" id="M30"><mml:mover accent="true"><mml:mi>β</mml:mi> <mml:mo>^</mml:mo></mml:mover></mml:math></alternatives></inline-formula> [<xref ref-type="bibr" rid="pgen.1009575.ref010">10</xref>, <xref ref-type="bibr" rid="pgen.1009575.ref080">80</xref>]. Another consideration is that we would not want unmeasured risk factors that are unassociated (or very weakly associated) with target risk factors to bring in large pleiotropic effects with SNPs that mainly affect these unmeasured risk factors. The chance of including these SNPs would be much lower by requiring a relaxed p-value threshold.</p>
<p>Finally, when discussing the causal effect of a risk factor, one implicit assumption we use is consistency, assuming that there is a clear and only one version of intervention that can be done on the risk factor. However, interventions on risk factors such as BMI are typically vague [<xref ref-type="bibr" rid="pgen.1009575.ref081">81</xref>]. For instance, there can be multiple ways to change weight, such as taking exercise, switching to different diet or conducting a surgery. It is common sense that these different interventions would have different effects on diseases, though they may change BMI by the same amount. However, the basic MR principle of gene-environment equivalence [<xref ref-type="bibr" rid="pgen.1009575.ref082">82</xref>] suggests that whilst there will be genetic mimics of increased physical activity and decreased calorie intake, there will be no such mimics for having surgery. Basic biological principles indicate which inferences can be sensibly made. For example, cholesterol has multiple functions in our bodies and is involved in multiple biological processes. Intervening in different biological processes to change the concentration of lipid traits may, in principle, have different effects on disease. However, for many LDL-C lowering drugs the direct genetic mimics produce effects as predicted by RCTs of these pharmaceutical agents [<xref ref-type="bibr" rid="pgen.1009575.ref083">83</xref>], demonstrating that gene-environment equivalence applies. We think that our causal inference using GRAPPLE, along with the markers we detect, would provide abundant information to deepen our understanding of the risk factors. However, one still needs to be careful when giving causal interpretations of the results. One recommendation in practice is to triangulate the results from MR with other sources of evidence [<xref ref-type="bibr" rid="pgen.1009575.ref084">84</xref>, <xref ref-type="bibr" rid="pgen.1009575.ref085">85</xref>].</p>
</sec>
<sec id="sec015" sec-type="materials|methods">
<title>Materials and methods</title>
<sec id="sec016">
<title>Model details</title>
<p>The structural <xref ref-type="disp-formula" rid="pgen.1009575.e001">Eq (1)</xref> where <bold><italic>X</italic></bold> = (<italic>X</italic><sub>1</sub>, <italic>X</italic><sub>2</sub>, ⋯, <italic>X</italic><sub><italic>K</italic></sub>) and <bold><italic>β</italic></bold> = (<italic>β</italic><sub>1</sub>, <italic>β</italic><sub>2</sub>, ⋯, <italic>β</italic><sub><italic>K</italic></sub>) describe how individual level data are generated. To link it with the GWAS summary statistics data, denote
<disp-formula id="pgen.1009575.e031"><alternatives><graphic id="pgen.1009575.e031g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009575.e031" xlink:type="simple"/><mml:math display="block" id="M31"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="right"><mml:mrow><mml:msub><mml:mi>γ</mml:mi> <mml:mrow><mml:mi>j</mml:mi> <mml:mi>k</mml:mi></mml:mrow></mml:msub> <mml:mo>=</mml:mo> <mml:msub><mml:mtext>argmin</mml:mtext> <mml:mi>γ</mml:mi></mml:msub> <mml:mtext>Var</mml:mtext> <mml:mo>[</mml:mo> <mml:msub><mml:mi>X</mml:mi> <mml:mi>k</mml:mi></mml:msub> <mml:mo>-</mml:mo> <mml:mi>γ</mml:mi> <mml:msub><mml:mi>Z</mml:mi> <mml:mi>j</mml:mi></mml:msub> <mml:mo>]</mml:mo></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives></disp-formula>
which is the true marginal association between a SNP <italic>Z</italic><sub><italic>j</italic></sub> and risk factor <italic>X</italic><sub><italic>k</italic></sub> and
<disp-formula id="pgen.1009575.e032"><alternatives><graphic id="pgen.1009575.e032g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009575.e032" xlink:type="simple"/><mml:math display="block" id="M32"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="right"><mml:mrow><mml:msub><mml:mi>α</mml:mi> <mml:mi>j</mml:mi></mml:msub> <mml:mo>=</mml:mo> <mml:msub><mml:mtext>argmin</mml:mtext> <mml:mi>α</mml:mi></mml:msub> <mml:mtext>Var</mml:mtext> <mml:mo>[</mml:mo> <mml:mi>f</mml:mi> <mml:mrow><mml:mo>(</mml:mo> <mml:mi mathvariant="bold-italic">U</mml:mi> <mml:mo>,</mml:mo> <mml:mi mathvariant="bold-italic">Z</mml:mi> <mml:mo>,</mml:mo> <mml:msub><mml:mi>E</mml:mi> <mml:mi>Y</mml:mi></mml:msub> <mml:mo>)</mml:mo></mml:mrow> <mml:mo>-</mml:mo> <mml:mi>α</mml:mi> <mml:msub><mml:mi>Z</mml:mi> <mml:mi>j</mml:mi></mml:msub> <mml:mo>]</mml:mo></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives></disp-formula>
which is the marginal association between <italic>Z</italic><sub><italic>j</italic></sub> and the causal effects of unmeasured risk factors on <italic>Y</italic>, i.e. the horizontal pleiotropic effect of <italic>Z</italic><sub><italic>j</italic></sub> on <italic>Y</italic> given <bold><italic>X</italic></bold>. Then we can rewrite the structural equations into the following linear models:
<disp-formula id="pgen.1009575.e033"><alternatives><graphic id="pgen.1009575.e033g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009575.e033" xlink:type="simple"/><mml:math display="block" id="M33"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="right"><mml:mrow><mml:msub><mml:mi>X</mml:mi> <mml:mi>k</mml:mi></mml:msub> <mml:mo>=</mml:mo> <mml:msub><mml:mi>γ</mml:mi> <mml:mrow><mml:mi>j</mml:mi> <mml:mi>k</mml:mi></mml:mrow></mml:msub> <mml:msub><mml:mi>Z</mml:mi> <mml:mi>j</mml:mi></mml:msub> <mml:mo>+</mml:mo> <mml:mo>[</mml:mo> <mml:msub><mml:mi>g</mml:mi> <mml:mi>k</mml:mi></mml:msub> <mml:mrow><mml:mo>(</mml:mo> <mml:mi mathvariant="bold-italic">U</mml:mi> <mml:mo>,</mml:mo> <mml:mi mathvariant="bold-italic">Z</mml:mi> <mml:mo>,</mml:mo> <mml:msub><mml:mi>E</mml:mi> <mml:msub><mml:mi>X</mml:mi> <mml:mi>k</mml:mi></mml:msub></mml:msub> <mml:mo>)</mml:mo></mml:mrow> <mml:mo>-</mml:mo> <mml:msub><mml:mi>γ</mml:mi> <mml:mrow><mml:mi>j</mml:mi> <mml:mi>k</mml:mi></mml:mrow></mml:msub> <mml:msub><mml:mi>Z</mml:mi> <mml:mi>j</mml:mi></mml:msub> <mml:mo>]</mml:mo> <mml:mo>=</mml:mo> <mml:msub><mml:mi>γ</mml:mi> <mml:mrow><mml:mi>j</mml:mi> <mml:mi>k</mml:mi></mml:mrow></mml:msub> <mml:msub><mml:mi>Z</mml:mi> <mml:mi>j</mml:mi></mml:msub> <mml:mo>+</mml:mo> <mml:msub><mml:mi>ϵ</mml:mi> <mml:mrow><mml:mi>j</mml:mi> <mml:mi>k</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives> <label>(5)</label></disp-formula> <disp-formula id="pgen.1009575.e034"><alternatives><graphic id="pgen.1009575.e034g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009575.e034" xlink:type="simple"/><mml:math display="block" id="M34"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="right"><mml:mrow><mml:mi>Y</mml:mi> <mml:mo>=</mml:mo> <mml:msup><mml:mi mathvariant="bold-italic">X</mml:mi> <mml:mi>T</mml:mi></mml:msup> <mml:mi mathvariant="bold-italic">β</mml:mi> <mml:mo>+</mml:mo> <mml:msub><mml:mi>α</mml:mi> <mml:mi>j</mml:mi></mml:msub> <mml:msub><mml:mi>Z</mml:mi> <mml:mi>j</mml:mi></mml:msub> <mml:mo>+</mml:mo> <mml:mo>[</mml:mo> <mml:mi>f</mml:mi> <mml:mrow><mml:mo>(</mml:mo> <mml:mi mathvariant="bold-italic">U</mml:mi> <mml:mo>,</mml:mo> <mml:mi mathvariant="bold-italic">Z</mml:mi> <mml:mo>,</mml:mo> <mml:msub><mml:mi>E</mml:mi> <mml:mi>Y</mml:mi></mml:msub> <mml:mo>)</mml:mo></mml:mrow> <mml:mo>-</mml:mo> <mml:msub><mml:mi>α</mml:mi> <mml:mi>j</mml:mi></mml:msub> <mml:msub><mml:mi>Z</mml:mi> <mml:mi>j</mml:mi></mml:msub> <mml:mo>]</mml:mo> <mml:mo>=</mml:mo> <mml:msup><mml:mi mathvariant="bold-italic">X</mml:mi> <mml:mi>T</mml:mi></mml:msup> <mml:mi mathvariant="bold-italic">β</mml:mi> <mml:mo>+</mml:mo> <mml:msub><mml:mi>α</mml:mi> <mml:mi>j</mml:mi></mml:msub> <mml:msub><mml:mi>Z</mml:mi> <mml:mi>j</mml:mi></mml:msub> <mml:mo>+</mml:mo> <mml:msub><mml:mover accent="true"><mml:mi>e</mml:mi> <mml:mo>˜</mml:mo></mml:mover> <mml:mi>j</mml:mi></mml:msub></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives> <label>(6)</label></disp-formula>
where corr(<italic>Z</italic><sub><italic>j</italic></sub>, <italic>ϵ</italic><sub><italic>jk</italic></sub>) = 0 for any <italic>k</italic> and <inline-formula id="pgen.1009575.e035"><alternatives><graphic id="pgen.1009575.e035g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009575.e035" xlink:type="simple"/><mml:math display="inline" id="M35"><mml:mrow><mml:mtext>corr</mml:mtext> <mml:mo>(</mml:mo> <mml:msub><mml:mi>Z</mml:mi> <mml:mi>j</mml:mi></mml:msub> <mml:mo>,</mml:mo> <mml:msub><mml:mover accent="true"><mml:mi>e</mml:mi> <mml:mo>˜</mml:mo></mml:mover> <mml:mi>j</mml:mi></mml:msub> <mml:mo>)</mml:mo> <mml:mo>=</mml:mo> <mml:mn>0</mml:mn></mml:mrow></mml:math></alternatives></inline-formula> is guaranteed by the definitions of <italic>γ</italic><sub><italic>jk</italic></sub> and <italic>α</italic><sub><italic>j</italic></sub>. By replacing <bold><italic>X</italic></bold> in (<xref ref-type="disp-formula" rid="pgen.1009575.e034">6</xref>) with (<xref ref-type="disp-formula" rid="pgen.1009575.e033">5</xref>), we get
<disp-formula id="pgen.1009575.e036"><alternatives><graphic id="pgen.1009575.e036g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009575.e036" xlink:type="simple"/><mml:math display="block" id="M36"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="right"><mml:mrow><mml:mi>Y</mml:mi> <mml:mo>=</mml:mo> <mml:mo>(</mml:mo> <mml:msubsup><mml:mi>γ</mml:mi> <mml:mi mathvariant="bold-italic">j</mml:mi> <mml:mi>T</mml:mi></mml:msubsup> <mml:mi mathvariant="bold-italic">β</mml:mi> <mml:mo>+</mml:mo> <mml:msub><mml:mi>α</mml:mi> <mml:mi>j</mml:mi></mml:msub> <mml:mo>)</mml:mo> <mml:msub><mml:mi>Z</mml:mi> <mml:mi>j</mml:mi></mml:msub> <mml:mo>+</mml:mo> <mml:msub><mml:mover accent="true"><mml:mi>e</mml:mi> <mml:mo>˜</mml:mo></mml:mover> <mml:mi>j</mml:mi></mml:msub> <mml:mo>+</mml:mo> <mml:munder><mml:mo>∑</mml:mo> <mml:mi>k</mml:mi></mml:munder> <mml:msub><mml:mi>β</mml:mi> <mml:mi>k</mml:mi></mml:msub> <mml:msub><mml:mi>ϵ</mml:mi> <mml:mrow><mml:mi>j</mml:mi> <mml:mi>k</mml:mi></mml:mrow></mml:msub> <mml:mo>=</mml:mo> <mml:msub><mml:mo>Γ</mml:mo> <mml:mi>j</mml:mi></mml:msub> <mml:msub><mml:mi>Z</mml:mi> <mml:mi>j</mml:mi></mml:msub> <mml:mo>+</mml:mo> <mml:msub><mml:mi>e</mml:mi> <mml:mi>j</mml:mi></mml:msub></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives></disp-formula>
where <inline-formula id="pgen.1009575.e037"><alternatives><graphic id="pgen.1009575.e037g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009575.e037" xlink:type="simple"/><mml:math display="inline" id="M37"><mml:mrow><mml:msub><mml:mo>Γ</mml:mo> <mml:mi>j</mml:mi></mml:msub> <mml:mo>=</mml:mo> <mml:msubsup><mml:mi>γ</mml:mi> <mml:mi mathvariant="bold-italic">j</mml:mi> <mml:mi>T</mml:mi></mml:msubsup> <mml:mi mathvariant="bold-italic">β</mml:mi> <mml:mo>+</mml:mo> <mml:msub><mml:mi>α</mml:mi> <mml:mi>j</mml:mi></mml:msub></mml:mrow></mml:math></alternatives></inline-formula> and <inline-formula id="pgen.1009575.e038"><alternatives><graphic id="pgen.1009575.e038g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009575.e038" xlink:type="simple"/><mml:math display="inline" id="M38"><mml:mrow><mml:msub><mml:mi>e</mml:mi> <mml:mi>j</mml:mi></mml:msub> <mml:mo>=</mml:mo> <mml:msub><mml:mover accent="true"><mml:mi>e</mml:mi> <mml:mo>˜</mml:mo></mml:mover> <mml:mi>j</mml:mi></mml:msub> <mml:mo>+</mml:mo> <mml:msub><mml:mo>∑</mml:mo> <mml:mi>k</mml:mi></mml:msub> <mml:msub><mml:mi>β</mml:mi> <mml:mi>k</mml:mi></mml:msub> <mml:msub><mml:mi>∊</mml:mi> <mml:mrow><mml:mi>j</mml:mi> <mml:mi>k</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:math></alternatives></inline-formula>. As Corr(<italic>Z</italic><sub><italic>j</italic></sub>, <italic>e</italic><sub><italic>j</italic></sub>) = 0, we conclude that Γ<sub><italic>j</italic></sub> also satisfies that
<disp-formula id="pgen.1009575.e039"><alternatives><graphic id="pgen.1009575.e039g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009575.e039" xlink:type="simple"/><mml:math display="block" id="M39"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="right"><mml:mrow><mml:msub><mml:mo>Γ</mml:mo> <mml:mi>j</mml:mi></mml:msub> <mml:mo>=</mml:mo> <mml:msub><mml:mtext>argmin</mml:mtext> <mml:mo>Γ</mml:mo></mml:msub> <mml:mtext>Var</mml:mtext> <mml:mo>[</mml:mo> <mml:mi>Y</mml:mi> <mml:mo>-</mml:mo> <mml:mo>Γ</mml:mo> <mml:msub><mml:mi>Z</mml:mi> <mml:mi>j</mml:mi></mml:msub> <mml:mo>]</mml:mo> <mml:mo>.</mml:mo></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives></disp-formula></p>
<p>Thus, parameters Γ<sub><italic>j</italic></sub> also represent true marginal associations between SNP <italic>Z</italic><sub><italic>j</italic></sub> and the disease trait. This is how we result in working with <xref ref-type="disp-formula" rid="pgen.1009575.e006">Eq (2)</xref>.</p>
<p>When the disease is a binary trait, the structural equation of <italic>Y</italic> changes to
<disp-formula id="pgen.1009575.e040"><alternatives><graphic id="pgen.1009575.e040g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009575.e040" xlink:type="simple"/><mml:math display="block" id="M40"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="right"><mml:mrow><mml:mtext>logit</mml:mtext> <mml:mo>[</mml:mo> <mml:mi>P</mml:mi> <mml:mo>(</mml:mo> <mml:mi>Y</mml:mi> <mml:mo>=</mml:mo> <mml:mn>1</mml:mn> <mml:mo>)</mml:mo> <mml:mo>]</mml:mo> <mml:mo>=</mml:mo> <mml:msup><mml:mi mathvariant="bold-italic">X</mml:mi> <mml:mi>T</mml:mi></mml:msup> <mml:mi mathvariant="bold-italic">β</mml:mi> <mml:mo>+</mml:mo> <mml:mi>f</mml:mi> <mml:mrow><mml:mo>(</mml:mo> <mml:mi mathvariant="bold-italic">U</mml:mi> <mml:mo>,</mml:mo> <mml:mi mathvariant="bold-italic">Z</mml:mi> <mml:mo>,</mml:mo> <mml:msub><mml:mi>E</mml:mi> <mml:mi>Y</mml:mi></mml:msub> <mml:mo>)</mml:mo></mml:mrow></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives> <label>(7)</label></disp-formula>
With the same argument, we have
<disp-formula id="pgen.1009575.e041"><alternatives><graphic id="pgen.1009575.e041g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009575.e041" xlink:type="simple"/><mml:math display="block" id="M41"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="right"><mml:mrow><mml:mtext>logit</mml:mtext> <mml:mo>[</mml:mo> <mml:mi>P</mml:mi> <mml:mo>(</mml:mo> <mml:mi>Y</mml:mi> <mml:mo>=</mml:mo> <mml:mn>1</mml:mn> <mml:mo>)</mml:mo> <mml:mo>]</mml:mo> <mml:mo>=</mml:mo> <mml:msub><mml:mo>Γ</mml:mo> <mml:mi>j</mml:mi></mml:msub> <mml:msub><mml:mi>Z</mml:mi> <mml:mi>j</mml:mi></mml:msub> <mml:mo>+</mml:mo> <mml:msub><mml:mi>e</mml:mi> <mml:mi>j</mml:mi></mml:msub></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives></disp-formula></p>
<p>If we further assume that for each genetic instrument <italic>j</italic>, <italic>Z</italic><sub><italic>j</italic></sub> is actually independent of <italic>e</italic><sub><italic>j</italic></sub> (instead of just being uncorrelated), then the odds ratio that is estimated from the marginal logistic regression will be approximately Γ<sub><italic>j</italic></sub>/<italic>c</italic> with a constant <italic>c</italic> &gt; 1 determined by the distribution of <italic>e</italic><sub><italic>j</italic></sub>. In other words, for binary disease outcomes, <xref ref-type="disp-formula" rid="pgen.1009575.e006">Eq (2)</xref> is still approximately correct with the <bold><italic>β</italic></bold> in (<xref ref-type="disp-formula" rid="pgen.1009575.e006">2</xref>) being a conservatively biased (by a ratio of 1/<italic>c</italic>) version of the <bold><italic>β</italic></bold> in (<xref ref-type="disp-formula" rid="pgen.1009575.e040">7</xref>) (for a detailed calculation, see A.1 of [<xref ref-type="bibr" rid="pgen.1009575.ref010">10</xref>]).</p>
</sec>
<sec id="sec017">
<title>GWAS summary statistics from overlapping cohorts</title>
<p>The GWAS estimated effect sizes (log odds ratios for binary traits) of SNP <italic>j</italic> are <inline-formula id="pgen.1009575.e042"><alternatives><graphic id="pgen.1009575.e042g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009575.e042" xlink:type="simple"/><mml:math display="inline" id="M42"><mml:msub><mml:mover accent="true"><mml:mo>Γ</mml:mo> <mml:mo>^</mml:mo></mml:mover> <mml:mi>j</mml:mi></mml:msub></mml:math></alternatives></inline-formula> for the disease and a length <italic>K</italic> vector <inline-formula id="pgen.1009575.e043"><alternatives><graphic id="pgen.1009575.e043g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009575.e043" xlink:type="simple"/><mml:math display="inline" id="M43"><mml:mover accent="true"><mml:msub><mml:mi>γ</mml:mi> <mml:mi>j</mml:mi></mml:msub> <mml:mo>^</mml:mo></mml:mover></mml:math></alternatives></inline-formula> for the risk factors. As shown in [<xref ref-type="bibr" rid="pgen.1009575.ref086">86</xref>] and derived in <xref ref-type="supplementary-material" rid="pgen.1009575.s008">S2 Text</xref>, for any risk factor <italic>k</italic> we have
<disp-formula id="pgen.1009575.e044"><alternatives><graphic id="pgen.1009575.e044g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009575.e044" xlink:type="simple"/><mml:math display="block" id="M44"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="right"><mml:mrow><mml:msub><mml:mo form="prefix">Corr</mml:mo> <mml:mrow/></mml:msub> <mml:mo>[</mml:mo> <mml:msub><mml:mover accent="true"><mml:mo>Γ</mml:mo> <mml:mo>^</mml:mo></mml:mover> <mml:mi>j</mml:mi></mml:msub> <mml:mo>,</mml:mo> <mml:msub><mml:mover accent="true"><mml:mi>γ</mml:mi> <mml:mo>^</mml:mo></mml:mover> <mml:mrow><mml:mi>j</mml:mi> <mml:mi>k</mml:mi></mml:mrow></mml:msub> <mml:mo>]</mml:mo> <mml:mo>≈</mml:mo> <mml:mfrac><mml:msub><mml:mi>N</mml:mi> <mml:mrow><mml:mi>s</mml:mi> <mml:mi>k</mml:mi></mml:mrow></mml:msub> <mml:msqrt><mml:mrow><mml:msub><mml:mi>N</mml:mi> <mml:mrow><mml:mi>e</mml:mi> <mml:mi>k</mml:mi></mml:mrow></mml:msub> <mml:msub><mml:mi>N</mml:mi> <mml:mi>o</mml:mi></mml:msub></mml:mrow></mml:msqrt></mml:mfrac> <mml:msub><mml:mo form="prefix">Corr</mml:mo> <mml:mrow/></mml:msub> <mml:mo>[</mml:mo> <mml:msub><mml:mi>Y</mml:mi> <mml:mi>s</mml:mi></mml:msub> <mml:mo>,</mml:mo> <mml:msub><mml:mi>X</mml:mi> <mml:mrow><mml:mi>k</mml:mi> <mml:mi>s</mml:mi></mml:mrow></mml:msub> <mml:mo>]</mml:mo></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives> <label>(8)</label></disp-formula>
where <italic>N</italic><sub><italic>o</italic></sub> and <italic>N</italic><sub><italic>ek</italic></sub> are the total sample sizes for the disease and <italic>k</italic>th risk factor. <italic>N</italic><sub><italic>sk</italic></sub> is the number of shared samples. The correlation of <italic>X</italic><sub><italic>k</italic></sub> and <italic>Y</italic> of any shared sample is Corr[<italic>Y</italic><sub><italic>s</italic></sub>, <italic>X</italic><sub><italic>ks</italic></sub>]. <xref ref-type="disp-formula" rid="pgen.1009575.e044">Eq (8)</xref> shows that all the SNPs share the same correlation. As a consequence, we assume
<disp-formula id="pgen.1009575.e045"><alternatives><graphic id="pgen.1009575.e045g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009575.e045" xlink:type="simple"/><mml:math display="block" id="M45"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="right"><mml:mrow><mml:mo>(</mml:mo> <mml:mtable><mml:mtr><mml:mtd><mml:msub><mml:mover accent="true"><mml:mo>Γ</mml:mo> <mml:mo>^</mml:mo></mml:mover> <mml:mi>j</mml:mi></mml:msub></mml:mtd></mml:mtr> <mml:mtr><mml:mtd><mml:msub><mml:mover accent="true"><mml:mi>γ</mml:mi> <mml:mo>^</mml:mo></mml:mover> <mml:mi>j</mml:mi></mml:msub></mml:mtd></mml:mtr></mml:mtable> <mml:mo>)</mml:mo> <mml:mo>∼</mml:mo> <mml:mi mathvariant="script">N</mml:mi> <mml:mo>(</mml:mo> <mml:mo>(</mml:mo> <mml:mtable><mml:mtr><mml:mtd><mml:msub><mml:mo>Γ</mml:mo> <mml:mi>j</mml:mi></mml:msub></mml:mtd></mml:mtr> <mml:mtr><mml:mtd><mml:msub><mml:mi>γ</mml:mi> <mml:mi>j</mml:mi></mml:msub></mml:mtd></mml:mtr></mml:mtable> <mml:mo>)</mml:mo> <mml:mo>,</mml:mo> <mml:msub><mml:mo>Σ</mml:mo> <mml:mi>j</mml:mi></mml:msub> <mml:mo>=</mml:mo> <mml:mo>(</mml:mo> <mml:mtable><mml:mtr><mml:mtd><mml:msub><mml:mi>σ</mml:mi> <mml:msub><mml:mi>Y</mml:mi> <mml:mi>j</mml:mi></mml:msub></mml:msub></mml:mtd> <mml:mtd/><mml:mtd/><mml:mtd/></mml:mtr> <mml:mtr><mml:mtd/><mml:mtd><mml:msub><mml:mi>σ</mml:mi> <mml:msub><mml:mi>X</mml:mi> <mml:mrow><mml:mi>j</mml:mi> <mml:mn>1</mml:mn></mml:mrow></mml:msub></mml:msub></mml:mtd> <mml:mtd/><mml:mtd/></mml:mtr> <mml:mtr><mml:mtd/><mml:mtd/><mml:mtd><mml:mo>⋱</mml:mo></mml:mtd> <mml:mtd/></mml:mtr> <mml:mtr><mml:mtd/><mml:mtd/><mml:mtd/><mml:mtd><mml:msub><mml:mi>σ</mml:mi> <mml:msub><mml:mi>X</mml:mi> <mml:mrow><mml:mi>j</mml:mi> <mml:mi>K</mml:mi></mml:mrow></mml:msub></mml:msub></mml:mtd></mml:mtr></mml:mtable> <mml:mo>)</mml:mo> <mml:mo>Σ</mml:mo> <mml:mo>(</mml:mo> <mml:mtable><mml:mtr><mml:mtd><mml:msub><mml:mi>σ</mml:mi> <mml:msub><mml:mi>Y</mml:mi> <mml:mi>j</mml:mi></mml:msub></mml:msub></mml:mtd> <mml:mtd/><mml:mtd/><mml:mtd/></mml:mtr> <mml:mtr><mml:mtd/><mml:mtd><mml:msub><mml:mi>σ</mml:mi> <mml:msub><mml:mi>X</mml:mi> <mml:mrow><mml:mi>j</mml:mi> <mml:mn>1</mml:mn></mml:mrow></mml:msub></mml:msub></mml:mtd> <mml:mtd/><mml:mtd/></mml:mtr> <mml:mtr><mml:mtd/><mml:mtd/><mml:mtd><mml:mo>⋱</mml:mo></mml:mtd> <mml:mtd/></mml:mtr> <mml:mtr><mml:mtd/><mml:mtd/><mml:mtd/><mml:mtd><mml:msub><mml:mi>σ</mml:mi> <mml:msub><mml:mi>X</mml:mi> <mml:mrow><mml:mi>j</mml:mi> <mml:mi>K</mml:mi></mml:mrow></mml:msub></mml:msub></mml:mtd></mml:mtr></mml:mtable> <mml:mo>)</mml:mo> <mml:mo>)</mml:mo></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives> <label>(9)</label></disp-formula>
where Σ is the unknown shared correlation matrix.</p>
</sec>
<sec id="sec018">
<title>Estimate the shared correlation Σ</title>
<p>To estimate Σ from summary statistics, we can use <xref ref-type="disp-formula" rid="pgen.1009575.e044">Eq (8)</xref>. We first need to choose SNPs where <italic>γ</italic><sub><italic>jk</italic></sub> = 0 for all risk factors <italic>k</italic> so that we can estimate the shared correlation <inline-formula id="pgen.1009575.e046"><alternatives><graphic id="pgen.1009575.e046g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009575.e046" xlink:type="simple"/><mml:math display="inline" id="M46"><mml:mrow><mml:msub><mml:mo form="prefix">Corr</mml:mo> <mml:mrow/></mml:msub> <mml:mo>[</mml:mo> <mml:msub><mml:mover accent="true"><mml:mo>Γ</mml:mo> <mml:mo>^</mml:mo></mml:mover> <mml:mi>j</mml:mi></mml:msub> <mml:mo>,</mml:mo> <mml:msub><mml:mover accent="true"><mml:mi>γ</mml:mi> <mml:mo>^</mml:mo></mml:mover> <mml:mrow><mml:mi>j</mml:mi> <mml:mi>k</mml:mi></mml:mrow></mml:msub> <mml:mo>]</mml:mo></mml:mrow></mml:math></alternatives></inline-formula> using the sample correlation of the chosen SNPs. We choose all SNPs whose selection p-values <italic>p</italic><sub><italic>jk</italic></sub> ≥ 0.5 for all <italic>k</italic>.</p>
<p>For these selected SNPs, denote the Z-values of <inline-formula id="pgen.1009575.e047"><alternatives><graphic id="pgen.1009575.e047g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009575.e047" xlink:type="simple"/><mml:math display="inline" id="M47"><mml:mrow><mml:mo>(</mml:mo> <mml:msub><mml:mover accent="true"><mml:mi>γ</mml:mi> <mml:mo>^</mml:mo></mml:mover> <mml:mi>j</mml:mi></mml:msub> <mml:mo>,</mml:mo> <mml:msub><mml:mover accent="true"><mml:mo>Γ</mml:mo> <mml:mo>^</mml:mo></mml:mover> <mml:mi>j</mml:mi></mml:msub> <mml:mo>)</mml:mo></mml:mrow></mml:math></alternatives></inline-formula> for <italic>j</italic> = 1, ⋯, <italic>T</italic> as matrix <italic>Z</italic><sub><italic>T</italic>×(<italic>K</italic>+1)</sub> where <italic>T</italic> is the number of selected SNPs. Then Σ is estimated as the correlation matrix of <italic>Z</italic><sub><italic>T</italic>×(<italic>K</italic>+1)</sub>.</p>
</sec>
<sec id="sec019">
<title>Instruments selection using LD clumping</title>
<p>In GRAPPLE, we need to first select a set of SNPs as genetic instruments to estimate the causal effects <bold><italic>β</italic></bold>. Here, we only select independent SNPs to simplify the calculation. Besides the independence requirement, we only include SNPs that pass a p-value threshold to reduce the inclusion of false positives that can decrease power. To avoid selection bias, a separate cohort for each risk factor is used where the reported p-values in that cohort are used for instruments selection. Denote the selection p-value for SNP <italic>j</italic> and risk factor <italic>k</italic> as <italic>p</italic><sub><italic>jk</italic></sub>, for multiple risk factors and a given selection threshold, we require the Bonferroni combined p-values <italic>K</italic> min(<italic>p</italic><sub><italic>jk</italic></sub>) to pass the threshold. After that, we use LD clumping with PLINK [<xref ref-type="bibr" rid="pgen.1009575.ref087">87</xref>] to select independent genetic instruments. The LD <italic>r</italic><sup>2</sup> threshold for PLINK is set to 0.001.</p>
</sec>
<sec id="sec020">
<title>Estimate the effects <italic>β</italic></title>
<p>Here, we perform statistical analysis assuming <italic>α</italic><sub><italic>j</italic></sub> ∼ <italic>N</italic>(0, <italic>τ</italic><sup>2</sup>) for the pleiotropic effects, while robust to outliers where the pleiotropic effects for a few instruments are large.</p>
<p>Under model (<xref ref-type="disp-formula" rid="pgen.1009575.e045">9</xref>), <xref ref-type="disp-formula" rid="pgen.1009575.e006">Eq (2)</xref> and given Σ, the log-likelihood with GWAS summary statistics satisfy:
<disp-formula id="pgen.1009575.e048"><alternatives><graphic id="pgen.1009575.e048g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009575.e048" xlink:type="simple"/><mml:math display="block" id="M48"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd/><mml:mtd columnalign="left"><mml:mrow><mml:mi>L</mml:mi> <mml:mo>(</mml:mo> <mml:mi mathvariant="bold-italic">β</mml:mi> <mml:mo>,</mml:mo> <mml:msub><mml:mi>γ</mml:mi> <mml:mn>1</mml:mn></mml:msub> <mml:mo>,</mml:mo> <mml:mo>⋯</mml:mo> <mml:mo>,</mml:mo> <mml:msub><mml:mi>γ</mml:mi> <mml:mi>p</mml:mi></mml:msub> <mml:mo>,</mml:mo> <mml:msup><mml:mi>τ</mml:mi> <mml:mn>2</mml:mn></mml:msup> <mml:mo>)</mml:mo></mml:mrow></mml:mtd></mml:mtr> <mml:mtr><mml:mtd columnalign="right"><mml:mo>=</mml:mo></mml:mtd> <mml:mtd><mml:mrow><mml:mo>-</mml:mo> <mml:mfrac><mml:mn>1</mml:mn> <mml:mn>2</mml:mn></mml:mfrac> <mml:munderover><mml:mo>∑</mml:mo> <mml:mrow><mml:mi>j</mml:mi> <mml:mo>=</mml:mo> <mml:mn>1</mml:mn></mml:mrow> <mml:mi>p</mml:mi></mml:munderover> <mml:mo>[</mml:mo> <mml:msup><mml:mrow><mml:mo>(</mml:mo> <mml:mtable><mml:mtr><mml:mtd><mml:mrow><mml:msub><mml:mover accent="true"><mml:mo>Γ</mml:mo> <mml:mo>^</mml:mo></mml:mover> <mml:mi>j</mml:mi></mml:msub> <mml:mo>-</mml:mo> <mml:msubsup><mml:mi>γ</mml:mi> <mml:mi>j</mml:mi> <mml:mi>T</mml:mi></mml:msubsup> <mml:mi>β</mml:mi></mml:mrow></mml:mtd></mml:mtr> <mml:mtr><mml:mtd><mml:mrow><mml:msub><mml:mover accent="true"><mml:mi>γ</mml:mi> <mml:mo>^</mml:mo></mml:mover> <mml:mi>j</mml:mi></mml:msub> <mml:mo>-</mml:mo> <mml:msub><mml:mi>γ</mml:mi> <mml:mi>j</mml:mi></mml:msub></mml:mrow></mml:mtd></mml:mtr></mml:mtable> <mml:mo>)</mml:mo></mml:mrow> <mml:mi>T</mml:mi></mml:msup> <mml:msup><mml:mrow><mml:mo>(</mml:mo> <mml:msub><mml:mo>Σ</mml:mo> <mml:mi>j</mml:mi></mml:msub> <mml:mo>+</mml:mo> <mml:msup><mml:mi>τ</mml:mi> <mml:mn>2</mml:mn></mml:msup> <mml:mi>e</mml:mi> <mml:msup><mml:mi>e</mml:mi> <mml:mi>T</mml:mi></mml:msup> <mml:mo>)</mml:mo></mml:mrow> <mml:mrow><mml:mo>-</mml:mo> <mml:mn>1</mml:mn></mml:mrow></mml:msup> <mml:mo>(</mml:mo> <mml:mtable><mml:mtr><mml:mtd><mml:mrow><mml:msub><mml:mover accent="true"><mml:mo>Γ</mml:mo> <mml:mo>^</mml:mo></mml:mover> <mml:mi>j</mml:mi></mml:msub> <mml:mo>-</mml:mo> <mml:msubsup><mml:mi>γ</mml:mi> <mml:mi>j</mml:mi> <mml:mi>T</mml:mi></mml:msubsup> <mml:mi>β</mml:mi></mml:mrow></mml:mtd></mml:mtr> <mml:mtr><mml:mtd><mml:mrow><mml:msub><mml:mover accent="true"><mml:mi>γ</mml:mi> <mml:mo>^</mml:mo></mml:mover> <mml:mi>j</mml:mi></mml:msub> <mml:mo>-</mml:mo> <mml:msub><mml:mi>γ</mml:mi> <mml:mi>j</mml:mi></mml:msub></mml:mrow></mml:mtd></mml:mtr></mml:mtable> <mml:mo>)</mml:mo> <mml:mo>+</mml:mo> <mml:mo form="prefix">log</mml:mo> <mml:mrow><mml:mo>|</mml:mo> <mml:msub><mml:mo>Σ</mml:mo> <mml:mi>j</mml:mi></mml:msub> <mml:mo>+</mml:mo> <mml:msup><mml:mi>τ</mml:mi> <mml:mn>2</mml:mn></mml:msup> <mml:mi>e</mml:mi> <mml:msup><mml:mi>e</mml:mi> <mml:mi>T</mml:mi></mml:msup> <mml:mo>|</mml:mo></mml:mrow> <mml:mo>]</mml:mo></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives></disp-formula>
up to some additive constant. Here, <italic>e</italic> = (1, 0, ⋯, 0).</p>
<p>Define for each SNP <italic>j</italic> the statistics
<disp-formula id="pgen.1009575.e049"><alternatives><graphic id="pgen.1009575.e049g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009575.e049" xlink:type="simple"/><mml:math display="block" id="M49"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="right"><mml:mrow><mml:msub><mml:mi>t</mml:mi> <mml:mi>j</mml:mi></mml:msub> <mml:mrow><mml:mo>(</mml:mo> <mml:mi mathvariant="bold-italic">β</mml:mi> <mml:mo>,</mml:mo> <mml:msup><mml:mi>τ</mml:mi> <mml:mn>2</mml:mn></mml:msup> <mml:mo>)</mml:mo></mml:mrow> <mml:mo>=</mml:mo> <mml:mfrac><mml:mrow><mml:msub><mml:mover accent="true"><mml:mo>Γ</mml:mo> <mml:mo>^</mml:mo></mml:mover> <mml:mi>j</mml:mi></mml:msub> <mml:mo>-</mml:mo> <mml:msup><mml:mover accent="true"><mml:msub><mml:mi>γ</mml:mi> <mml:mi>j</mml:mi></mml:msub> <mml:mo>^</mml:mo></mml:mover> <mml:mi>T</mml:mi></mml:msup> <mml:mi mathvariant="bold-italic">β</mml:mi></mml:mrow> <mml:msqrt><mml:mrow><mml:msubsup><mml:mi>σ</mml:mi> <mml:mrow><mml:msub><mml:mi>Y</mml:mi> <mml:mi>j</mml:mi></mml:msub></mml:mrow> <mml:mn>2</mml:mn></mml:msubsup> <mml:mo>+</mml:mo> <mml:msup><mml:mi mathvariant="bold-italic">β</mml:mi> <mml:mi>T</mml:mi></mml:msup> <mml:msub><mml:mo>Σ</mml:mo> <mml:msub><mml:mi mathvariant="bold-italic">X</mml:mi> <mml:mi>j</mml:mi></mml:msub></mml:msub> <mml:mi mathvariant="bold-italic">β</mml:mi> <mml:mo>-</mml:mo> <mml:mn>2</mml:mn> <mml:msup><mml:mi mathvariant="bold-italic">β</mml:mi> <mml:mi>T</mml:mi></mml:msup> <mml:msub><mml:mo>Σ</mml:mo> <mml:mrow><mml:msub><mml:mi mathvariant="bold-italic">X</mml:mi> <mml:mi>j</mml:mi></mml:msub> <mml:msub><mml:mi>Y</mml:mi> <mml:mi>j</mml:mi></mml:msub></mml:mrow></mml:msub> <mml:mo>+</mml:mo> <mml:msup><mml:mi>τ</mml:mi> <mml:mn>2</mml:mn></mml:msup></mml:mrow></mml:msqrt></mml:mfrac></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives> <label>(10)</label></disp-formula>
where <inline-formula id="pgen.1009575.e050"><alternatives><graphic id="pgen.1009575.e050g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009575.e050" xlink:type="simple"/><mml:math display="inline" id="M50"><mml:msub><mml:mo>Σ</mml:mo> <mml:msub><mml:mi mathvariant="bold-italic">X</mml:mi> <mml:mi>j</mml:mi></mml:msub></mml:msub></mml:math></alternatives></inline-formula> is the variance of <inline-formula id="pgen.1009575.e051"><alternatives><graphic id="pgen.1009575.e051g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009575.e051" xlink:type="simple"/><mml:math display="inline" id="M51"><mml:msub><mml:mover accent="true"><mml:mi>γ</mml:mi> <mml:mo>^</mml:mo></mml:mover> <mml:mi>j</mml:mi></mml:msub></mml:math></alternatives></inline-formula> and <inline-formula id="pgen.1009575.e052"><alternatives><graphic id="pgen.1009575.e052g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009575.e052" xlink:type="simple"/><mml:math display="inline" id="M52"><mml:msub><mml:mo>Σ</mml:mo> <mml:mrow><mml:msub><mml:mi mathvariant="bold-italic">X</mml:mi> <mml:mi>j</mml:mi></mml:msub> <mml:msub><mml:mi>Y</mml:mi> <mml:mi>j</mml:mi></mml:msub></mml:mrow></mml:msub></mml:math></alternatives></inline-formula> is the covariance between <inline-formula id="pgen.1009575.e053"><alternatives><graphic id="pgen.1009575.e053g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009575.e053" xlink:type="simple"/><mml:math display="inline" id="M53"><mml:msub><mml:mover accent="true"><mml:mi>γ</mml:mi> <mml:mo>^</mml:mo></mml:mover> <mml:mi>j</mml:mi></mml:msub></mml:math></alternatives></inline-formula> and <inline-formula id="pgen.1009575.e054"><alternatives><graphic id="pgen.1009575.e054g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009575.e054" xlink:type="simple"/><mml:math display="inline" id="M54"><mml:msub><mml:mover accent="true"><mml:mo>Γ</mml:mo> <mml:mo>^</mml:mo></mml:mover> <mml:mi>j</mml:mi></mml:msub></mml:math></alternatives></inline-formula> in Σ<sub><italic>j</italic></sub>. Then the profile log-likelihood that profile out parameters <inline-formula id="pgen.1009575.e055"><alternatives><graphic id="pgen.1009575.e055g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009575.e055" xlink:type="simple"/><mml:math display="inline" id="M55"><mml:mrow><mml:mo>(</mml:mo> <mml:msub><mml:mi>γ</mml:mi> <mml:mn>1</mml:mn></mml:msub> <mml:mo>,</mml:mo> <mml:mo>⋯</mml:mo> <mml:mo>,</mml:mo> <mml:msub><mml:mi>γ</mml:mi> <mml:mi>p</mml:mi></mml:msub> <mml:mo>)</mml:mo></mml:mrow></mml:math></alternatives></inline-formula> results in
<disp-formula id="pgen.1009575.e056"><alternatives><graphic id="pgen.1009575.e056g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009575.e056" xlink:type="simple"/><mml:math display="block" id="M56"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="right"><mml:mrow><mml:mi>L</mml:mi> <mml:mrow><mml:mo>(</mml:mo> <mml:mi mathvariant="bold-italic">β</mml:mi> <mml:mo>,</mml:mo> <mml:msup><mml:mi>τ</mml:mi> <mml:mn>2</mml:mn></mml:msup> <mml:mo>)</mml:mo></mml:mrow> <mml:mo>=</mml:mo> <mml:msub><mml:mtext>max</mml:mtext> <mml:mrow><mml:mo>(</mml:mo> <mml:msub><mml:mi>γ</mml:mi> <mml:mn>1</mml:mn></mml:msub> <mml:mo>,</mml:mo> <mml:mo>⋯</mml:mo> <mml:mo>,</mml:mo> <mml:msub><mml:mi>γ</mml:mi> <mml:mi>p</mml:mi></mml:msub> <mml:mo>)</mml:mo></mml:mrow></mml:msub> <mml:mi>L</mml:mi> <mml:mrow><mml:mo>(</mml:mo> <mml:mi mathvariant="bold-italic">β</mml:mi> <mml:mo>,</mml:mo> <mml:msub><mml:mi>γ</mml:mi> <mml:mn>1</mml:mn></mml:msub> <mml:mo>,</mml:mo> <mml:mo>⋯</mml:mo> <mml:mo>,</mml:mo> <mml:msub><mml:mi>γ</mml:mi> <mml:mi>p</mml:mi></mml:msub> <mml:mo>,</mml:mo> <mml:msup><mml:mi>τ</mml:mi> <mml:mn>2</mml:mn></mml:msup> <mml:mo>)</mml:mo></mml:mrow> <mml:mo>=</mml:mo> <mml:mo>-</mml:mo> <mml:mfrac><mml:mn>1</mml:mn> <mml:mn>2</mml:mn></mml:mfrac> <mml:munderover><mml:mo>∑</mml:mo> <mml:mrow><mml:mi>j</mml:mi> <mml:mo>=</mml:mo> <mml:mn>1</mml:mn></mml:mrow> <mml:mi>p</mml:mi></mml:munderover> <mml:mo>[</mml:mo> <mml:msub><mml:mi>t</mml:mi> <mml:mi>j</mml:mi></mml:msub> <mml:msup><mml:mrow><mml:mo>(</mml:mo> <mml:mi mathvariant="bold-italic">β</mml:mi> <mml:mo>,</mml:mo> <mml:msup><mml:mi>τ</mml:mi> <mml:mn>2</mml:mn></mml:msup> <mml:mo>)</mml:mo></mml:mrow> <mml:mn>2</mml:mn></mml:msup> <mml:mo>+</mml:mo> <mml:mo form="prefix">log</mml:mo> <mml:mrow><mml:mo>|</mml:mo> <mml:msub><mml:mo>Σ</mml:mo> <mml:mi>j</mml:mi></mml:msub> <mml:mo>+</mml:mo> <mml:msup><mml:mi>τ</mml:mi> <mml:mn>2</mml:mn></mml:msup> <mml:mi>e</mml:mi> <mml:msup><mml:mi>e</mml:mi> <mml:mi>T</mml:mi></mml:msup> <mml:mo>|</mml:mo></mml:mrow> <mml:mo>]</mml:mo></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives></disp-formula></p>
<p>As discussed in [<xref ref-type="bibr" rid="pgen.1009575.ref010">10</xref>], maximizing <inline-formula id="pgen.1009575.e057"><alternatives><graphic id="pgen.1009575.e057g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009575.e057" xlink:type="simple"/><mml:math display="inline" id="M57"><mml:mrow><mml:mi>L</mml:mi> <mml:mo>(</mml:mo> <mml:mi mathvariant="bold-italic">β</mml:mi> <mml:mo>,</mml:mo> <mml:msup><mml:mi>τ</mml:mi> <mml:mn>2</mml:mn></mml:msup> <mml:mo>)</mml:mo></mml:mrow></mml:math></alternatives></inline-formula> would not give consistent estimate of <italic>τ</italic><sup>2</sup>. Because of this and the goal of making <inline-formula id="pgen.1009575.e058"><alternatives><graphic id="pgen.1009575.e058g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009575.e058" xlink:type="simple"/><mml:math display="inline" id="M58"><mml:mover accent="true"><mml:mi mathvariant="bold-italic">β</mml:mi> <mml:mo>^</mml:mo></mml:mover></mml:math></alternatives></inline-formula> robust to outlier SNPs with large pleiotropic effects, our optimization function is the adjusted robust profile likelihood defined as
<disp-formula id="pgen.1009575.e059"><alternatives><graphic id="pgen.1009575.e059g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009575.e059" xlink:type="simple"/><mml:math display="block" id="M59"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="right"><mml:mrow><mml:mi>l</mml:mi> <mml:mrow><mml:mo>(</mml:mo> <mml:mi mathvariant="bold-italic">β</mml:mi> <mml:mo>,</mml:mo> <mml:msup><mml:mi>τ</mml:mi> <mml:mn>2</mml:mn></mml:msup> <mml:mo>)</mml:mo></mml:mrow> <mml:mo>=</mml:mo> <mml:mo>-</mml:mo> <mml:munder><mml:mo>∑</mml:mo> <mml:mi>j</mml:mi></mml:munder> <mml:msub><mml:mi>l</mml:mi> <mml:mi>j</mml:mi></mml:msub> <mml:mrow><mml:mo>(</mml:mo> <mml:mi mathvariant="bold-italic">β</mml:mi> <mml:mo>,</mml:mo> <mml:msup><mml:mi>τ</mml:mi> <mml:mn>2</mml:mn></mml:msup> <mml:mo>)</mml:mo></mml:mrow> <mml:mo>=</mml:mo> <mml:mo>-</mml:mo> <mml:munder><mml:mo>∑</mml:mo> <mml:mi>j</mml:mi></mml:munder> <mml:mi>ρ</mml:mi> <mml:mo>(</mml:mo> <mml:msub><mml:mi>t</mml:mi> <mml:mi>j</mml:mi></mml:msub> <mml:mrow><mml:mo>(</mml:mo> <mml:mi mathvariant="bold-italic">β</mml:mi> <mml:mo>,</mml:mo> <mml:msup><mml:mi>τ</mml:mi> <mml:mn>2</mml:mn></mml:msup> <mml:mo>)</mml:mo></mml:mrow> <mml:mo>)</mml:mo></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives> <label>(11)</label></disp-formula>
where <italic>ρ</italic>(⋅) is some robust loss function. By default, GRAPPLE uses the Tukey’s Biweight loss function:
<disp-formula id="pgen.1009575.e060"><alternatives><graphic id="pgen.1009575.e060g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009575.e060" xlink:type="simple"/><mml:math display="block" id="M60"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="right"><mml:mrow><mml:mi>ρ</mml:mi> <mml:mrow><mml:mo>(</mml:mo> <mml:mi>r</mml:mi> <mml:mo>)</mml:mo></mml:mrow> <mml:mo>=</mml:mo> <mml:mo>{</mml:mo> <mml:mtable><mml:mtr><mml:mtd columnalign="left"><mml:mrow><mml:mfrac><mml:msup><mml:mi>c</mml:mi> <mml:mn>2</mml:mn></mml:msup> <mml:mn>6</mml:mn></mml:mfrac> <mml:mo>[</mml:mo> <mml:mn>1</mml:mn> <mml:mo>-</mml:mo> <mml:msup><mml:mrow><mml:mo>(</mml:mo> <mml:mn>1</mml:mn> <mml:mo>-</mml:mo> <mml:msup><mml:mrow><mml:mo>(</mml:mo> <mml:mi>r</mml:mi> <mml:mo>/</mml:mo> <mml:mi>c</mml:mi> <mml:mo>)</mml:mo></mml:mrow> <mml:mn>2</mml:mn></mml:msup> <mml:mo>)</mml:mo></mml:mrow> <mml:mn>3</mml:mn></mml:msup> <mml:mo>]</mml:mo></mml:mrow></mml:mtd> <mml:mtd columnalign="left"><mml:mrow><mml:mspace width="4pt"/><mml:mtext>if</mml:mtext> <mml:mspace width="4pt"/><mml:mo>|</mml:mo> <mml:mi>r</mml:mi> <mml:mo>|</mml:mo> <mml:mo>≤</mml:mo> <mml:mi>c</mml:mi></mml:mrow></mml:mtd></mml:mtr> <mml:mtr><mml:mtd columnalign="left"><mml:mrow><mml:msup><mml:mi>c</mml:mi> <mml:mn>2</mml:mn></mml:msup> <mml:mo>/</mml:mo> <mml:mn>6</mml:mn></mml:mrow></mml:mtd> <mml:mtd columnalign="left"><mml:mrow><mml:mspace width="4pt"/><mml:mtext>otherwise</mml:mtext> <mml:mspace width="4pt"/></mml:mrow></mml:mtd></mml:mtr></mml:mtable> <mml:mo/></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives></disp-formula>
where <italic>c</italic> is set to its common default value 4.6851. We maximize (<xref ref-type="disp-formula" rid="pgen.1009575.e059">11</xref>) with respect to <bold><italic>β</italic></bold> as well as solving the following estimating equation for the heterogeneity <italic>τ</italic><sup>2</sup> which is
<disp-formula id="pgen.1009575.e061"><alternatives><graphic id="pgen.1009575.e061g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009575.e061" xlink:type="simple"/><mml:math display="block" id="M61"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="right"><mml:mrow><mml:msub><mml:mi>φ</mml:mi> <mml:mn>2</mml:mn></mml:msub> <mml:mrow><mml:mo>(</mml:mo> <mml:mi mathvariant="bold-italic">β</mml:mi> <mml:mo>,</mml:mo> <mml:msup><mml:mi>τ</mml:mi> <mml:mn>2</mml:mn></mml:msup> <mml:mo>)</mml:mo></mml:mrow> <mml:mo>=</mml:mo> <mml:mi>l</mml:mi> <mml:mrow><mml:mo>(</mml:mo> <mml:mi mathvariant="bold-italic">β</mml:mi> <mml:mo>,</mml:mo> <mml:msup><mml:mi>τ</mml:mi> <mml:mn>2</mml:mn></mml:msup> <mml:mo>)</mml:mo></mml:mrow> <mml:mo>-</mml:mo> <mml:mi>p</mml:mi> <mml:mi>η</mml:mi> <mml:mo>=</mml:mo> <mml:mn>0</mml:mn></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives> <label>(12)</label></disp-formula>
where <inline-formula id="pgen.1009575.e062"><alternatives><graphic id="pgen.1009575.e062g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009575.e062" xlink:type="simple"/><mml:math display="inline" id="M62"><mml:mrow><mml:mi>η</mml:mi> <mml:mo>=</mml:mo> <mml:msub><mml:mi mathvariant="double-struck">E</mml:mi> <mml:mrow/></mml:msub> <mml:mo>[</mml:mo> <mml:mi>ρ</mml:mi> <mml:mo>(</mml:mo> <mml:mi>Z</mml:mi> <mml:mo>)</mml:mo> <mml:mo>]</mml:mo></mml:mrow></mml:math></alternatives></inline-formula> with <inline-formula id="pgen.1009575.e063"><alternatives><graphic id="pgen.1009575.e063g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009575.e063" xlink:type="simple"/><mml:math display="inline" id="M63"><mml:mrow><mml:mi>Z</mml:mi> <mml:mo>∼</mml:mo> <mml:mi mathvariant="script">N</mml:mi> <mml:mo>(</mml:mo> <mml:mn>0</mml:mn> <mml:mo>,</mml:mo> <mml:mn>1</mml:mn> <mml:mo>)</mml:mo></mml:mrow></mml:math></alternatives></inline-formula>. The estimating equation satisfies <inline-formula id="pgen.1009575.e064"><alternatives><graphic id="pgen.1009575.e064g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009575.e064" xlink:type="simple"/><mml:math display="inline" id="M64"><mml:mrow><mml:msub><mml:mi mathvariant="double-struck">E</mml:mi> <mml:mrow/></mml:msub> <mml:mo>[</mml:mo> <mml:msub><mml:mi>φ</mml:mi> <mml:mn>2</mml:mn></mml:msub> <mml:mrow><mml:mo>(</mml:mo> <mml:mi mathvariant="bold-italic">β</mml:mi> <mml:mo>,</mml:mo> <mml:msup><mml:mi>τ</mml:mi> <mml:mn>2</mml:mn></mml:msup> <mml:mo>)</mml:mo></mml:mrow> <mml:mo>]</mml:mo> <mml:mo>=</mml:mo> <mml:mn>0</mml:mn></mml:mrow></mml:math></alternatives></inline-formula> at the true values of <bold><italic>β</italic></bold> and <italic>τ</italic><sup>2</sup>, thus can result in consistent estimate of <italic>τ</italic><sup>2</sup>. For the details of estimating <bold><italic>β</italic></bold> and <italic>τ</italic><sup>2</sup> as well building confidence intervals for them, see <xref ref-type="supplementary-material" rid="pgen.1009575.s008">S2 Text</xref>.</p>
</sec>
<sec id="sec021">
<title>Identify pleiotropic pathways via the multi-modality diagnosis</title>
<p>We use the mode detection of the robust profile likelihood (<xref ref-type="disp-formula" rid="pgen.1009575.e059">11</xref>) to detect multiple pleiotropic pathways. To increase sensitivity, we set <italic>τ</italic><sup>2</sup> = 0 and reduce the tuning parameter in the Tukey’s Biweight loss function to <italic>c</italic> = 3. Here we present a detailed argument on why mode detection can identify pleiotropic pathways.</p>
<p>If there is a confounding Genetic Pathway 2 <inline-formula id="pgen.1009575.e065"><alternatives><graphic id="pgen.1009575.e065g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009575.e065" xlink:type="simple"/><mml:math display="inline" id="M65"><mml:mover accent="true"><mml:mi>X</mml:mi> <mml:mo>˜</mml:mo></mml:mover></mml:math></alternatives></inline-formula>, as shown in <xref ref-type="fig" rid="pgen.1009575.g001">Fig 1a</xref>, that are missed, then we have the structural equation
<disp-formula id="pgen.1009575.e066"><alternatives><graphic id="pgen.1009575.e066g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009575.e066" xlink:type="simple"/><mml:math display="block" id="M66"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="right"><mml:mrow><mml:mi>Y</mml:mi> <mml:mo>=</mml:mo> <mml:mi>β</mml:mi> <mml:mi>X</mml:mi> <mml:mo>+</mml:mo> <mml:mi>κ</mml:mi> <mml:mover accent="true"><mml:mi>X</mml:mi> <mml:mo>˜</mml:mo></mml:mover> <mml:mo>+</mml:mo> <mml:mi>f</mml:mi> <mml:mrow><mml:mo>(</mml:mo> <mml:mi>U</mml:mi> <mml:mo>,</mml:mo> <mml:msub><mml:mi>Z</mml:mi> <mml:mn>1</mml:mn></mml:msub> <mml:mo>,</mml:mo> <mml:mo>⋯</mml:mo> <mml:mo>,</mml:mo> <mml:msub><mml:mi>Z</mml:mi> <mml:mi>p</mml:mi></mml:msub> <mml:mo>,</mml:mo> <mml:msub><mml:mi>E</mml:mi> <mml:mi>Y</mml:mi></mml:msub> <mml:mo>)</mml:mo></mml:mrow></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives></disp-formula>
and also the linear model
<disp-formula id="pgen.1009575.e067"><alternatives><graphic id="pgen.1009575.e067g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009575.e067" xlink:type="simple"/><mml:math display="block" id="M67"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="right"><mml:mrow><mml:mi>X</mml:mi> <mml:mo>=</mml:mo> <mml:mi>δ</mml:mi> <mml:mover accent="true"><mml:mi>X</mml:mi> <mml:mo>˜</mml:mo></mml:mover> <mml:mo>+</mml:mo> <mml:mi>ϵ</mml:mi> <mml:mo>,</mml:mo> <mml:mspace width="1em"/><mml:mtext>Corr</mml:mtext> <mml:mrow><mml:mo>(</mml:mo> <mml:msub><mml:mi>Z</mml:mi> <mml:mi>j</mml:mi></mml:msub> <mml:mo>,</mml:mo> <mml:mi>ϵ</mml:mi> <mml:mo>)</mml:mo></mml:mrow> <mml:mo>=</mml:mo> <mml:mn>0</mml:mn> <mml:mo>.</mml:mo></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives> <label>(13)</label></disp-formula>
for a SNP <italic>j</italic> that only associates with Genetic Pathway 2 and uncorrelates with <italic>X</italic> conditional on <inline-formula id="pgen.1009575.e068"><alternatives><graphic id="pgen.1009575.e068g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009575.e068" xlink:type="simple"/><mml:math display="inline" id="M68"><mml:mover accent="true"><mml:mi>X</mml:mi> <mml:mo>˜</mml:mo></mml:mover></mml:math></alternatives></inline-formula>. Similar to (<xref ref-type="disp-formula" rid="pgen.1009575.e033">5</xref>), we have
<disp-formula id="pgen.1009575.e069"><alternatives><graphic id="pgen.1009575.e069g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009575.e069" xlink:type="simple"/><mml:math display="block" id="M69"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="right"><mml:mrow><mml:mi>X</mml:mi> <mml:mo>=</mml:mo> <mml:msub><mml:mi>γ</mml:mi> <mml:mi>j</mml:mi></mml:msub> <mml:msub><mml:mi>Z</mml:mi> <mml:mi>j</mml:mi></mml:msub> <mml:mo>+</mml:mo> <mml:msub><mml:mi>ϵ</mml:mi> <mml:mi>j</mml:mi></mml:msub> <mml:mo>,</mml:mo> <mml:mspace width="1em"/><mml:mover accent="true"><mml:mi>X</mml:mi> <mml:mo>˜</mml:mo></mml:mover> <mml:mo>=</mml:mo> <mml:msub><mml:mover accent="true"><mml:mi>γ</mml:mi> <mml:mo>˜</mml:mo></mml:mover> <mml:mi>j</mml:mi></mml:msub> <mml:msub><mml:mi>Z</mml:mi> <mml:mi>j</mml:mi></mml:msub> <mml:mo>+</mml:mo> <mml:msub><mml:mover accent="true"><mml:mi>ϵ</mml:mi> <mml:mo>˜</mml:mo></mml:mover> <mml:mi>j</mml:mi></mml:msub></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives></disp-formula></p>
<p>Plug in (<xref ref-type="disp-formula" rid="pgen.1009575.e067">13</xref>), we have
<disp-formula id="pgen.1009575.e070"><alternatives><graphic id="pgen.1009575.e070g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009575.e070" xlink:type="simple"/><mml:math display="block" id="M70"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="right"><mml:mrow><mml:msub><mml:mi>γ</mml:mi> <mml:mi>j</mml:mi></mml:msub> <mml:mo>=</mml:mo> <mml:mi>δ</mml:mi> <mml:msub><mml:mover accent="true"><mml:mi>γ</mml:mi> <mml:mo>˜</mml:mo></mml:mover> <mml:mi>j</mml:mi></mml:msub></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives></disp-formula> <disp-formula id="pgen.1009575.e071"><alternatives><graphic id="pgen.1009575.e071g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009575.e071" xlink:type="simple"/><mml:math display="block" id="M71"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="right"><mml:mrow><mml:msub><mml:mo>Γ</mml:mo> <mml:mi>j</mml:mi></mml:msub> <mml:mo>=</mml:mo> <mml:mi>β</mml:mi> <mml:msub><mml:mi>γ</mml:mi> <mml:mi>j</mml:mi></mml:msub> <mml:mo>+</mml:mo> <mml:mi>κ</mml:mi> <mml:msub><mml:mover accent="true"><mml:mi>γ</mml:mi> <mml:mo>˜</mml:mo></mml:mover> <mml:mi>j</mml:mi></mml:msub> <mml:mo>+</mml:mo> <mml:msub><mml:mi>α</mml:mi> <mml:mi>j</mml:mi></mml:msub> <mml:mo>=</mml:mo> <mml:mrow><mml:mo>(</mml:mo> <mml:mi>β</mml:mi> <mml:mo>+</mml:mo> <mml:mi>κ</mml:mi> <mml:mo>/</mml:mo> <mml:mi>δ</mml:mi> <mml:mo>)</mml:mo></mml:mrow> <mml:msub><mml:mi>γ</mml:mi> <mml:mi>j</mml:mi></mml:msub> <mml:mo>+</mml:mo> <mml:msub><mml:mi>α</mml:mi> <mml:mi>j</mml:mi></mml:msub></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives></disp-formula></p>
<p>Thus, if there are enough SNPs like SNP <italic>j</italic>, they would contribute to another mode of (<xref ref-type="disp-formula" rid="pgen.1009575.e016">4</xref>) at <italic>β</italic> + <italic>κ</italic>/<italic>δ</italic>.</p>
<p>The same argument works for identification of the causal direction. Say there is another <inline-formula id="pgen.1009575.e072"><alternatives><graphic id="pgen.1009575.e072g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009575.e072" xlink:type="simple"/><mml:math display="inline" id="M72"><mml:mover accent="true"><mml:mi>X</mml:mi> <mml:mo>˜</mml:mo></mml:mover></mml:math></alternatives></inline-formula> that affects <italic>Y</italic> but is uncorrelated with the risk factor <italic>X</italic> (<italic>δ</italic> = 0). The existence of such <inline-formula id="pgen.1009575.e073"><alternatives><graphic id="pgen.1009575.e073g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009575.e073" xlink:type="simple"/><mml:math display="inline" id="M73"><mml:mover accent="true"><mml:mi>X</mml:mi> <mml:mo>˜</mml:mo></mml:mover></mml:math></alternatives></inline-formula> is common, unless <italic>X</italic> is the only heritable risk factor of <italic>Y</italic>. SNPs strongly associated with <inline-formula id="pgen.1009575.e074"><alternatives><graphic id="pgen.1009575.e074g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009575.e074" xlink:type="simple"/><mml:math display="inline" id="M74"><mml:mover accent="true"><mml:mi>X</mml:mi> <mml:mo>˜</mml:mo></mml:mover></mml:math></alternatives></inline-formula> would not likely be selected when <italic>X</italic> is the exposure while would appear when the roles of <italic>X</italic> and <italic>Y</italic> are switched. These SNPs can be used to identify the causal direction, as as in the reverse MR, they contribute to a mode at 0, while the SNPs that affect <italic>Y</italic> through <italic>X</italic> will contribute to a mode at 1/<italic>β</italic>.</p>
</sec>
<sec id="sec022">
<title>Select marker SNPs and genes for each mode</title>
<p>GRAPPLE uses LD clumping with a stringent <italic>r</italic><sup>2</sup> (= 0.001) threshold to guarantee independence among the genetic instruments. However, marker SNPs are not restricted to these independent instruments in order to get more biological meaningful markers. Marker SNPs are selected from a SNP set <inline-formula id="pgen.1009575.e075"><alternatives><graphic id="pgen.1009575.e075g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009575.e075" xlink:type="simple"/><mml:math display="inline" id="M75"><mml:mi mathvariant="script">G</mml:mi></mml:math></alternatives></inline-formula> where the SNPs are selected using LD clumping with <italic>r</italic><sup>2</sup> threshold 0.05.</p>
<p>Assume that there are <italic>M</italic> modes detected at positions <italic>β</italic><sub>1</sub>, <italic>β</italic><sub>2</sub>, ⋯, <italic>β</italic><sub><italic>M</italic></sub>. Define the residual of SNP <italic>j</italic> (<inline-formula id="pgen.1009575.e076"><alternatives><graphic id="pgen.1009575.e076g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009575.e076" xlink:type="simple"/><mml:math display="inline" id="M76"><mml:mrow><mml:mi>j</mml:mi> <mml:mo>∈</mml:mo> <mml:mi mathvariant="script">G</mml:mi></mml:mrow></mml:math></alternatives></inline-formula>) for mode <italic>m</italic> as
<disp-formula id="pgen.1009575.e077"><alternatives><graphic id="pgen.1009575.e077g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009575.e077" xlink:type="simple"/><mml:math display="block" id="M77"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="right"><mml:mrow><mml:msub><mml:mi>r</mml:mi> <mml:mrow><mml:mi>j</mml:mi> <mml:mi>m</mml:mi></mml:mrow></mml:msub> <mml:mo>=</mml:mo> <mml:msub><mml:mi>t</mml:mi> <mml:mi>j</mml:mi></mml:msub> <mml:mrow><mml:mo>(</mml:mo> <mml:msub><mml:mi>β</mml:mi> <mml:mi>m</mml:mi></mml:msub> <mml:mo>,</mml:mo> <mml:mn>0</mml:mn> <mml:mo>)</mml:mo></mml:mrow></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives></disp-formula>
where <italic>t</italic><sub><italic>j</italic></sub>(⋅, ⋅) is defined in <xref ref-type="disp-formula" rid="pgen.1009575.e049">Eq (10)</xref>. SNP <italic>j</italic> is selected as a marker for mode <italic>m</italic> if |<italic>r</italic><sub><italic>jm</italic>′</sub>|&gt;<italic>t</italic><sub>1</sub> for any <italic>m</italic>′ ≠ <italic>m</italic> and |<italic>r</italic><sub><italic>jm</italic></sub>|≤<italic>t</italic><sub>0</sub>. By default, <italic>t</italic><sub>1</sub> is set to 2 and <italic>t</italic><sub>0</sub> is set to 1 which gives reasonable results in practice. When the marker SNPs are selected, GRAPPLE further map the SNPs to ENCODE genes where the marker SNPs locate and search for the traits that these SNPs are strongly associated with in GWA studies by querying HaploReg v4.1 [<xref ref-type="bibr" rid="pgen.1009575.ref088">88</xref>] using the R package <italic>HaploR</italic>. The ratios <inline-formula id="pgen.1009575.e078"><alternatives><graphic id="pgen.1009575.e078g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009575.e078" xlink:type="simple"/><mml:math display="inline" id="M78"><mml:mrow><mml:msub><mml:mover accent="true"><mml:mo>Γ</mml:mo> <mml:mo>^</mml:mo></mml:mover> <mml:mi>j</mml:mi></mml:msub> <mml:mo>/</mml:mo> <mml:msub><mml:mover accent="true"><mml:mi>γ</mml:mi> <mml:mo>^</mml:mo></mml:mover> <mml:mi>j</mml:mi></mml:msub></mml:mrow></mml:math></alternatives></inline-formula> of the marker SNPs are also returned for reference (shown as the vertical bars in <xref ref-type="fig" rid="pgen.1009575.g003">Fig 3b</xref>).</p>
</sec>
<sec id="sec023">
<title>Compute replicability p-values across SNP selection thresholds</title>
<p>Each p-value shown in <xref ref-type="fig" rid="pgen.1009575.g003">Fig 3a</xref> summarizes a vector of p-values across 7 different selection p-value thresholds ranging from 10<sup>−8</sup> ot 10<sup>−2</sup> for each risk factor and disease pair. It reflects how consistent the significance is across SNP selection thresholds. Specifically, it is the partial conjunction p-value [<xref ref-type="bibr" rid="pgen.1009575.ref089">89</xref>] for rejecting the null that <italic>β</italic> is non-zero for at most 2 of the selection thresholds. For a risk factor and disease pair <italic>k</italic>, let the p-values computed by using SNPs selected with the 7 thresholds <italic>p</italic><sub><italic>ks</italic></sub> where <italic>s</italic> = 1, 2, ⋯, 7. Then rank them as <italic>p</italic><sub><italic>k</italic>(1)</sub> ≤ <italic>p</italic><sub><italic>k</italic>(2)</sub> ≤ ⋯ ≤ <italic>p</italic><sub><italic>k</italic>(7)</sub>, the partial conjunction p-value for the pair <italic>k</italic> is computed as 5<italic>p</italic><sub><italic>k</italic>(3)</sub>.</p>
</sec>
</sec>
<sec id="sec024" sec-type="supplementary-material">
<title>Supporting information</title>
<supplementary-material id="pgen.1009575.s001" mimetype="image/tiff" position="float" xlink:href="info:doi/10.1371/journal.pgen.1009575.s001" xlink:type="simple">
<label>S1 Fig</label>
<caption>
<title>Additional evaluation results with real data.</title>
<p><bold>a</bold>, Selection bias in MR methods when SNP selection and <inline-formula id="pgen.1009575.e079"><alternatives><graphic id="pgen.1009575.e079g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009575.e079" xlink:type="simple"/><mml:math display="inline" id="M79"><mml:msub><mml:mover accent="true"><mml:mi>γ</mml:mi> <mml:mo>^</mml:mo></mml:mover> <mml:mi>j</mml:mi></mml:msub></mml:math></alternatives></inline-formula> are obtained from the same GWAS dataset. True <italic>β</italic> ≈ 1 and error bars show 95% confidence intervals. The numbers are the number of clumped SNPs at different threshold. <bold>b</bold>, The estimate of <italic>β</italic> across three independent categories of SNPs with different association strengths for four risk factor and disease pairs using three other bench-marking MR methods. The numbers are the number of SNPs in each category, separated by the values of their selection p-values (dashed vertical lines).</p>
<p>(TIFF)</p>
</caption>
</supplementary-material>
<supplementary-material id="pgen.1009575.s002" mimetype="image/tiff" position="float" xlink:href="info:doi/10.1371/journal.pgen.1009575.s002" xlink:type="simple">
<label>S2 Fig</label>
<caption>
<title>Simulation results.</title>
<p><bold>a</bold>, Boxplots of the estimated <italic>β</italic><sub>1</sub> using different MR methods over 100 repeated random experiments when there are no correlated pleiotropy. We compare across three different <italic>β</italic><sub>1</sub> values (0.2, 0.5 and 1) with SNPs selected by three different selection thresholds: 10<sup>−8</sup> for the top 106 SNPs, 10<sup>−5</sup> for the top 217 SNPs and 0.01 for the top 422 SNPs. <bold>b</bold>, Performance of GRAPPLE in detecting multi-modality. In each setting with pleiotropic pathways, we evaluate three metrics: the detection rate of multi-modality, the precision of the identified marker genes of the pleiotropic pathways and the recall of true marker genes that are identified. Each color represent a different metric and each shape is for a different selection threshold. The title of each plot shows (<italic>β</italic><sub>1</sub>, ⋯, <italic>β</italic><sub><italic>K</italic></sub>) in each setting where <italic>β</italic><sub>1</sub> is the true causal effect, and in each setting, we vary the genetic correlation between each genetic confounding risk factor and the risk factor of interest.</p>
<p>(TIFF)</p>
</caption>
</supplementary-material>
<supplementary-material id="pgen.1009575.s003" mimetype="image/tiff" position="float" xlink:href="info:doi/10.1371/journal.pgen.1009575.s003" xlink:type="simple">
<label>S3 Fig</label>
<caption>
<title>Comparison of different MR methods in settings with pleiotropic pathways when the selection threshold is 10<sup>−8</sup> (top 106 SNPs).</title>
<p><bold>a</bold>, Boxplots of the estimated <italic>β</italic><sub>1</sub> using different MR methods over 100 repeated random experiments. <bold>b</bold> The actual coverage of the 95% confidence intervals of <italic>β</italic><sub>1</sub> provided by different methods. For CAUSE, we report the coverage of the 95% credible intervals of <italic>β</italic><sub>1</sub>. The red dotted line shows the expected 0.95 nominal level. For the three settings in the second row with <italic>β</italic><sub>1</sub> = 0, the CI coverage is the same as 1−type I error.</p>
<p>(TIFF)</p>
</caption>
</supplementary-material>
<supplementary-material id="pgen.1009575.s004" mimetype="image/tiff" position="float" xlink:href="info:doi/10.1371/journal.pgen.1009575.s004" xlink:type="simple">
<label>S4 Fig</label>
<caption>
<title>Same as <xref ref-type="supplementary-material" rid="pgen.1009575.s003">S3 Fig</xref> with the selection threshold being 10<sup>−5</sup> (top 217 SNPs).</title>
<p>(TIFF)</p>
</caption>
</supplementary-material>
<supplementary-material id="pgen.1009575.s005" mimetype="image/tiff" position="float" xlink:href="info:doi/10.1371/journal.pgen.1009575.s005" xlink:type="simple">
<label>S5 Fig</label>
<caption>
<title>Same as <xref ref-type="supplementary-material" rid="pgen.1009575.s003">S3 Fig</xref> with the selection threshold being 10<sup>−2</sup> (top 422 SNPs).</title>
<p>(TIFF)</p>
</caption>
</supplementary-material>
<supplementary-material id="pgen.1009575.s006" mimetype="image/tiff" position="float" xlink:href="info:doi/10.1371/journal.pgen.1009575.s006" xlink:type="simple">
<label>S6 Fig</label>
<caption>
<title>Additional results on identifying pleiotropic pathways on 25 diseases.</title>
<p>Each figure is for results obtained using one of the 7 p-value thresholds. The colors show the number of detected modes. The “+” sign shows a positive estimated effect and “−” sign shows a negative estimated effect.</p>
<p>(TIFF)</p>
</caption>
</supplementary-material>
<supplementary-material id="pgen.1009575.s007" mimetype="application/pdf" position="float" xlink:href="info:doi/10.1371/journal.pgen.1009575.s007" xlink:type="simple">
<label>S1 Text</label>
<caption>
<title>Simulation details.</title>
<p>(PDF)</p>
</caption>
</supplementary-material>
<supplementary-material id="pgen.1009575.s008" mimetype="application/pdf" position="float" xlink:href="info:doi/10.1371/journal.pgen.1009575.s008" xlink:type="simple">
<label>S2 Text</label>
<caption>
<title>Additional mathematical details of the statistical analysis.</title>
<p>(PDF)</p>
</caption>
</supplementary-material>
<supplementary-material id="pgen.1009575.s009" mimetype="application/pdf" position="float" xlink:href="info:doi/10.1371/journal.pgen.1009575.s009" xlink:type="simple">
<label>S3 Text</label>
<caption>
<title>A list of resources for GWAS datasets used in the paper.</title>
<p>(PDF)</p>
</caption>
</supplementary-material>
</sec>
</body>
<back>
<ref-list>
<title>References</title>
<ref id="pgen.1009575.ref001">
<label>1</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Davey Smith</surname> <given-names>G</given-names></name>, <name name-style="western"><surname>Ebrahim</surname> <given-names>S</given-names></name>. <article-title>‘Mendelian randomization’: can genetic epidemiology contribute to understanding environmental determinants of disease?</article-title> <source>International journal of epidemiology</source>. <year>2003</year>;<volume>32</volume>(<issue>1</issue>):<fpage>1</fpage>–<lpage>22</lpage>.</mixed-citation>
</ref>
<ref id="pgen.1009575.ref002">
<label>2</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Davey Smith</surname> <given-names>G</given-names></name>, <name name-style="western"><surname>Holmes</surname> <given-names>MV</given-names></name>, <name name-style="western"><surname>Davies</surname> <given-names>NM</given-names></name>, <name name-style="western"><surname>Ebrahim</surname> <given-names>S</given-names></name>. <article-title>Mendel’s laws, Mendelian randomization and causal inference in observational data: substantive and nomenclatural issues</article-title>. <source>European Journal of Epidemiology</source>. <year>2020</year>; p. <fpage>1</fpage>–<lpage>13</lpage>.</mixed-citation>
</ref>
<ref id="pgen.1009575.ref003">
<label>3</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Davey Smith</surname> <given-names>G</given-names></name>, <name name-style="western"><surname>Hemani</surname> <given-names>G</given-names></name>. <article-title>Mendelian randomization: genetic anchors for causal inference in epidemiological studies</article-title>. <source>Human molecular genetics</source>. <year>2014</year>;<volume>23</volume>(<issue>R1</issue>):<fpage>R89</fpage>–<lpage>R98</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1093/hmg/ddu328" xlink:type="simple">10.1093/hmg/ddu328</ext-link></comment></mixed-citation>
</ref>
<ref id="pgen.1009575.ref004">
<label>4</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Ebrahim</surname> <given-names>S</given-names></name>, <name name-style="western"><surname>Davey Smith</surname> <given-names>G</given-names></name>. <article-title>Mendelian randomization: can genetic epidemiology help redress the failures of observational epidemiology?</article-title> <source>Human genetics</source>. <year>2008</year>;<volume>123</volume>(<issue>1</issue>):<fpage>15</fpage>–<lpage>33</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1007/s00439-007-0448-6" xlink:type="simple">10.1007/s00439-007-0448-6</ext-link></comment></mixed-citation>
</ref>
<ref id="pgen.1009575.ref005">
<label>5</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Burgess</surname> <given-names>S</given-names></name>, <name name-style="western"><surname>Butterworth</surname> <given-names>A</given-names></name>, <name name-style="western"><surname>Thompson</surname> <given-names>SG</given-names></name>. <article-title>Mendelian randomization analysis with multiple genetic variants using summarized data</article-title>. <source>Genetic epidemiology</source>. <year>2013</year>;<volume>37</volume>(<issue>7</issue>):<fpage>658</fpage>–<lpage>665</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1002/gepi.21758" xlink:type="simple">10.1002/gepi.21758</ext-link></comment></mixed-citation>
</ref>
<ref id="pgen.1009575.ref006">
<label>6</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Bowden</surname> <given-names>J</given-names></name>, <name name-style="western"><surname>Davey Smith</surname> <given-names>G</given-names></name>, <name name-style="western"><surname>Burgess</surname> <given-names>S</given-names></name>. <article-title>Mendelian randomization with invalid instruments: effect estimation and bias detection through Egger regression</article-title>. <source>International journal of epidemiology</source>. <year>2015</year>;<volume>44</volume>(<issue>2</issue>):<fpage>512</fpage>–<lpage>525</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1093/ije/dyv080" xlink:type="simple">10.1093/ije/dyv080</ext-link></comment></mixed-citation>
</ref>
<ref id="pgen.1009575.ref007">
<label>7</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Bowden</surname> <given-names>J</given-names></name>, <name name-style="western"><surname>Davey Smith</surname> <given-names>G</given-names></name>, <name name-style="western"><surname>Haycock</surname> <given-names>PC</given-names></name>, <name name-style="western"><surname>Burgess</surname> <given-names>S</given-names></name>. <article-title>Consistent estimation in Mendelian randomization with some invalid instruments using a weighted median estimator</article-title>. <source>Genetic epidemiology</source>. <year>2016</year>;<volume>40</volume>(<issue>4</issue>):<fpage>304</fpage>–<lpage>314</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1002/gepi.21965" xlink:type="simple">10.1002/gepi.21965</ext-link></comment></mixed-citation>
</ref>
<ref id="pgen.1009575.ref008">
<label>8</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Hartwig</surname> <given-names>FP</given-names></name>, <name name-style="western"><surname>Davey Smith</surname> <given-names>G</given-names></name>, <name name-style="western"><surname>Bowden</surname> <given-names>J</given-names></name>. <article-title>Robust inference in summary data Mendelian randomization via the zero modal pleiotropy assumption</article-title>. <source>International journal of epidemiology</source>. <year>2017</year>;<volume>46</volume>(<issue>6</issue>):<fpage>1985</fpage>–<lpage>1998</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1093/ije/dyx102" xlink:type="simple">10.1093/ije/dyx102</ext-link></comment></mixed-citation>
</ref>
<ref id="pgen.1009575.ref009">
<label>9</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Verbanck</surname> <given-names>M</given-names></name>, <name name-style="western"><surname>Chen</surname> <given-names>Cy</given-names></name>, <name name-style="western"><surname>Neale</surname> <given-names>B</given-names></name>, <name name-style="western"><surname>Do</surname> <given-names>R</given-names></name>. <article-title>Detection of widespread horizontal pleiotropy in causal relationships inferred from Mendelian randomization between complex traits and diseases</article-title>. <source>Nature genetics</source>. <year>2018</year>;<volume>50</volume>(<issue>5</issue>):<fpage>693</fpage>–<lpage>698</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1038/s41588-018-0099-7" xlink:type="simple">10.1038/s41588-018-0099-7</ext-link></comment></mixed-citation>
</ref>
<ref id="pgen.1009575.ref010">
<label>10</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Zhao</surname> <given-names>Q</given-names></name>, <name name-style="western"><surname>Wang</surname> <given-names>J</given-names></name>, <name name-style="western"><surname>Hemani</surname> <given-names>G</given-names></name>, <name name-style="western"><surname>Bowden</surname> <given-names>J</given-names></name>, <name name-style="western"><surname>Small</surname> <given-names>DS</given-names></name>. <article-title>Statistical inference in two-sample summary-data Mendelian randomization using robust adjusted profile score</article-title>. <source>Annals of Statistics</source>. <year>2020</year>;<volume>48</volume>(<issue>3</issue>):<fpage>1742</fpage>–<lpage>1769</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1214/19-AOS1866" xlink:type="simple">10.1214/19-AOS1866</ext-link></comment></mixed-citation>
</ref>
<ref id="pgen.1009575.ref011">
<label>11</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Burgess</surname> <given-names>S</given-names></name>, <name name-style="western"><surname>Zuber</surname> <given-names>V</given-names></name>, <name name-style="western"><surname>Gkatzionis</surname> <given-names>A</given-names></name>, <name name-style="western"><surname>Foley</surname> <given-names>CN</given-names></name>. <article-title>Modal-based estimation via heterogeneity-penalized weighting: model averaging for consistent and efficient estimation in Mendelian randomization when a plurality of candidate instruments are valid</article-title>, <source>International journal of epidemiology</source>. <year>2018</year>;<volume>47</volume>(<issue>4</issue>):<fpage>1242</fpage>–<lpage>1254</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1093/ije/dyy080" xlink:type="simple">10.1093/ije/dyy080</ext-link></comment></mixed-citation>
</ref>
<ref id="pgen.1009575.ref012">
<label>12</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Qi</surname> <given-names>G</given-names></name>, <name name-style="western"><surname>Chatterjee</surname> <given-names>N</given-names></name>. <article-title>Mendelian randomization analysis using mixture models for robust and efficient estimation of causal effects</article-title>. <source>Nature Communications</source>. <year>2019</year>;<volume>10</volume>(<issue>1</issue>):<fpage>1</fpage>–<lpage>10</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1038/s41467-019-09432-2" xlink:type="simple">10.1038/s41467-019-09432-2</ext-link></comment></mixed-citation>
</ref>
<ref id="pgen.1009575.ref013">
<label>13</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Burgess</surname> <given-names>S</given-names></name>, <name name-style="western"><surname>Foley</surname> <given-names>CN</given-names></name>, <name name-style="western"><surname>Allara</surname> <given-names>E</given-names></name>, <name name-style="western"><surname>Staley</surname> <given-names>JR</given-names></name>, <name name-style="western"><surname>Howson</surname> <given-names>JM</given-names></name>. <article-title>A robust and efficient method for Mendelian randomization with hundreds of genetic variants</article-title>. <source>Nature Communications</source>. <year>2020</year>;<volume>11</volume>(<issue>1</issue>):<fpage>1</fpage>–<lpage>11</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1038/s41467-019-14156-4" xlink:type="simple">10.1038/s41467-019-14156-4</ext-link></comment></mixed-citation>
</ref>
<ref id="pgen.1009575.ref014">
<label>14</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Berzuini</surname> <given-names>C</given-names></name>, <name name-style="western"><surname>Guo</surname> <given-names>H</given-names></name>, <name name-style="western"><surname>Burgess</surname> <given-names>S</given-names></name>, <name name-style="western"><surname>Bernardinelli</surname> <given-names>L</given-names></name>. <article-title>A Bayesian approach to Mendelian randomization with multiple pleiotropic variants</article-title>. <source>Biostatistics</source>. <year>2020</year>;<volume>21</volume>(<issue>1</issue>):<fpage>86</fpage>–<lpage>101</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1093/biostatistics/kxy027" xlink:type="simple">10.1093/biostatistics/kxy027</ext-link></comment></mixed-citation>
</ref>
<ref id="pgen.1009575.ref015">
<label>15</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Morrison</surname> <given-names>J</given-names></name>, <name name-style="western"><surname>Knoblauch</surname> <given-names>N</given-names></name>, <name name-style="western"><surname>Marcus</surname> <given-names>JH</given-names></name>, <name name-style="western"><surname>Stephens</surname> <given-names>M</given-names></name>, <name name-style="western"><surname>He</surname> <given-names>X</given-names></name>. <article-title>Mendelian randomization accounting for correlated and uncorrelated pleiotropic effects using genome-wide summary statistics</article-title>. <source>Nature Genetics</source>. <year>2020</year>; p. <fpage>1</fpage>–<lpage>7</lpage>.</mixed-citation>
</ref>
<ref id="pgen.1009575.ref016">
<label>16</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Sanderson</surname> <given-names>E</given-names></name>, <name name-style="western"><surname>Spiller</surname> <given-names>W</given-names></name>, <name name-style="western"><surname>Bowden</surname> <given-names>J</given-names></name>. <article-title>Testing and Correcting for Weak and Pleiotropic Instruments in Two-Sample Multivariable Mendelian Randomisation</article-title>. <source>bioRxiv</source>. <year>2020</year>;.</mixed-citation>
</ref>
<ref id="pgen.1009575.ref017">
<label>17</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Consortium</surname> <given-names>IS</given-names></name>. <article-title>Common polygenic variation contributes to risk of schizophrenia that overlaps with bipolar disorder</article-title>. <source>Nature</source>. <year>2009</year>;<volume>460</volume>(<issue>7256</issue>):<fpage>748</fpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1038/nature08185" xlink:type="simple">10.1038/nature08185</ext-link></comment></mixed-citation>
</ref>
<ref id="pgen.1009575.ref018">
<label>18</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Yang</surname> <given-names>J</given-names></name>, <name name-style="western"><surname>Benyamin</surname> <given-names>B</given-names></name>, <name name-style="western"><surname>McEvoy</surname> <given-names>BP</given-names></name>, <name name-style="western"><surname>Gordon</surname> <given-names>S</given-names></name>, <name name-style="western"><surname>Henders</surname> <given-names>AK</given-names></name>, <name name-style="western"><surname>Nyholt</surname> <given-names>DR</given-names></name>, <etal>et al</etal>. <article-title>Common SNPs explain a large proportion of the heritability for human height</article-title>. <source>Nature Genetics</source>. <year>2010</year>;<volume>42</volume>(<issue>7</issue>):<fpage>565</fpage>–<lpage>569</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1038/ng.608" xlink:type="simple">10.1038/ng.608</ext-link></comment> <object-id pub-id-type="pmid">20562875</object-id></mixed-citation>
</ref>
<ref id="pgen.1009575.ref019">
<label>19</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Bulik-Sullivan</surname> <given-names>BK</given-names></name>, <name name-style="western"><surname>Loh</surname> <given-names>PR</given-names></name>, <name name-style="western"><surname>Finucane</surname> <given-names>HK</given-names></name>, <name name-style="western"><surname>Ripke</surname> <given-names>S</given-names></name>, <name name-style="western"><surname>Yang</surname> <given-names>J</given-names></name>, <name name-style="western"><surname>Patterson</surname> <given-names>N</given-names></name>, <etal>et al</etal>. <article-title>LD Score regression distinguishes confounding from polygenicity in genome-wide association studies</article-title>. <source>Nature genetics</source>. <year>2015</year>;<volume>47</volume>(<issue>3</issue>):<fpage>291</fpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1038/ng.3211" xlink:type="simple">10.1038/ng.3211</ext-link></comment> <object-id pub-id-type="pmid">25642630</object-id></mixed-citation>
</ref>
<ref id="pgen.1009575.ref020">
<label>20</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Loh</surname> <given-names>PR</given-names></name>, <name name-style="western"><surname>Bhatia</surname> <given-names>G</given-names></name>, <name name-style="western"><surname>Gusev</surname> <given-names>A</given-names></name>, <name name-style="western"><surname>Finucane</surname> <given-names>HK</given-names></name>, <name name-style="western"><surname>Bulik-Sullivan</surname> <given-names>BK</given-names></name>, <name name-style="western"><surname>Pollack</surname> <given-names>SJ</given-names></name>, <etal>et al</etal>. <article-title>Contrasting genetic architectures of schizophrenia and other complex diseases using fast variance-components analysis</article-title>. <source>Nature Genetics</source>. <year>2015</year>;<volume>47</volume>(<issue>12</issue>):<fpage>1385</fpage>–<lpage>1392</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1038/ng.3431" xlink:type="simple">10.1038/ng.3431</ext-link></comment> <object-id pub-id-type="pmid">26523775</object-id></mixed-citation>
</ref>
<ref id="pgen.1009575.ref021">
<label>21</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Shi</surname> <given-names>H</given-names></name>, <name name-style="western"><surname>Kichaev</surname> <given-names>G</given-names></name>, <name name-style="western"><surname>Pasaniuc</surname> <given-names>B</given-names></name>. <article-title>Contrasting the genetic architecture of 30 complex traits from summary association data</article-title>. <source>The American Journal of Human Genetics</source>. <year>2016</year>;<volume>99</volume>(<issue>1</issue>):<fpage>139</fpage>–<lpage>153</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1016/j.ajhg.2016.05.013" xlink:type="simple">10.1016/j.ajhg.2016.05.013</ext-link></comment></mixed-citation>
</ref>
<ref id="pgen.1009575.ref022">
<label>22</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Timpson</surname> <given-names>NJ</given-names></name>, <name name-style="western"><surname>Greenwood</surname> <given-names>CM</given-names></name>, <name name-style="western"><surname>Soranzo</surname> <given-names>N</given-names></name>, <name name-style="western"><surname>Lawson</surname> <given-names>DJ</given-names></name>, <name name-style="western"><surname>Richards</surname> <given-names>JB</given-names></name>. <article-title>Genetic architecture: the shape of the genetic contribution to human traits and disease</article-title>. <source>Nature Reviews Genetics</source>. <year>2018</year>;<volume>19</volume>(<issue>2</issue>):<fpage>110</fpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1038/nrg.2017.101" xlink:type="simple">10.1038/nrg.2017.101</ext-link></comment></mixed-citation>
</ref>
<ref id="pgen.1009575.ref023">
<label>23</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>O’Connor</surname> <given-names>LJ</given-names></name>, <name name-style="western"><surname>Schoech</surname> <given-names>AP</given-names></name>, <name name-style="western"><surname>Hormozdiari</surname> <given-names>F</given-names></name>, <name name-style="western"><surname>Gazal</surname> <given-names>S</given-names></name>, <name name-style="western"><surname>Patterson</surname> <given-names>N</given-names></name>, <name name-style="western"><surname>Price</surname> <given-names>AL</given-names></name>. <article-title>Extreme polygenicity of complex traits is explained by negative selection</article-title>. <source>The American Journal of Human Genetics</source>. <year>2019</year>;<volume>105</volume>(<issue>3</issue>):<fpage>456</fpage>–<lpage>476</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1016/j.ajhg.2019.07.003" xlink:type="simple">10.1016/j.ajhg.2019.07.003</ext-link></comment></mixed-citation>
</ref>
<ref id="pgen.1009575.ref024">
<label>24</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Wray</surname> <given-names>NR</given-names></name>, <name name-style="western"><surname>Wijmenga</surname> <given-names>C</given-names></name>, <name name-style="western"><surname>Sullivan</surname> <given-names>PF</given-names></name>, <name name-style="western"><surname>Yang</surname> <given-names>J</given-names></name>, <name name-style="western"><surname>Visscher</surname> <given-names>PM</given-names></name>. <article-title>Common disease is more complex than implied by the core gene omnigenic model</article-title>. <source>Cell</source>. <year>2018</year>;<volume>173</volume>(<issue>7</issue>):<fpage>1573</fpage>–<lpage>1580</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1016/j.cell.2018.05.051" xlink:type="simple">10.1016/j.cell.2018.05.051</ext-link></comment></mixed-citation>
</ref>
<ref id="pgen.1009575.ref025">
<label>25</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Boyle</surname> <given-names>EA</given-names></name>, <name name-style="western"><surname>Li</surname> <given-names>YI</given-names></name>, <name name-style="western"><surname>Pritchard</surname> <given-names>JK</given-names></name>. <article-title>An expanded view of complex traits: from polygenic to omnigenic</article-title>. <source>Cell</source>. <year>2017</year>;<volume>169</volume>(<issue>7</issue>):<fpage>1177</fpage>–<lpage>1186</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1016/j.cell.2017.05.038" xlink:type="simple">10.1016/j.cell.2017.05.038</ext-link></comment></mixed-citation>
</ref>
<ref id="pgen.1009575.ref026">
<label>26</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>O’Connor</surname> <given-names>LJ</given-names></name>, <name name-style="western"><surname>Price</surname> <given-names>AL</given-names></name>. <article-title>Distinguishing genetic correlation from causation across 52 diseases and complex traits</article-title>. <source>Nature genetics</source>. <year>2018</year>;<volume>50</volume>(<issue>12</issue>):<fpage>1728</fpage>–<lpage>1734</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1038/s41588-018-0255-0" xlink:type="simple">10.1038/s41588-018-0255-0</ext-link></comment></mixed-citation>
</ref>
<ref id="pgen.1009575.ref027">
<label>27</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Krauss</surname> <given-names>RM</given-names></name>. <article-title>Lipids and lipoproteins in patients with type 2 diabetes</article-title>. <source>Diabetes care</source>. <year>2004</year>;<volume>27</volume>(<issue>6</issue>):<fpage>1496</fpage>–<lpage>1504</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.2337/diacare.27.6.1496" xlink:type="simple">10.2337/diacare.27.6.1496</ext-link></comment></mixed-citation>
</ref>
<ref id="pgen.1009575.ref028">
<label>28</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Lotta</surname> <given-names>LA</given-names></name>, <name name-style="western"><surname>Sharp</surname> <given-names>SJ</given-names></name>, <name name-style="western"><surname>Burgess</surname> <given-names>S</given-names></name>, <name name-style="western"><surname>Perry</surname> <given-names>JR</given-names></name>, <name name-style="western"><surname>Stewart</surname> <given-names>ID</given-names></name>, <name name-style="western"><surname>Willems</surname> <given-names>SM</given-names></name>, <etal>et al</etal>. <article-title>Association between low-density lipoprotein cholesterol–lowering genetic variants and risk of type 2 diabetes: a meta-analysis</article-title>. <source>Jama</source>. <year>2016</year>;<volume>316</volume>(<issue>13</issue>):<fpage>1383</fpage>–<lpage>1391</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1001/jama.2016.14568" xlink:type="simple">10.1001/jama.2016.14568</ext-link></comment> <object-id pub-id-type="pmid">27701660</object-id></mixed-citation>
</ref>
<ref id="pgen.1009575.ref029">
<label>29</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Timpson</surname> <given-names>NJ</given-names></name>, <name name-style="western"><surname>Nordestgaard</surname> <given-names>BG</given-names></name>, <name name-style="western"><surname>Harbord</surname> <given-names>RM</given-names></name>, <name name-style="western"><surname>Zacho</surname> <given-names>J</given-names></name>, <name name-style="western"><surname>Frayling</surname> <given-names>TM</given-names></name>, <name name-style="western"><surname>Tybjærg-Hansen</surname> <given-names>A</given-names></name>, <etal>et al</etal>. <article-title>C-reactive protein levels and body mass index: elucidating direction of causation through reciprocal Mendelian randomization</article-title>. <source>International journal of obesity</source>. <year>2011</year>;<volume>35</volume>(<issue>2</issue>):<fpage>300</fpage>–<lpage>308</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1038/ijo.2010.137" xlink:type="simple">10.1038/ijo.2010.137</ext-link></comment> <object-id pub-id-type="pmid">20714329</object-id></mixed-citation>
</ref>
<ref id="pgen.1009575.ref030">
<label>30</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Hemani</surname> <given-names>G</given-names></name>, <name name-style="western"><surname>Tilling</surname> <given-names>K</given-names></name>, <name name-style="western"><surname>Davey Smith</surname> <given-names>G</given-names></name>. <article-title>Orienting the causal relationship between imprecisely measured traits using GWAS summary data</article-title>. <source>PLoS genetics</source>. <year>2017</year>;<volume>13</volume>(<issue>11</issue>):<fpage>e1007081</fpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1371/journal.pgen.1007081" xlink:type="simple">10.1371/journal.pgen.1007081</ext-link></comment></mixed-citation>
</ref>
<ref id="pgen.1009575.ref031">
<label>31</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Burgess</surname> <given-names>S</given-names></name>, <name name-style="western"><surname>Thompson</surname> <given-names>SG</given-names></name>, <name name-style="western"><surname>Collaboration</surname> <given-names>CCG</given-names></name>. <article-title>Avoiding bias from weak instruments in Mendelian randomization studies</article-title>. <source>International journal of epidemiology</source>. <year>2011</year>;<volume>40</volume>(<issue>3</issue>):<fpage>755</fpage>–<lpage>764</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1093/ije/dyr036" xlink:type="simple">10.1093/ije/dyr036</ext-link></comment></mixed-citation>
</ref>
<ref id="pgen.1009575.ref032">
<label>32</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Purcell</surname> <given-names>S</given-names></name>, <name name-style="western"><surname>Neale</surname> <given-names>B</given-names></name>, <name name-style="western"><surname>Todd-Brown</surname> <given-names>K</given-names></name>, <name name-style="western"><surname>Thomas</surname> <given-names>L</given-names></name>, <name name-style="western"><surname>Ferreira</surname> <given-names>MA</given-names></name>, <name name-style="western"><surname>Bender</surname> <given-names>D</given-names></name>, <etal>et al</etal>. <article-title>PLINK: a tool set for whole-genome association and population-based linkage analyses</article-title>. <source>The American journal of human genetics</source>. <year>2007</year>;<volume>81</volume>(<issue>3</issue>):<fpage>559</fpage>–<lpage>575</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1086/519795" xlink:type="simple">10.1086/519795</ext-link></comment> <object-id pub-id-type="pmid">17701901</object-id></mixed-citation>
</ref>
<ref id="pgen.1009575.ref033">
<label>33</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Justice</surname> <given-names>AE</given-names></name>, <name name-style="western"><surname>Winkler</surname> <given-names>TW</given-names></name>, <name name-style="western"><surname>Feitosa</surname> <given-names>MF</given-names></name>, <name name-style="western"><surname>Graff</surname> <given-names>M</given-names></name>, <name name-style="western"><surname>Fisher</surname> <given-names>VA</given-names></name>, <name name-style="western"><surname>Young</surname> <given-names>K</given-names></name>, <etal>et al</etal>. <article-title>Genome-wide meta-analysis of 241,258 adults accounting for smoking behaviour identifies novel loci for obesity traits</article-title>. <source>Nature communications</source>. <year>2017</year>;<volume>8</volume>:<fpage>14977</fpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1038/ncomms14977" xlink:type="simple">10.1038/ncomms14977</ext-link></comment> <object-id pub-id-type="pmid">28443625</object-id></mixed-citation>
</ref>
<ref id="pgen.1009575.ref034">
<label>34</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Randall</surname> <given-names>JC</given-names></name>, <name name-style="western"><surname>Winkler</surname> <given-names>TW</given-names></name>, <name name-style="western"><surname>Kutalik</surname> <given-names>Z</given-names></name>, <name name-style="western"><surname>Berndt</surname> <given-names>SI</given-names></name>, <name name-style="western"><surname>Jackson</surname> <given-names>AU</given-names></name>, <name name-style="western"><surname>Monda</surname> <given-names>KL</given-names></name>, <etal>et al</etal>. <article-title>Sex-stratified genome-wide association studies including 270,000 individuals show sexual dimorphism in genetic loci for anthropometric traits</article-title>. <source>PLoS Genet</source>. <year>2013</year>;<volume>9</volume>(<issue>6</issue>):<fpage>e1003500</fpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1371/journal.pgen.1003500" xlink:type="simple">10.1371/journal.pgen.1003500</ext-link></comment> <object-id pub-id-type="pmid">23754948</object-id></mixed-citation>
</ref>
<ref id="pgen.1009575.ref035">
<label>35</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Morris</surname> <given-names>AP</given-names></name>, <name name-style="western"><surname>Voight</surname> <given-names>BF</given-names></name>, <name name-style="western"><surname>Teslovich</surname> <given-names>TM</given-names></name>, <name name-style="western"><surname>Ferreira</surname> <given-names>T</given-names></name>, <name name-style="western"><surname>Segre</surname> <given-names>AV</given-names></name>, <name name-style="western"><surname>Steinthorsdottir</surname> <given-names>V</given-names></name>, <etal>et al</etal>. <article-title>Large-scale association analysis provides insights into the genetic architecture and pathophysiology of type 2 diabetes</article-title>. <source>Nature genetics</source>. <year>2012</year>;<volume>44</volume>(<issue>9</issue>):<fpage>981</fpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1038/ng.2383" xlink:type="simple">10.1038/ng.2383</ext-link></comment> <object-id pub-id-type="pmid">22885922</object-id></mixed-citation>
</ref>
<ref id="pgen.1009575.ref036">
<label>36</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Sanderson</surname> <given-names>E</given-names></name>, <name name-style="western"><surname>Davey Smith</surname> <given-names>G</given-names></name>, <name name-style="western"><surname>Windmeijer</surname> <given-names>F</given-names></name>, <name name-style="western"><surname>Bowden</surname> <given-names>J</given-names></name>. <article-title>An examination of multivariable Mendelian randomization in the single-sample and two-sample summary data settings</article-title> <source>International journal of epidemiology</source>. <year>2019</year>;<volume>48</volume>(<issue>3</issue>):<fpage>713</fpage>–<lpage>727</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1093/ije/dyy262" xlink:type="simple">10.1093/ije/dyy262</ext-link></comment></mixed-citation>
</ref>
<ref id="pgen.1009575.ref037">
<label>37</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Wood</surname> <given-names>AR</given-names></name>, <name name-style="western"><surname>Esko</surname> <given-names>T</given-names></name>, <name name-style="western"><surname>Yang</surname> <given-names>J</given-names></name>, <name name-style="western"><surname>Vedantam</surname> <given-names>S</given-names></name>, <name name-style="western"><surname>Pers</surname> <given-names>TH</given-names></name>, <name name-style="western"><surname>Gustafsson</surname> <given-names>S</given-names></name>, <etal>et al</etal>. <article-title>Defining the role of common variation in the genomic and biological architecture of adult human height</article-title>. <source>Nature genetics</source>. <year>2014</year>;<volume>46</volume>(<issue>11</issue>):<fpage>1173</fpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1038/ng.3097" xlink:type="simple">10.1038/ng.3097</ext-link></comment> <object-id pub-id-type="pmid">25282103</object-id></mixed-citation>
</ref>
<ref id="pgen.1009575.ref038">
<label>38</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Willer</surname> <given-names>CJ</given-names></name>, <name name-style="western"><surname>Schmidt</surname> <given-names>EM</given-names></name>, <name name-style="western"><surname>Sengupta</surname> <given-names>S</given-names></name>, <name name-style="western"><surname>Peloso</surname> <given-names>GM</given-names></name>, <name name-style="western"><surname>Gustafsson</surname> <given-names>S</given-names></name>, <name name-style="western"><surname>Kanoni</surname> <given-names>S</given-names></name>, <etal>et al</etal>. <article-title>Discovery and refinement of loci associated with lipid levels</article-title>. <source>Nature genetics</source>. <year>2013</year>;<volume>45</volume>(<issue>11</issue>):<fpage>1274</fpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1038/ng.2797" xlink:type="simple">10.1038/ng.2797</ext-link></comment> <object-id pub-id-type="pmid">24097068</object-id></mixed-citation>
</ref>
<ref id="pgen.1009575.ref039">
<label>39</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Hoffmann</surname> <given-names>TJ</given-names></name>, <name name-style="western"><surname>Ehret</surname> <given-names>GB</given-names></name>, <name name-style="western"><surname>Nandakumar</surname> <given-names>P</given-names></name>, <name name-style="western"><surname>Ranatunga</surname> <given-names>D</given-names></name>, <name name-style="western"><surname>Schaefer</surname> <given-names>C</given-names></name>, <name name-style="western"><surname>Kwok</surname> <given-names>PY</given-names></name>, <etal>et al</etal>. <article-title>Genome-wide association analyses using electronic health records identify new loci influencing blood pressure variation</article-title>. <source>Nature genetics</source>. <year>2017</year>;<volume>49</volume>(<issue>1</issue>):<fpage>54</fpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1038/ng.3715" xlink:type="simple">10.1038/ng.3715</ext-link></comment> <object-id pub-id-type="pmid">27841878</object-id></mixed-citation>
</ref>
<ref id="pgen.1009575.ref040">
<label>40</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Nelson</surname> <given-names>CP</given-names></name>, <name name-style="western"><surname>Goel</surname> <given-names>A</given-names></name>, <name name-style="western"><surname>Butterworth</surname> <given-names>AS</given-names></name>, <name name-style="western"><surname>Kanoni</surname> <given-names>S</given-names></name>, <name name-style="western"><surname>Webb</surname> <given-names>TR</given-names></name>, <name name-style="western"><surname>Marouli</surname> <given-names>E</given-names></name>, <etal>et al</etal>. <article-title>Association analyses based on false discovery rate implicate new loci for coronary artery disease</article-title>. <source>Nature genetics</source>. <year>2017</year>;<volume>49</volume>(<issue>9</issue>):<fpage>1385</fpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1038/ng.3913" xlink:type="simple">10.1038/ng.3913</ext-link></comment> <object-id pub-id-type="pmid">28714975</object-id></mixed-citation>
</ref>
<ref id="pgen.1009575.ref041">
<label>41</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Malik</surname> <given-names>R</given-names></name>, <name name-style="western"><surname>Chauhan</surname> <given-names>G</given-names></name>, <name name-style="western"><surname>Traylor</surname> <given-names>M</given-names></name>, <name name-style="western"><surname>Sargurupremraj</surname> <given-names>M</given-names></name>, <name name-style="western"><surname>Okada</surname> <given-names>Y</given-names></name>, <name name-style="western"><surname>Mishra</surname> <given-names>A</given-names></name>, <etal>et al</etal>. <article-title>Multiancestry genome-wide association study of 520,000 subjects identifies 32 loci associated with stroke and stroke subtypes</article-title>. <source>Nature genetics</source>. <year>2018</year>;<volume>50</volume>(<issue>4</issue>):<fpage>524</fpage>–<lpage>537</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1038/s41588-018-0058-3" xlink:type="simple">10.1038/s41588-018-0058-3</ext-link></comment> <object-id pub-id-type="pmid">29531354</object-id></mixed-citation>
</ref>
<ref id="pgen.1009575.ref042">
<label>42</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Linnér</surname> <given-names>RK</given-names></name>, <name name-style="western"><surname>Biroli</surname> <given-names>P</given-names></name>, <name name-style="western"><surname>Kong</surname> <given-names>E</given-names></name>, <name name-style="western"><surname>Meddens</surname> <given-names>SFW</given-names></name>, <name name-style="western"><surname>Wedow</surname> <given-names>R</given-names></name>, <name name-style="western"><surname>Fontana</surname> <given-names>MA</given-names></name>, <etal>et al</etal>. <article-title>Genome-wide association analyses of risk tolerance and risky behaviors in over 1 million individuals identify hundreds of loci and shared genetic influences</article-title>. <source>Nature genetics</source>. <year>2019</year>;<volume>51</volume>(<issue>2</issue>):<fpage>245</fpage>–<lpage>257</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1038/s41588-018-0309-3" xlink:type="simple">10.1038/s41588-018-0309-3</ext-link></comment></mixed-citation>
</ref>
<ref id="pgen.1009575.ref043">
<label>43</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Coronary Artery Disease (C4D) Genetics</surname> <given-names>Consortium</given-names></name>. <article-title>A genome-wide association study in Europeans and South Asians identifies five new loci for coronary artery disease</article-title>. <source>Nature genetics</source>. <year>2011</year>;<volume>43</volume>(<issue>4</issue>):<fpage>339</fpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1038/ng.782" xlink:type="simple">10.1038/ng.782</ext-link></comment></mixed-citation>
</ref>
<ref id="pgen.1009575.ref044">
<label>44</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Schunkert</surname> <given-names>H</given-names></name>, <name name-style="western"><surname>König</surname> <given-names>IR</given-names></name>, <name name-style="western"><surname>Kathiresan</surname> <given-names>S</given-names></name>, <name name-style="western"><surname>Reilly</surname> <given-names>MP</given-names></name>, <name name-style="western"><surname>Assimes</surname> <given-names>TL</given-names></name>, <name name-style="western"><surname>Holm</surname> <given-names>H</given-names></name>, <etal>et al</etal>. <article-title>Large-scale association analysis identifies 13 new susceptibility loci for coronary artery disease</article-title>. <source>Nature genetics</source>. <year>2011</year>;<volume>43</volume>(<issue>4</issue>):<fpage>333</fpage>–<lpage>338</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1038/ng.784" xlink:type="simple">10.1038/ng.784</ext-link></comment> <object-id pub-id-type="pmid">21378990</object-id></mixed-citation>
</ref>
<ref id="pgen.1009575.ref045">
<label>45</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Elliott</surname> <given-names>P</given-names></name>, <name name-style="western"><surname>Chambers</surname> <given-names>JC</given-names></name>, <name name-style="western"><surname>Zhang</surname> <given-names>W</given-names></name>, <name name-style="western"><surname>Clarke</surname> <given-names>R</given-names></name>, <name name-style="western"><surname>Hopewell</surname> <given-names>JC</given-names></name>, <name name-style="western"><surname>Peden</surname> <given-names>JF</given-names></name>, <etal>et al</etal>. <article-title>Genetic loci associated with C-reactive protein levels and risk of coronary heart disease</article-title>. <source>Jama</source>. <year>2009</year>;<volume>302</volume>(<issue>1</issue>):<fpage>37</fpage>–<lpage>48</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1001/jama.2009.954" xlink:type="simple">10.1001/jama.2009.954</ext-link></comment> <object-id pub-id-type="pmid">19567438</object-id></mixed-citation>
</ref>
<ref id="pgen.1009575.ref046">
<label>46</label>
<mixed-citation publication-type="journal" xlink:type="simple"><collab>C Reactive Protein Coronary Heart Disease Genetics Collaboration</collab>. <article-title>Association between C reactive protein and coronary heart disease: Mendelian randomization analysis based on individual participant data</article-title>. <source>Bmj</source>. <year>2011</year>;<volume>342</volume>:<fpage>d548</fpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1136/bmj.d548" xlink:type="simple">10.1136/bmj.d548</ext-link></comment></mixed-citation>
</ref>
<ref id="pgen.1009575.ref047">
<label>47</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Holmes</surname> <given-names>MV</given-names></name>, <name name-style="western"><surname>Ala-Korpela</surname> <given-names>M</given-names></name>, <name name-style="western"><surname>Davey Smith</surname> <given-names>G</given-names></name>. <article-title>Mendelian randomization in cardiometabolic disease: challenges in evaluating causality</article-title>. <source>Nature Reviews Cardiology</source>. <year>2017</year>;<volume>14</volume>(<issue>10</issue>):<fpage>577</fpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1038/nrcardio.2017.78" xlink:type="simple">10.1038/nrcardio.2017.78</ext-link></comment></mixed-citation>
</ref>
<ref id="pgen.1009575.ref048">
<label>48</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Prins</surname> <given-names>BP</given-names></name>, <name name-style="western"><surname>Kuchenbaecker</surname> <given-names>KB</given-names></name>, <name name-style="western"><surname>Bao</surname> <given-names>Y</given-names></name>, <name name-style="western"><surname>Smart</surname> <given-names>M</given-names></name>, <name name-style="western"><surname>Zabaneh</surname> <given-names>D</given-names></name>, <name name-style="western"><surname>Fatemifar</surname> <given-names>G</given-names></name>, <etal>et al</etal>. <article-title>Genome-wide analysis of health-related biomarkers in the UK Household Longitudinal Study reveals novel associations</article-title>. <source>Scientific reports</source>. <year>2017</year>;<volume>7</volume>(<issue>1</issue>):<fpage>1</fpage>–<lpage>9</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1038/s41598-017-10812-1" xlink:type="simple">10.1038/s41598-017-10812-1</ext-link></comment> <object-id pub-id-type="pmid">28887542</object-id></mixed-citation>
</ref>
<ref id="pgen.1009575.ref049">
<label>49</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Dehghan</surname> <given-names>A</given-names></name>, <name name-style="western"><surname>Dupuis</surname> <given-names>J</given-names></name>, <name name-style="western"><surname>Barbalic</surname> <given-names>M</given-names></name>, <name name-style="western"><surname>Bis</surname> <given-names>JC</given-names></name>, <name name-style="western"><surname>Eiriksdottir</surname> <given-names>G</given-names></name>, <name name-style="western"><surname>Lu</surname> <given-names>C</given-names></name>, <etal>et al</etal>. <article-title>Meta-Analysis of Genome-Wide Association Studies in &gt;80 000 Subjects Identifies Multiple Loci for C-Reactive Protein LevelsClinical Perspective</article-title>. <source>Circulation</source>. <year>2011</year>;<volume>123</volume>(<issue>7</issue>):<fpage>731</fpage>–<lpage>738</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1161/CIRCULATIONAHA.110.948570" xlink:type="simple">10.1161/CIRCULATIONAHA.110.948570</ext-link></comment> <object-id pub-id-type="pmid">21300955</object-id></mixed-citation>
</ref>
<ref id="pgen.1009575.ref050">
<label>50</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Spencer</surname> <given-names>S</given-names></name>, <name name-style="western"><surname>Köstel Bal</surname> <given-names>S</given-names></name>, <name name-style="western"><surname>Egner</surname> <given-names>W</given-names></name>, <name name-style="western"><surname>Lango Allen</surname> <given-names>H</given-names></name>, <name name-style="western"><surname>Raza</surname> <given-names>SI</given-names></name>, <name name-style="western"><surname>Ma</surname> <given-names>CA</given-names></name>, <etal>et al</etal>. <article-title>Loss of the interleukin-6 receptor causes immunodeficiency, atopy, and abnormal inflammatory responses</article-title>. <source>Journal of Experimental Medicine</source>. <year>2019</year>;<volume>216</volume>(<issue>9</issue>):<fpage>1986</fpage>–<lpage>1998</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1084/jem.20190344" xlink:type="simple">10.1084/jem.20190344</ext-link></comment> <object-id pub-id-type="pmid">31235509</object-id></mixed-citation>
</ref>
<ref id="pgen.1009575.ref051">
<label>51</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Teng</surname> <given-names>JP</given-names></name>, <name name-style="western"><surname>Yang</surname> <given-names>ZY</given-names></name>, <name name-style="western"><surname>Zhu</surname> <given-names>YM</given-names></name>, <name name-style="western"><surname>Ni</surname> <given-names>D</given-names></name>, <name name-style="western"><surname>Zhu</surname> <given-names>ZJ</given-names></name>, <name name-style="western"><surname>Li</surname> <given-names>XQ</given-names></name>. <article-title>The roles of ARHGAP10 in the proliferation, migration and invasion of lung cancer cells</article-title>. <source>Oncology letters</source>. <year>2017</year>;<volume>14</volume>(<issue>4</issue>):<fpage>4613</fpage>–<lpage>4618</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.3892/ol.2017.6729" xlink:type="simple">10.3892/ol.2017.6729</ext-link></comment></mixed-citation>
</ref>
<ref id="pgen.1009575.ref052">
<label>52</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Akiyama</surname> <given-names>M</given-names></name>, <name name-style="western"><surname>Okada</surname> <given-names>Y</given-names></name>, <name name-style="western"><surname>Kanai</surname> <given-names>M</given-names></name>, <name name-style="western"><surname>Takahashi</surname> <given-names>A</given-names></name>, <name name-style="western"><surname>Momozawa</surname> <given-names>Y</given-names></name>, <name name-style="western"><surname>Ikeda</surname> <given-names>M</given-names></name>, <etal>et al</etal>. <article-title>Genome-wide association study identifies 112 new loci for body mass index in the Japanese population</article-title>. <source>Nature genetics</source>. <year>2017</year>;<volume>49</volume>(<issue>10</issue>):<fpage>1458</fpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1038/ng.3951" xlink:type="simple">10.1038/ng.3951</ext-link></comment> <object-id pub-id-type="pmid">28892062</object-id></mixed-citation>
</ref>
<ref id="pgen.1009575.ref053">
<label>53</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Hoffmann</surname> <given-names>TJ</given-names></name>, <name name-style="western"><surname>Theusch</surname> <given-names>E</given-names></name>, <name name-style="western"><surname>Haldar</surname> <given-names>T</given-names></name>, <name name-style="western"><surname>Ranatunga</surname> <given-names>DK</given-names></name>, <name name-style="western"><surname>Jorgenson</surname> <given-names>E</given-names></name>, <name name-style="western"><surname>Medina</surname> <given-names>MW</given-names></name>, <etal>et al</etal>. <article-title>A large electronic-health-record-based genome-wide study of serum lipids</article-title>. <source>Nature genetics</source>. <year>2018</year>;<volume>50</volume>(<issue>3</issue>):<fpage>401</fpage>–<lpage>413</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1038/s41588-018-0064-5" xlink:type="simple">10.1038/s41588-018-0064-5</ext-link></comment> <object-id pub-id-type="pmid">29507422</object-id></mixed-citation>
</ref>
<ref id="pgen.1009575.ref054">
<label>54</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Wuttke</surname> <given-names>M</given-names></name>, <name name-style="western"><surname>Li</surname> <given-names>Y</given-names></name>, <name name-style="western"><surname>Li</surname> <given-names>M</given-names></name>, <name name-style="western"><surname>Sieber</surname> <given-names>KB</given-names></name>, <name name-style="western"><surname>Feitosa</surname> <given-names>MF</given-names></name>, <name name-style="western"><surname>Gorski</surname> <given-names>M</given-names></name>, <etal>et al</etal>. <article-title>A catalog of genetic loci associated with kidney function from analyses of a million individuals</article-title>. <source>Nature genetics</source>. <year>2019</year>;<volume>51</volume>(<issue>6</issue>):<fpage>957</fpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1038/s41588-019-0407-x" xlink:type="simple">10.1038/s41588-019-0407-x</ext-link></comment> <object-id pub-id-type="pmid">31152163</object-id></mixed-citation>
</ref>
<ref id="pgen.1009575.ref055">
<label>55</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Nagel</surname> <given-names>M</given-names></name>, <name name-style="western"><surname>Jansen</surname> <given-names>PR</given-names></name>, <name name-style="western"><surname>Stringer</surname> <given-names>S</given-names></name>, <name name-style="western"><surname>Watanabe</surname> <given-names>K</given-names></name>, <name name-style="western"><surname>de Leeuw</surname> <given-names>CA</given-names></name>, <name name-style="western"><surname>Bryois</surname> <given-names>J</given-names></name>, <etal>et al</etal>. <article-title>Meta-analysis of genome-wide association studies for neuroticism in 449,484 individuals identifies novel genetic loci and pathways</article-title>. <source>Nature genetics</source>. <year>2018</year>;<volume>50</volume>(<issue>7</issue>):<fpage>920</fpage>–<lpage>927</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1038/s41588-018-0151-7" xlink:type="simple">10.1038/s41588-018-0151-7</ext-link></comment> <object-id pub-id-type="pmid">29942085</object-id></mixed-citation>
</ref>
<ref id="pgen.1009575.ref056">
<label>56</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Demontis</surname> <given-names>D</given-names></name>, <name name-style="western"><surname>Walters</surname> <given-names>RK</given-names></name>, <name name-style="western"><surname>Martin</surname> <given-names>J</given-names></name>, <name name-style="western"><surname>Mattheisen</surname> <given-names>M</given-names></name>, <name name-style="western"><surname>Als</surname> <given-names>TD</given-names></name>, <name name-style="western"><surname>Agerbo</surname> <given-names>E</given-names></name>, <etal>et al</etal>. <article-title>Discovery of the first genome-wide significant risk loci for attention deficit/hyperactivity disorder</article-title>. <source>Nature genetics</source>. <year>2019</year>;<volume>51</volume>(<issue>1</issue>):<fpage>63</fpage>–<lpage>75</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1038/s41588-018-0269-7" xlink:type="simple">10.1038/s41588-018-0269-7</ext-link></comment> <object-id pub-id-type="pmid">30478444</object-id></mixed-citation>
</ref>
<ref id="pgen.1009575.ref057">
<label>57</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Wray</surname> <given-names>NR</given-names></name>, <name name-style="western"><surname>Ripke</surname> <given-names>S</given-names></name>, <name name-style="western"><surname>Mattheisen</surname> <given-names>M</given-names></name>, <name name-style="western"><surname>Trzaskowski</surname> <given-names>M</given-names></name>, <name name-style="western"><surname>Byrne</surname> <given-names>EM</given-names></name>, <name name-style="western"><surname>Abdellaoui</surname> <given-names>A</given-names></name>, <etal>et al</etal>. <article-title>Genome-wide association analyses identify 44 risk variants and refine the genetic architecture of major depression</article-title>. <source>Nature genetics</source>. <year>2018</year>;<volume>50</volume>(<issue>5</issue>):<fpage>668</fpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1038/s41588-018-0090-3" xlink:type="simple">10.1038/s41588-018-0090-3</ext-link></comment> <object-id pub-id-type="pmid">29700475</object-id></mixed-citation>
</ref>
<ref id="pgen.1009575.ref058">
<label>58</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Stahl</surname> <given-names>EA</given-names></name>, <name name-style="western"><surname>Breen</surname> <given-names>G</given-names></name>, <name name-style="western"><surname>Forstner</surname> <given-names>AJ</given-names></name>, <name name-style="western"><surname>McQuillin</surname> <given-names>A</given-names></name>, <name name-style="western"><surname>Ripke</surname> <given-names>S</given-names></name>, <name name-style="western"><surname>Trubetskoy</surname> <given-names>V</given-names></name>, <etal>et al</etal>. <article-title>Genome-wide association study identifies 30 loci associated with bipolar disorder</article-title>. <source>Nature genetics</source>. <year>2019</year>;<volume>51</volume>(<issue>5</issue>):<fpage>793</fpage>–<lpage>803</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1038/s41588-019-0397-8" xlink:type="simple">10.1038/s41588-019-0397-8</ext-link></comment> <object-id pub-id-type="pmid">31043756</object-id></mixed-citation>
</ref>
<ref id="pgen.1009575.ref059">
<label>59</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<article-title>Meta-analysis of GWAS of over 16,000 individuals with autism spectrum disorder highlights a novel locus at 10q24. 32 and a significant overlap with schizophrenia</article-title>. <source>Molecular autism</source>. <year>2017</year>;<volume>8</volume>:<fpage>1</fpage>–<lpage>17</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1186/s13229-016-0115-7" xlink:type="simple">10.1186/s13229-016-0115-7</ext-link></comment> <object-id pub-id-type="pmid">28070266</object-id></mixed-citation>
</ref>
<ref id="pgen.1009575.ref060">
<label>60</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Ripke</surname> <given-names>S</given-names></name>, <name name-style="western"><surname>O’Dushlaine</surname> <given-names>C</given-names></name>, <name name-style="western"><surname>Chambert</surname> <given-names>K</given-names></name>, <name name-style="western"><surname>Moran</surname> <given-names>JL</given-names></name>, <name name-style="western"><surname>Kähler</surname> <given-names>AK</given-names></name>, <name name-style="western"><surname>Akterin</surname> <given-names>S</given-names></name>, <etal>et al</etal>. <article-title>Genome-wide association analysis identifies 13 new risk loci for schizophrenia</article-title>. <source>Nature genetics</source>. <year>2013</year>;<volume>45</volume>(<issue>10</issue>):<fpage>1150</fpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1038/ng.2742" xlink:type="simple">10.1038/ng.2742</ext-link></comment> <object-id pub-id-type="pmid">23974872</object-id></mixed-citation>
</ref>
<ref id="pgen.1009575.ref061">
<label>61</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Arnold</surname> <given-names>PD</given-names></name>, <name name-style="western"><surname>Askland</surname> <given-names>KD</given-names></name>, <name name-style="western"><surname>Barlassina</surname> <given-names>C</given-names></name>, <name name-style="western"><surname>Bellodi</surname> <given-names>L</given-names></name>, <name name-style="western"><surname>Bienvenu</surname> <given-names>O</given-names></name>, <name name-style="western"><surname>Black</surname> <given-names>D</given-names></name>, <etal>et al</etal>. <article-title>Revealing the complex genetic architecture of obsessive-compulsive disorder using meta-analysis</article-title>. <source>Molecular psychiatry</source>. <year>2018</year>;<volume>23</volume>(<issue>5</issue>):<fpage>1181</fpage>–<lpage>1181</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1038/mp.2017.154" xlink:type="simple">10.1038/mp.2017.154</ext-link></comment></mixed-citation>
</ref>
<ref id="pgen.1009575.ref062">
<label>62</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Marioni</surname> <given-names>RE</given-names></name>, <name name-style="western"><surname>Harris</surname> <given-names>SE</given-names></name>, <name name-style="western"><surname>Zhang</surname> <given-names>Q</given-names></name>, <name name-style="western"><surname>McRae</surname> <given-names>AF</given-names></name>, <name name-style="western"><surname>Hagenaars</surname> <given-names>SP</given-names></name>, <name name-style="western"><surname>Hill</surname> <given-names>WD</given-names></name>, <etal>et al</etal>. <article-title>GWAS on family history of Alzheimer’s disease</article-title>. <source>Translational psychiatry</source>. <year>2018</year>;<volume>8</volume>(<issue>1</issue>):<fpage>1</fpage>–<lpage>7</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1038/s41398-018-0150-6" xlink:type="simple">10.1038/s41398-018-0150-6</ext-link></comment> <object-id pub-id-type="pmid">29777097</object-id></mixed-citation>
</ref>
<ref id="pgen.1009575.ref063">
<label>63</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Hill</surname> <given-names>WD</given-names></name>, <name name-style="western"><surname>Weiss</surname> <given-names>A</given-names></name>, <name name-style="western"><surname>Liewald</surname> <given-names>DC</given-names></name>, <name name-style="western"><surname>Davies</surname> <given-names>G</given-names></name>, <name name-style="western"><surname>Porteous</surname> <given-names>DJ</given-names></name>, <name name-style="western"><surname>Hayward</surname> <given-names>C</given-names></name>, <etal>et al</etal>. <article-title>Genetic contributions to two special factors of neuroticism are associated with affluence, higher intelligence, better health, and longer life</article-title>. <source>Molecular psychiatry</source>. <year>2019</year>; p. <fpage>1</fpage>–<lpage>19</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1038/s41380-019-0387-3" xlink:type="simple">10.1038/s41380-019-0387-3</ext-link></comment> <object-id pub-id-type="pmid">30867560</object-id></mixed-citation>
</ref>
<ref id="pgen.1009575.ref064">
<label>64</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Savage</surname> <given-names>JE</given-names></name>, <name name-style="western"><surname>Jansen</surname> <given-names>PR</given-names></name>, <name name-style="western"><surname>Stringer</surname> <given-names>S</given-names></name>, <name name-style="western"><surname>Watanabe</surname> <given-names>K</given-names></name>, <name name-style="western"><surname>Bryois</surname> <given-names>J</given-names></name>, <name name-style="western"><surname>De Leeuw</surname> <given-names>CA</given-names></name>, <etal>et al</etal>. <article-title>Genome-wide association meta-analysis in 269,867 individuals identifies new genetic and functional links to intelligence</article-title>. <source>Nature genetics</source>. <year>2018</year>;<volume>50</volume>(<issue>7</issue>):<fpage>912</fpage>–<lpage>919</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1038/s41588-018-0152-6" xlink:type="simple">10.1038/s41588-018-0152-6</ext-link></comment> <object-id pub-id-type="pmid">29942086</object-id></mixed-citation>
</ref>
<ref id="pgen.1009575.ref065">
<label>65</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Lane</surname> <given-names>JM</given-names></name>, <name name-style="western"><surname>Jones</surname> <given-names>SE</given-names></name>, <name name-style="western"><surname>Dashti</surname> <given-names>HS</given-names></name>, <name name-style="western"><surname>Wood</surname> <given-names>AR</given-names></name>, <name name-style="western"><surname>Aragam</surname> <given-names>KG</given-names></name>, <name name-style="western"><surname>van Hees</surname> <given-names>VT</given-names></name>, <etal>et al</etal>. <article-title>Biological and clinical insights from genetics of insomnia symptoms</article-title>. <source>Nature genetics</source>. <year>2019</year>;<volume>51</volume>(<issue>3</issue>):<fpage>387</fpage>–<lpage>393</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1038/s41588-019-0361-7" xlink:type="simple">10.1038/s41588-019-0361-7</ext-link></comment> <object-id pub-id-type="pmid">30804566</object-id></mixed-citation>
</ref>
<ref id="pgen.1009575.ref066">
<label>66</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Yap</surname> <given-names>CX</given-names></name>, <name name-style="western"><surname>Sidorenko</surname> <given-names>J</given-names></name>, <name name-style="western"><surname>Wu</surname> <given-names>Y</given-names></name>, <name name-style="western"><surname>Kemper</surname> <given-names>KE</given-names></name>, <name name-style="western"><surname>Yang</surname> <given-names>J</given-names></name>, <name name-style="western"><surname>Wray</surname> <given-names>NR</given-names></name>, <etal>et al</etal>. <article-title>Dissection of genetic variation and evidence for pleiotropy in male pattern baldness</article-title>. <source>Nature communications</source>. <year>2018</year>;<volume>9</volume>(<issue>1</issue>):<fpage>1</fpage>–<lpage>12</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1038/s41467-018-07862-y" xlink:type="simple">10.1038/s41467-018-07862-y</ext-link></comment> <object-id pub-id-type="pmid">30573740</object-id></mixed-citation>
</ref>
<ref id="pgen.1009575.ref067">
<label>67</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Liu</surname> <given-names>JZ</given-names></name>, <name name-style="western"><surname>Van Sommeren</surname> <given-names>S</given-names></name>, <name name-style="western"><surname>Huang</surname> <given-names>H</given-names></name>, <name name-style="western"><surname>Ng</surname> <given-names>SC</given-names></name>, <name name-style="western"><surname>Alberts</surname> <given-names>R</given-names></name>, <name name-style="western"><surname>Takahashi</surname> <given-names>A</given-names></name>, <etal>et al</etal>. <article-title>Association analyses identify 38 susceptibility loci for inflammatory bowel disease and highlight shared genetic risk across populations</article-title>. <source>Nature genetics</source>. <year>2015</year>;<volume>47</volume>(<issue>9</issue>):<fpage>979</fpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1038/ng.3359" xlink:type="simple">10.1038/ng.3359</ext-link></comment> <object-id pub-id-type="pmid">26192919</object-id></mixed-citation>
</ref>
<ref id="pgen.1009575.ref068">
<label>68</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Michailidou</surname> <given-names>K</given-names></name>, <name name-style="western"><surname>Lindström</surname> <given-names>S</given-names></name>, <name name-style="western"><surname>Dennis</surname> <given-names>J</given-names></name>, <name name-style="western"><surname>Beesley</surname> <given-names>J</given-names></name>, <name name-style="western"><surname>Hui</surname> <given-names>S</given-names></name>, <name name-style="western"><surname>Kar</surname> <given-names>S</given-names></name>, <etal>et al</etal>. <article-title>Association analysis identifies 65 new breast cancer risk loci</article-title>. <source>Nature</source>. <year>2017</year>;<volume>551</volume>(<issue>7678</issue>):<fpage>92</fpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1038/nature24284" xlink:type="simple">10.1038/nature24284</ext-link></comment> <object-id pub-id-type="pmid">29059683</object-id></mixed-citation>
</ref>
<ref id="pgen.1009575.ref069">
<label>69</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Phelan</surname> <given-names>CM</given-names></name>, <name name-style="western"><surname>Kuchenbaecker</surname> <given-names>KB</given-names></name>, <name name-style="western"><surname>Tyrer</surname> <given-names>JP</given-names></name>, <name name-style="western"><surname>Kar</surname> <given-names>SP</given-names></name>, <name name-style="western"><surname>Lawrenson</surname> <given-names>K</given-names></name>, <name name-style="western"><surname>Winham</surname> <given-names>SJ</given-names></name>, <etal>et al</etal>. <article-title>Identification of 12 new susceptibility loci for different histotypes of epithelial ovarian cancer</article-title>. <source>Nature genetics</source>. <year>2017</year>;<volume>49</volume>(<issue>5</issue>):<fpage>680</fpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1038/ng.3826" xlink:type="simple">10.1038/ng.3826</ext-link></comment> <object-id pub-id-type="pmid">28346442</object-id></mixed-citation>
</ref>
<ref id="pgen.1009575.ref070">
<label>70</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Schumacher</surname> <given-names>FR</given-names></name>, <name name-style="western"><surname>Al Olama</surname> <given-names>AA</given-names></name>, <name name-style="western"><surname>Berndt</surname> <given-names>SI</given-names></name>, <name name-style="western"><surname>Benlloch</surname> <given-names>S</given-names></name>, <name name-style="western"><surname>Ahmed</surname> <given-names>M</given-names></name>, <name name-style="western"><surname>Saunders</surname> <given-names>EJ</given-names></name>, <etal>et al</etal>. <article-title>Association analyses of more than 140,000 men identify 63 new prostate cancer susceptibility loci</article-title>. <source>Nature genetics</source>. <year>2018</year>;<volume>50</volume>(<issue>7</issue>):<fpage>928</fpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1038/s41588-018-0142-8" xlink:type="simple">10.1038/s41588-018-0142-8</ext-link></comment> <object-id pub-id-type="pmid">29892016</object-id></mixed-citation>
</ref>
<ref id="pgen.1009575.ref071">
<label>71</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Buniello</surname> <given-names>A</given-names></name>, <name name-style="western"><surname>MacArthur</surname> <given-names>JAL</given-names></name>, <name name-style="western"><surname>Cerezo</surname> <given-names>M</given-names></name>, <name name-style="western"><surname>Harris</surname> <given-names>LW</given-names></name>, <name name-style="western"><surname>Hayhurst</surname> <given-names>J</given-names></name>, <name name-style="western"><surname>Malangone</surname> <given-names>C</given-names></name>, <etal>et al</etal>. <article-title>The NHGRI-EBI GWAS Catalog of published genome-wide association studies, targeted arrays and summary statistics 2019</article-title>. <source>Nucleic acids research</source>. <year>2019</year>;<volume>47</volume>(<issue>D1</issue>):<fpage>D1005</fpage>–<lpage>D1012</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1093/nar/gky1120" xlink:type="simple">10.1093/nar/gky1120</ext-link></comment> <object-id pub-id-type="pmid">30445434</object-id></mixed-citation>
</ref>
<ref id="pgen.1009575.ref072">
<label>72</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Wang</surname> <given-names>J</given-names></name>, <name name-style="western"><surname>Li</surname> <given-names>F</given-names></name>, <name name-style="western"><surname>Wei</surname> <given-names>H</given-names></name>, <name name-style="western"><surname>Lian</surname> <given-names>ZX</given-names></name>, <name name-style="western"><surname>Sun</surname> <given-names>R</given-names></name>, <name name-style="western"><surname>Tian</surname> <given-names>Z</given-names></name>. <article-title>Respiratory influenza virus infection induces intestinal immune injury via microbiota-mediated Th17 cell–dependent inflammation</article-title>. <source>Journal of Experimental Medicine</source>. <year>2014</year>;<volume>211</volume>(<issue>12</issue>):<fpage>2397</fpage>–<lpage>2410</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1084/jem.20140625" xlink:type="simple">10.1084/jem.20140625</ext-link></comment></mixed-citation>
</ref>
<ref id="pgen.1009575.ref073">
<label>73</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Zhao</surname> <given-names>Q</given-names></name>, <name name-style="western"><surname>Wang</surname> <given-names>J</given-names></name>, <name name-style="western"><surname>Miao</surname> <given-names>Z</given-names></name>, <name name-style="western"><surname>Zhang</surname> <given-names>N</given-names></name>, <name name-style="western"><surname>Hennessy</surname> <given-names>S</given-names></name>, <name name-style="western"><surname>Small</surname> <given-names>DS</given-names></name>, <etal>et al</etal>. <article-title>A Mendelian randomization study of the role of lipoprotein subfractions in coronary artery disease</article-title>. <source>Elife</source>. <year>2021</year>; <fpage>e58361</fpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.7554/eLife.58361" xlink:type="simple">10.7554/eLife.58361</ext-link></comment> <object-id pub-id-type="pmid">33899735</object-id></mixed-citation>
</ref>
<ref id="pgen.1009575.ref074">
<label>74</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>White</surname> <given-names>J</given-names></name>, <name name-style="western"><surname>Swerdlow</surname> <given-names>DI</given-names></name>, <name name-style="western"><surname>Preiss</surname> <given-names>D</given-names></name>, <name name-style="western"><surname>Fairhurst-Hunter</surname> <given-names>Z</given-names></name>, <name name-style="western"><surname>Keating</surname> <given-names>BJ</given-names></name>, <name name-style="western"><surname>Asselbergs</surname> <given-names>FW</given-names></name>, <etal>et al</etal>. <article-title>Association of lipid fractions with risks for coronary artery disease and diabetes</article-title>. <source>JAMA cardiology</source>. <year>2016</year>;<volume>1</volume>(<issue>6</issue>):<fpage>692</fpage>–<lpage>699</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1001/jamacardio.2016.1884" xlink:type="simple">10.1001/jamacardio.2016.1884</ext-link></comment> <object-id pub-id-type="pmid">27487401</object-id></mixed-citation>
</ref>
<ref id="pgen.1009575.ref075">
<label>75</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Yadav</surname> <given-names>RS</given-names></name>, <name name-style="western"><surname>Tiwari</surname> <given-names>NK</given-names></name>. <article-title>Lipid integration in neurodegeneration: an overview of Alzheimer’s disease</article-title>. <source>Molecular neurobiology</source>. <year>2014</year>;<volume>50</volume>(<issue>1</issue>):<fpage>168</fpage>–<lpage>176</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1007/s12035-014-8661-5" xlink:type="simple">10.1007/s12035-014-8661-5</ext-link></comment></mixed-citation>
</ref>
<ref id="pgen.1009575.ref076">
<label>76</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Hibbeln</surname> <given-names>JR</given-names></name>, <name name-style="western"><surname>Salem</surname> <given-names>N</given-names> <suffix>Jr</suffix></name>. <article-title>Dietary polyunsaturated fatty acids and depression: when cholesterol does not satisfy</article-title>. <source>The American journal of clinical nutrition</source>. <year>1995</year>;<volume>62</volume>(<issue>1</issue>):<fpage>1</fpage>–<lpage>9</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1093/ajcn/62.1.1" xlink:type="simple">10.1093/ajcn/62.1.1</ext-link></comment></mixed-citation>
</ref>
<ref id="pgen.1009575.ref077">
<label>77</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Agouridis</surname> <given-names>AP</given-names></name>, <name name-style="western"><surname>Elisaf</surname> <given-names>M</given-names></name>, <name name-style="western"><surname>Milionis</surname> <given-names>HJ</given-names></name>. <article-title>An overview of lipid abnormalities in patients with inflammatory bowel disease</article-title>. <source>Annals of Gastroenterology: Quarterly Publication of the Hellenic Society of Gastroenterology</source>. <year>2011</year>;<volume>24</volume>(<issue>3</issue>):<fpage>181</fpage>.</mixed-citation>
</ref>
<ref id="pgen.1009575.ref078">
<label>78</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Fall</surname> <given-names>T</given-names></name>, <name name-style="western"><surname>Xie</surname> <given-names>W</given-names></name>, <name name-style="western"><surname>Poon</surname> <given-names>W</given-names></name>, <name name-style="western"><surname>Yaghootkar</surname> <given-names>H</given-names></name>, <name name-style="western"><surname>Mägi</surname> <given-names>R</given-names></name>, <name name-style="western"><surname>Knowles</surname> <given-names>JW</given-names></name>, <etal>et al</etal>. <article-title>Using genetic variants to assess the relationship between circulating lipids and type 2 diabetes</article-title>. <source>Diabetes</source>. <year>2015</year>; p. <fpage>db141710</fpage>. <object-id pub-id-type="pmid">25948681</object-id></mixed-citation>
</ref>
<ref id="pgen.1009575.ref079">
<label>79</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Burgess</surname> <given-names>S</given-names></name>, <name name-style="western"><surname>Thompson</surname> <given-names>SG</given-names></name>. <article-title>Multivariable Mendelian randomization: the use of pleiotropic genetic variants to estimate causal effects</article-title>. <source>American journal of epidemiology</source>. <year>2015</year>;<volume>181</volume>(<issue>4</issue>):<fpage>251</fpage>–<lpage>260</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1093/aje/kwu283" xlink:type="simple">10.1093/aje/kwu283</ext-link></comment></mixed-citation>
</ref>
<ref id="pgen.1009575.ref080">
<label>80</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Zhao</surname> <given-names>Q</given-names></name>, <name name-style="western"><surname>Chen</surname> <given-names>Y</given-names></name>, <name name-style="western"><surname>Wang</surname> <given-names>J</given-names></name>, <name name-style="western"><surname>Small</surname> <given-names>DS</given-names></name>. <article-title>Powerful three-sample genome-wide design and robust statistical inference in summary-data Mendelian randomization</article-title>. <source>International Journal of Epidemiology</source>. <year>2019</year>;<volume>48</volume>(<issue>5</issue>):<fpage>1478</fpage>–<lpage>1492</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1093/ije/dyz142" xlink:type="simple">10.1093/ije/dyz142</ext-link></comment></mixed-citation>
</ref>
<ref id="pgen.1009575.ref081">
<label>81</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Cole</surname> <given-names>SR</given-names></name>, <name name-style="western"><surname>Frangakis</surname> <given-names>CE</given-names></name>. <article-title>The consistency statement in causal inference: a definition or an assumption?</article-title> <source>Epidemiology</source>. <year>2009</year>;<volume>20</volume>(<issue>1</issue>):<fpage>3</fpage>–<lpage>5</lpage>.</mixed-citation>
</ref>
<ref id="pgen.1009575.ref082">
<label>82</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Davey Smith</surname> <given-names>G</given-names></name>. <article-title>Epigenesis for epidemiologists: does evo-devo have implications for population health research and practice?</article-title> <source>International Journal of Epidemiology</source>. <year>2012</year>(<issue>1</issue>); <volume>41</volume>:<fpage>236</fpage>–<lpage>247</lpage>.</mixed-citation>
</ref>
<ref id="pgen.1009575.ref083">
<label>83</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Holmes</surname> <given-names>MV</given-names></name> and <name name-style="western"><surname>Davey Smith</surname> <given-names>G</given-names></name>. <article-title>Revealing the effect of CETP inhibition in cardiovascular disease</article-title>. <source>Nature Reviews Cardiology</source>. <year>2017</year>;<volume>14</volume>:<fpage>635</fpage>–<lpage>636</lpage>.</mixed-citation>
</ref>
<ref id="pgen.1009575.ref084">
<label>84</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Munafò</surname> <given-names>MR</given-names></name>, <name name-style="western"><surname>Davey Smith</surname> <given-names>G</given-names></name>. <article-title>Robust research needs many lines of evidence: Replication is not enough</article-title>. <source>Nature</source>. <year>2018</year>; <volume>553</volume>:<fpage>399</fpage>–<lpage>401</lpage>.</mixed-citation>
</ref>
<ref id="pgen.1009575.ref085">
<label>85</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Munafo</surname> <given-names>MR</given-names></name>, <name name-style="western"><surname>Higgins</surname> <given-names>JPT</given-names></name>, <name name-style="western"><surname>Davey Smith</surname> <given-names>G</given-names></name>. <article-title>Triangulating evidence through the inclusion of genetically informed designs</article-title>. <source>Cold Spring Harbour Perspectives in Medicine Collection</source>. <year>2021</year>, <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1101/cshperspect.a040659" xlink:type="simple">10.1101/cshperspect.a040659</ext-link></comment></mixed-citation>
</ref>
<ref id="pgen.1009575.ref086">
<label>86</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Bulik-Sullivan</surname> <given-names>B</given-names></name>, <name name-style="western"><surname>Finucane</surname> <given-names>HK</given-names></name>, <name name-style="western"><surname>Anttila</surname> <given-names>V</given-names></name>, <name name-style="western"><surname>Gusev</surname> <given-names>A</given-names></name>, <name name-style="western"><surname>Day</surname> <given-names>FR</given-names></name>, <name name-style="western"><surname>Loh</surname> <given-names>PR</given-names></name>, <etal>et al</etal>. <article-title>An atlas of genetic correlations across human diseases and traits</article-title>. <source>Nature genetics</source>. <year>2015</year>;<volume>47</volume>(<issue>11</issue>):<fpage>1236</fpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1038/ng.3406" xlink:type="simple">10.1038/ng.3406</ext-link></comment> <object-id pub-id-type="pmid">26414676</object-id></mixed-citation>
</ref>
<ref id="pgen.1009575.ref087">
<label>87</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<collab>International Schizophrenia Consortium</collab>, <name name-style="western"><surname>Purcell</surname> <given-names>SM</given-names></name>, <name name-style="western"><surname>Wray</surname> <given-names>NR</given-names></name>, <name name-style="western"><surname>Stone</surname> <given-names>JL</given-names></name>, <name name-style="western"><surname>Visscher</surname> <given-names>PM</given-names></name>, <name name-style="western"><surname>O’Donovan</surname> <given-names>MC</given-names></name>, <etal>et al</etal>. <article-title>Common polygenic variation contributes to risk of schizophrenia and bipolar disorder</article-title>. <source>Nature</source>. <year>2009</year>;<volume>460</volume>(<issue>7256</issue>):<fpage>748</fpage>–<lpage>752</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1038/nature08185" xlink:type="simple">10.1038/nature08185</ext-link></comment> <object-id pub-id-type="pmid">19571811</object-id></mixed-citation>
</ref>
<ref id="pgen.1009575.ref088">
<label>88</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Ward</surname> <given-names>LD</given-names></name>, <name name-style="western"><surname>Kellis</surname> <given-names>M</given-names></name>. <article-title>HaploReg: a resource for exploring chromatin states, conservation, and regulatory motif alterations within sets of genetically linked variants</article-title>. <source>Nucleic acids research</source>. <year>2012</year>;<volume>40</volume>(<issue>D1</issue>):<fpage>D930</fpage>–<lpage>D934</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1093/nar/gkr917" xlink:type="simple">10.1093/nar/gkr917</ext-link></comment></mixed-citation>
</ref>
<ref id="pgen.1009575.ref089">
<label>89</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Benjamini</surname> <given-names>Y</given-names></name>, <name name-style="western"><surname>Heller</surname> <given-names>R</given-names></name>. <article-title>Screening for partial conjunction hypotheses</article-title>. <source>Biometrics</source>. <year>2008</year>;<volume>64</volume>(<issue>4</issue>):<fpage>1215</fpage>–<lpage>1222</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1111/j.1541-0420.2007.00984.x" xlink:type="simple">10.1111/j.1541-0420.2007.00984.x</ext-link></comment></mixed-citation>
</ref>
</ref-list>
</back>
</article>