<?xml version="1.0" encoding="utf-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD v1.1d3 20150301//EN" "http://jats.nlm.nih.gov/publishing/1.1d3/JATS-journalpublishing1.dtd">
<article article-type="research-article" dtd-version="1.1d3" xml:lang="en" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink">
<front>
<journal-meta>
<journal-id journal-id-type="nlm-ta">PLoS Genet</journal-id>
<journal-id journal-id-type="publisher-id">plos</journal-id>
<journal-id journal-id-type="pmc">plosgen</journal-id>
<journal-title-group>
<journal-title>PLOS Genetics</journal-title>
</journal-title-group>
<issn pub-type="ppub">1553-7390</issn>
<issn pub-type="epub">1553-7404</issn>
<publisher>
<publisher-name>Public Library of Science</publisher-name>
<publisher-loc>San Francisco, CA USA</publisher-loc>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="publisher-id">PGENETICS-D-19-01506</article-id>
<article-id pub-id-type="doi">10.1371/journal.pgen.1009241</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Research Article</subject>
</subj-group>
<subj-group subj-group-type="Discipline-v3">
<subject>Biology and life sciences</subject><subj-group><subject>Genetics</subject><subj-group><subject>Heredity</subject><subj-group><subject>Inbreeding</subject></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3">
<subject>Physical sciences</subject><subj-group><subject>Mathematics</subject><subj-group><subject>Statistics</subject><subj-group><subject>Statistical models</subject></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3">
<subject>Biology and life sciences</subject><subj-group><subject>Computational biology</subject><subj-group><subject>Genome analysis</subject><subj-group><subject>Genome-wide association studies</subject></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3">
<subject>Biology and life sciences</subject><subj-group><subject>Genetics</subject><subj-group><subject>Genomics</subject><subj-group><subject>Genome analysis</subject><subj-group><subject>Genome-wide association studies</subject></subj-group></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3">
<subject>Biology and life sciences</subject><subj-group><subject>Genetics</subject><subj-group><subject>Human genetics</subject><subj-group><subject>Genome-wide association studies</subject></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3">
<subject>Research and analysis methods</subject><subj-group><subject>Simulation and modeling</subject></subj-group></subj-group><subj-group subj-group-type="Discipline-v3">
<subject>Biology and life sciences</subject><subj-group><subject>Genetics</subject><subj-group><subject>Heredity</subject><subj-group><subject>Genetic mapping</subject><subj-group><subject>Variant genotypes</subject></subj-group></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3">
<subject>Biology and life sciences</subject><subj-group><subject>Genetics</subject><subj-group><subject>Heredity</subject></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3">
<subject>Biology and life sciences</subject><subj-group><subject>Evolutionary biology</subject><subj-group><subject>Population genetics</subject></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3">
<subject>Biology and life sciences</subject><subj-group><subject>Genetics</subject><subj-group><subject>Population genetics</subject></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3">
<subject>Biology and life sciences</subject><subj-group><subject>Population biology</subject><subj-group><subject>Population genetics</subject></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3">
<subject>Biology and life sciences</subject><subj-group><subject>Genetics</subject><subj-group><subject>Genetic loci</subject></subj-group></subj-group></subj-group></article-categories>
<title-group>
<article-title>Estimating <italic>F</italic><sub>ST</sub> and kinship for arbitrary population structures</article-title>
<alt-title alt-title-type="running-head">Estimating <italic>F</italic><sub>ST</sub> and kinship for arbitrary population structures</alt-title>
</title-group>
<contrib-group>
<contrib contrib-type="author" xlink:type="simple">
<contrib-id authenticated="true" contrib-id-type="orcid">https://orcid.org/0000-0003-4928-3403</contrib-id>
<name name-style="western">
<surname>Ochoa</surname> <given-names>Alejandro</given-names></name>
<role content-type="https://casrai.org/credit/">Conceptualization</role>
<role content-type="https://casrai.org/credit/">Formal analysis</role>
<role content-type="https://casrai.org/credit/">Funding acquisition</role>
<role content-type="https://casrai.org/credit/">Investigation</role>
<role content-type="https://casrai.org/credit/">Methodology</role>
<role content-type="https://casrai.org/credit/">Software</role>
<role content-type="https://casrai.org/credit/">Writing – original draft</role>
<role content-type="https://casrai.org/credit/">Writing – review &amp; editing</role>
<xref ref-type="aff" rid="aff001"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff002"><sup>2</sup></xref>
</contrib>
<contrib contrib-type="author" corresp="yes" xlink:type="simple">
<contrib-id authenticated="true" contrib-id-type="orcid">https://orcid.org/0000-0001-5992-402X</contrib-id>
<name name-style="western">
<surname>Storey</surname> <given-names>John D.</given-names></name>
<role content-type="https://casrai.org/credit/">Conceptualization</role>
<role content-type="https://casrai.org/credit/">Formal analysis</role>
<role content-type="https://casrai.org/credit/">Funding acquisition</role>
<role content-type="https://casrai.org/credit/">Investigation</role>
<role content-type="https://casrai.org/credit/">Methodology</role>
<role content-type="https://casrai.org/credit/">Writing – original draft</role>
<role content-type="https://casrai.org/credit/">Writing – review &amp; editing</role>
<xref ref-type="aff" rid="aff003"><sup>3</sup></xref>
<xref ref-type="corresp" rid="cor001">*</xref>
</contrib>
</contrib-group>
<aff id="aff001">
<label>1</label>
<addr-line>Duke Center for Statistical Genetics and Genomics, Duke University, Durham, North Carolina, United States of America</addr-line>
</aff>
<aff id="aff002">
<label>2</label>
<addr-line>Department of Biostatistics and Bioinformatics, Duke University, Durham, North Carolina, United States of America</addr-line>
</aff>
<aff id="aff003">
<label>3</label>
<addr-line>Lewis-Sigler Institute for Integrative Genomics, Princeton University, Princeton, New Jersey, United States of America</addr-line>
</aff>
<contrib-group>
<contrib contrib-type="editor" xlink:type="simple">
<name name-style="western">
<surname>Feldman</surname> <given-names>Marcus W.</given-names></name>
<role>Editor</role>
<xref ref-type="aff" rid="edit1"/>
</contrib>
</contrib-group>
<aff id="edit1">
<addr-line>Stanford University, UNITED STATES</addr-line>
</aff>
<author-notes>
<fn fn-type="conflict" id="coi001">
<p>The authors have declared that no competing interests exist.</p>
</fn>
<corresp id="cor001">* E-mail: <email xlink:type="simple">jstorey@princeton.edu</email></corresp>
</author-notes>
<pub-date pub-type="collection">
<month>1</month>
<year>2021</year>
</pub-date>
<pub-date pub-type="epub">
<day>19</day>
<month>1</month>
<year>2021</year>
</pub-date>
<volume>17</volume>
<issue>1</issue>
<elocation-id>e1009241</elocation-id>
<history>
<date date-type="received">
<day>11</day>
<month>9</month>
<year>2019</year>
</date>
<date date-type="accepted">
<day>2</day>
<month>11</month>
<year>2020</year>
</date>
</history>
<permissions>
<copyright-year>2021</copyright-year>
<copyright-holder>Ochoa, Storey</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/" xlink:type="simple">
<license-p>This is an open access article distributed under the terms of the <ext-link ext-link-type="uri" xlink:href="http://creativecommons.org/licenses/by/4.0/" xlink:type="simple">Creative Commons Attribution License</ext-link>, which permits unrestricted use, distribution, and reproduction in any medium, provided the original author and source are credited.</license-p>
</license>
</permissions>
<self-uri content-type="pdf" xlink:href="info:doi/10.1371/journal.pgen.1009241"/>
<abstract>
<p><italic>F</italic><sub>ST</sub> and kinship are key parameters often estimated in modern population genetics studies in order to quantitatively characterize structure and relatedness. Kinship matrices have also become a fundamental quantity used in genome-wide association studies and heritability estimation. The most frequently-used estimators of <italic>F</italic><sub>ST</sub> and kinship are method-of-moments estimators whose accuracies depend strongly on the existence of simple underlying forms of structure, such as the independent subpopulations model of non-overlapping, independently evolving subpopulations. However, modern data sets have revealed that these simple models of structure likely do not hold in many populations, including humans. In this work, we analyze the behavior of these estimators in the presence of arbitrarily-complex population structures, which results in an improved estimation framework specifically designed for arbitrary population structures. After generalizing the definition of <italic>F</italic><sub>ST</sub> to arbitrary population structures and establishing a framework for assessing bias and consistency of genome-wide estimators, we calculate the accuracy of existing <italic>F</italic><sub>ST</sub> and kinship estimators under arbitrary population structures, characterizing biases and estimation challenges unobserved under their originally-assumed models of structure. We then present our new approach, which consistently estimates kinship and <italic>F</italic><sub>ST</sub> when the minimum kinship value in the dataset is estimated consistently. We illustrate our results using simulated genotypes from an admixture model, constructing a one-dimensional geographic scenario that departs nontrivially from the independent subpopulations model. Our simulations reveal the potential for severe biases in estimates of existing approaches that are overcome by our new framework. This work may significantly improve future analyses that rely on accurate kinship and <italic>F</italic><sub>ST</sub> estimates.</p>
</abstract>
<abstract abstract-type="summary">
<title>Author summary</title>
<p>Kinship coefficients and <italic>F</italic><sub>ST</sub>, which measure relatedness and population structure, respectively, are important quantities needed to accurately perform various analyses on genetic data, including genome-wide association studies and heritability estimation. However, existing estimators require restrictive assumptions of independence that are not met by real human and other datasets. In this work we find that existing estimators can be severely biased under reasonable scenarios, first by theoretically determining their properties, and then using an admixture simulation to illustrate our findings. In particular, we find that existing <italic>F</italic><sub>ST</sub> estimators are downwardly biased, and that existing kinship matrix estimators have related biases that are on average downward and of similar magnitude but vary for every pair of individuals. These insights led us to a new estimation framework for kinship and <italic>F</italic><sub>ST</sub> that is practically unbiased for any population structure, as demonstrated by theory and simulations. Our new approaches—available as open-source R packages—are easy to use and are more widely applicable than existing approaches, and they are likely to improve downstream analyses that require accurate kinship and <italic>F</italic><sub>ST</sub> estimates.</p>
</abstract>
<funding-group>
<award-group id="award001">
<funding-source>
<institution-wrap>
<institution-id institution-id-type="funder-id">http://dx.doi.org/10.13039/100000051</institution-id>
<institution>National Human Genome Research Institute</institution>
</institution-wrap>
</funding-source>
<award-id>R01 HG006448</award-id>
<principal-award-recipient>
<contrib-id authenticated="true" contrib-id-type="orcid">https://orcid.org/0000-0001-5992-402X</contrib-id>
<name name-style="western">
<surname>Storey</surname> <given-names>John D.</given-names></name>
</principal-award-recipient>
</award-group>
<funding-statement>This research was supported in part by National Institutes of Health, National Human Genome Research Institute grant R01 HG006448 (JDS). The funders had no role in study design, data collection and analysis, decision to publish, or preparation of the manuscript.</funding-statement>
</funding-group>
<counts>
<fig-count count="7"/>
<table-count count="0"/>
<page-count count="36"/>
</counts>
<custom-meta-group>
<custom-meta>
<meta-name>PLOS Publication Stage</meta-name>
<meta-value>vor-update-to-uncorrected-proof</meta-value>
</custom-meta>
<custom-meta>
<meta-name>Publication Update</meta-name>
<meta-value>2021-01-29</meta-value>
</custom-meta>
<custom-meta id="data-availability">
<meta-name>Data Availability</meta-name>
<meta-value>The data and computer code for these manuscripts can be found at <ext-link ext-link-type="uri" xlink:href="https://github.com/StoreyLab/human-differentiation-manuscript" xlink:type="simple">https://github.com/StoreyLab/human-differentiation-manuscript</ext-link>.</meta-value>
</custom-meta>
</custom-meta-group>
</article-meta>
</front>
<body>
<sec id="sec001" sec-type="intro">
<title>Introduction</title>
<p>In population genetics studies, one is often interested in characterizing structure, genetic differentiation, and relatedness among individuals. Two quantities often considered in this context are <italic>F</italic><sub>ST</sub> and kinship. <italic>F</italic><sub>ST</sub> is a parameter that measures structure in a subdivided population, satisfying <italic>F</italic><sub>ST</sub> = 0 for an unstructured population and <italic>F</italic><sub>ST</sub> = 1 if every locus has become fixed for some allele in each subpopulation. More generally, <italic>F</italic><sub>ST</sub> is the probability that alleles drawn randomly from a subpopulation are “identical by descent” (IBD) relative to an ancestral population [<xref ref-type="bibr" rid="pgen.1009241.ref001">1</xref>, <xref ref-type="bibr" rid="pgen.1009241.ref002">2</xref>]. The kinship coefficient is a measure of relatedness between individuals defined in terms of IBD probabilities, and it is closely related to <italic>F</italic><sub>ST</sub>, since the mean kinship of the parents in a subpopulation is the <italic>F</italic><sub>ST</sub> of the following generation [<xref ref-type="bibr" rid="pgen.1009241.ref001">1</xref>].</p>
<p>This work focuses on the estimation of <italic>F</italic><sub>ST</sub> and kinship from biallelic single-nucleotide polymorphism (SNP) data. Existing estimators can be classified into parametric estimators (methods that require a likelihood function) and non-parametric estimators (such as the method-of-moments estimators we focus on, which only require low-order moment equations). There are many likelihood approaches that estimate <italic>F</italic><sub>ST</sub> and kinship, but these are limited by assuming independent subpopulations or Normal approximations for <italic>F</italic><sub>ST</sub> [<xref ref-type="bibr" rid="pgen.1009241.ref003">3</xref>–<xref ref-type="bibr" rid="pgen.1009241.ref011">11</xref>] or totally outbred individuals for kinship [<xref ref-type="bibr" rid="pgen.1009241.ref012">12</xref>, <xref ref-type="bibr" rid="pgen.1009241.ref013">13</xref>]. Additionally, more complete likelihood models such as that of Jacquard [<xref ref-type="bibr" rid="pgen.1009241.ref014">14</xref>] are underdetermined for biallelic loci [<xref ref-type="bibr" rid="pgen.1009241.ref015">15</xref>]. Non-parametric approaches such as those based on the method of moments are considerably more flexible and computationally tractable [<xref ref-type="bibr" rid="pgen.1009241.ref016">16</xref>], so they are the natural choice to study arbitrary population structures.</p>
<p>The most frequently-used <italic>F</italic><sub>ST</sub> estimators are derived and justified under the “independent subpopulations model,” in which non-overlapping subpopulations evolved independently by splitting all at the same time from a common ancestral population. The Weir-Cockerham (WC) <italic>F</italic><sub>ST</sub> estimator assumes subpopulations of differing sample sizes and equal per-subpopulation <italic>F</italic><sub>ST</sub> relative to the common ancestral population [<xref ref-type="bibr" rid="pgen.1009241.ref017">17</xref>]. The Weir-Hill <italic>F</italic><sub>ST</sub> estimator generalized WC for subpopulations with different <italic>F</italic><sub>ST</sub> values, and first considered arbitrary coancestry between subpopulations, resulting in estimates of a linearly-transformed <italic>F</italic><sub>ST</sub>, namely <inline-formula id="pgen.1009241.e001"><alternatives><graphic id="pgen.1009241.e001g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e001" xlink:type="simple"/><mml:math display="inline" id="M1"><mml:mrow><mml:mrow><mml:mo>(</mml:mo><mml:msub><mml:mi>F</mml:mi><mml:mtext>ST</mml:mtext></mml:msub><mml:mo>-</mml:mo><mml:mover accent="true"><mml:mi>θ</mml:mi><mml:mo>˜</mml:mo></mml:mover><mml:mo>)</mml:mo></mml:mrow><mml:mo>/</mml:mo><mml:mrow><mml:mo>(</mml:mo><mml:mn>1</mml:mn><mml:mo>-</mml:mo><mml:mover accent="true"><mml:mi>θ</mml:mi><mml:mo>˜</mml:mo></mml:mover><mml:mo>)</mml:mo></mml:mrow></mml:mrow></mml:math></alternatives></inline-formula> (where <inline-formula id="pgen.1009241.e002"><alternatives><graphic id="pgen.1009241.e002g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e002" xlink:type="simple"/><mml:math display="inline" id="M2"><mml:mover accent="true"><mml:mi>θ</mml:mi><mml:mo>˜</mml:mo></mml:mover></mml:math></alternatives></inline-formula> is the unknown mean coancestry value between subpopulations) [<xref ref-type="bibr" rid="pgen.1009241.ref004">4</xref>, <xref ref-type="bibr" rid="pgen.1009241.ref018">18</xref>, <xref ref-type="bibr" rid="pgen.1009241.ref019">19</xref>]. Weir-Hill has further evolved into the Weir-Goudet approach, incorporating relatedness for subpopulations and individuals based on allele matching, also estimating a linearly-transformed <italic>F</italic><sub>ST</sub> [<xref ref-type="bibr" rid="pgen.1009241.ref020">20</xref>–<xref ref-type="bibr" rid="pgen.1009241.ref022">22</xref>]. Note that the Weir-Hill and Weir-Goudet approaches intended to estimate such linearly-transformed quantities, which may be negative, and they did not aim to estimate IBD probabilities [<xref ref-type="bibr" rid="pgen.1009241.ref004">4</xref>, <xref ref-type="bibr" rid="pgen.1009241.ref018">18</xref>–<xref ref-type="bibr" rid="pgen.1009241.ref022">22</xref>]; in contrast, our goal is to estimate IBD probabilities, which must be non-negative and valid probabilities. The “Hudson” <italic>F</italic><sub>ST</sub> estimator [<xref ref-type="bibr" rid="pgen.1009241.ref023">23</xref>] assumes two subpopulations with different <italic>F</italic><sub>ST</sub> values. All of the previous <italic>F</italic><sub>ST</sub> estimators are ratio estimators derived using the method of moments to have unbiased numerators and denominators, which gives approximately unbiased ratio estimates when their assumptions are met [<xref ref-type="bibr" rid="pgen.1009241.ref004">4</xref>, <xref ref-type="bibr" rid="pgen.1009241.ref017">17</xref>, <xref ref-type="bibr" rid="pgen.1009241.ref023">23</xref>]. We also evaluate BayeScan [<xref ref-type="bibr" rid="pgen.1009241.ref010">10</xref>], which estimates population-specific <italic>F</italic><sub>ST</sub> values using a Bayesian model and the Dirichlet-Multinomial likelihood function—thus representing non-method-of-moments approaches—but which like other existing <italic>F</italic><sub>ST</sub> estimators also assumes that subpopulations are non-overlapping and evolve independently. These <italic>F</italic><sub>ST</sub> estimators are important contributions, used widely in the field.</p>
<p>Kinship coefficients are now commonly calculated in population genetics studies to capture structure and relatedness. Kinship is utilized in principal components analyses and linear-mixed effects models to correct for structure in Genome-Wide Association Studies (GWAS) [<xref ref-type="bibr" rid="pgen.1009241.ref016">16</xref>, <xref ref-type="bibr" rid="pgen.1009241.ref024">24</xref>–<xref ref-type="bibr" rid="pgen.1009241.ref030">30</xref>] and to estimate genome-wide heritability [<xref ref-type="bibr" rid="pgen.1009241.ref031">31</xref>, <xref ref-type="bibr" rid="pgen.1009241.ref032">32</xref>]. Often absent in previous models is a clear identification and role of the ancestral population <italic>T</italic> that sets the scale of the kinship estimates used. Omission of <italic>T</italic> makes sense when kinship is estimated on an unstructured population (where only a few individual pairs are closely related; there <italic>T</italic> is the current population). Our more complete notation brings <italic>T</italic> to the fore and highlights its key role in kinship estimation and its applications. The most commonly-used kinship estimator [<xref ref-type="bibr" rid="pgen.1009241.ref016">16</xref>, <xref ref-type="bibr" rid="pgen.1009241.ref027">27</xref>, <xref ref-type="bibr" rid="pgen.1009241.ref030">30</xref>–<xref ref-type="bibr" rid="pgen.1009241.ref036">36</xref>] is also a method-of-moments estimator whose operating characteristics are largely unknown in the presence of structure. We show here that this popular estimator is accurate only when the average kinship is zero, which implies that the population must be unstructured.</p>
<p>The goal of our work is to consistently estimate IBD probabilities, namely kinship coefficients and <italic>F</italic><sub>ST</sub>, for which there are currently no consistent estimators under general relatedness. Estimation of these as probabilities, as opposed to linearly-transformed quantities that may be negative, is important since the probabilistic definition of these parameters was required to derive their fundamental connections to many applications in genetics, including allele fixation [<xref ref-type="bibr" rid="pgen.1009241.ref001">1</xref>, <xref ref-type="bibr" rid="pgen.1009241.ref002">2</xref>, <xref ref-type="bibr" rid="pgen.1009241.ref037">37</xref>], DNA forensics [<xref ref-type="bibr" rid="pgen.1009241.ref003">3</xref>], and heritability [<xref ref-type="bibr" rid="pgen.1009241.ref038">38</xref>, <xref ref-type="bibr" rid="pgen.1009241.ref039">39</xref>]. Although IBD probabilities are not absolute, but rather depend on the choice of ancestral population [<xref ref-type="bibr" rid="pgen.1009241.ref040">40</xref>], their values become fixed upon agreeing to estimate them in terms of the Most Recent Common Ancestor (MRCA) population, which has long been the choice for models of <italic>F</italic><sub>ST</sub> [<xref ref-type="bibr" rid="pgen.1009241.ref017">17</xref>, <xref ref-type="bibr" rid="pgen.1009241.ref023">23</xref>, <xref ref-type="bibr" rid="pgen.1009241.ref041">41</xref>] and kinship estimation from pedigrees [<xref ref-type="bibr" rid="pgen.1009241.ref042">42</xref>, <xref ref-type="bibr" rid="pgen.1009241.ref043">43</xref>] or markers [<xref ref-type="bibr" rid="pgen.1009241.ref012">12</xref>, <xref ref-type="bibr" rid="pgen.1009241.ref013">13</xref>].</p>
<p>Recent genome-wide studies have revealed that humans and other natural populations are structured in a complex manner that break the assumptions of the above estimators. Such complex population structures has been observed in several large human studies, such as the Human Genome Diversity Project [<xref ref-type="bibr" rid="pgen.1009241.ref044">44</xref>, <xref ref-type="bibr" rid="pgen.1009241.ref045">45</xref>], the 1000 Genomes Project [<xref ref-type="bibr" rid="pgen.1009241.ref046">46</xref>], Human Origins [<xref ref-type="bibr" rid="pgen.1009241.ref047">47</xref>–<xref ref-type="bibr" rid="pgen.1009241.ref049">49</xref>], and other contemporary [<xref ref-type="bibr" rid="pgen.1009241.ref050">50</xref>–<xref ref-type="bibr" rid="pgen.1009241.ref054">54</xref>] and archaic populations [<xref ref-type="bibr" rid="pgen.1009241.ref055">55</xref>, <xref ref-type="bibr" rid="pgen.1009241.ref056">56</xref>]. We have also demonstrated that the global human population has a complex kinship matrix and no independent subpopulations [<xref ref-type="bibr" rid="pgen.1009241.ref057">57</xref>–<xref ref-type="bibr" rid="pgen.1009241.ref059">59</xref>]. Therefore, there is a need for innovative approaches designed for complex population structures. To this end, we reveal the operating characteristics of these frequently-used <italic>F</italic><sub>ST</sub> and kinship estimators in the presence of arbitrary forms of structure, which leads to a new estimation strategy for <italic>F</italic><sub>ST</sub> and kinship.</p>
<p>Here, we study existing <italic>F</italic><sub>ST</sub> and kinship method-of-moments estimators in models that allow for arbitrary population structures (see <xref ref-type="fig" rid="pgen.1009241.g001">Fig 1</xref> for an overview of the results). First, in section <bold>The generalized <italic>F</italic><sub>ST</sub> for arbitrary population structures</bold> we present the generalized definition of <italic>F</italic><sub>ST</sub> for arbitrary population structures [<xref ref-type="bibr" rid="pgen.1009241.ref057">57</xref>]. In section <bold>The kinship and coancestry models</bold> we review the kinship model for genotype covariance [<xref ref-type="bibr" rid="pgen.1009241.ref001">1</xref>, <xref ref-type="bibr" rid="pgen.1009241.ref014">14</xref>] and the coancestry model for individual-specific allele frequencies [<xref ref-type="bibr" rid="pgen.1009241.ref057">57</xref>, <xref ref-type="bibr" rid="pgen.1009241.ref060">60</xref>, <xref ref-type="bibr" rid="pgen.1009241.ref061">61</xref>]. In section <bold>Assessing the accuracy of genome-wide ratio estimators</bold> we obtain new strong convergence results for a family of ratio estimators that includes the most common <italic>F</italic><sub>ST</sub> and kinship estimators. Next, we calculate the convergence values of these <italic>F</italic><sub>ST</sub> (section <bold><italic>F</italic><sub>ST</sub> estimation based on the independent subpopulations model</bold>) and kinship (section <bold>Characterizing a kinship estimator and its relationship to <italic>F</italic><sub>ST</sub></bold>) estimators under arbitrary population structures, where we find biases that are not present under their original assumptions about structure (panels “Indep. Subpop. <italic>F</italic><sub>ST</sub> Estimator” and “Existing Kinship Estimator” in <xref ref-type="fig" rid="pgen.1009241.g001">Fig 1</xref>). We characterize the limit of the standard kinship estimator, identifying complex biases or distortions, in agreement with recent work [<xref ref-type="bibr" rid="pgen.1009241.ref021">21</xref>, <xref ref-type="bibr" rid="pgen.1009241.ref062">62</xref>].</p>
<fig id="pgen.1009241.g001" position="float">
<object-id pub-id-type="doi">10.1371/journal.pgen.1009241.g001</object-id>
<label>Fig 1</label>
<caption>
<title>Accuracy of <italic>F</italic><sub>ST</sub> and kinship estimators: Overview of models and results.</title>
<p>Our analysis is based on the generalized <italic>F</italic><sub>ST</sub> definition (section <bold>The generalized <italic>F</italic><sub>ST</sub> for arbitrary population structures</bold>) and two parallel models: the “Coancestry Model” for individual-specific allele frequencies (<italic>π</italic><sub><italic>ij</italic></sub>), and the “Kinship Model” for genotypes (<italic>x</italic><sub><italic>ij</italic></sub>). The “Coancestry in Terms of Kinship” panel connects kinship (<inline-formula id="pgen.1009241.e003"><alternatives><graphic id="pgen.1009241.e003g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e003" xlink:type="simple"/><mml:math display="inline" id="M3"><mml:msubsup><mml:mi>φ</mml:mi><mml:mrow><mml:mi>j</mml:mi><mml:mi>k</mml:mi></mml:mrow><mml:mi>T</mml:mi></mml:msubsup></mml:math></alternatives></inline-formula>, <inline-formula id="pgen.1009241.e004"><alternatives><graphic id="pgen.1009241.e004g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e004" xlink:type="simple"/><mml:math display="inline" id="M4"><mml:msubsup><mml:mi>f</mml:mi><mml:mrow><mml:mi>j</mml:mi></mml:mrow><mml:mi>T</mml:mi></mml:msubsup></mml:math></alternatives></inline-formula>) and coancestry (<inline-formula id="pgen.1009241.e005"><alternatives><graphic id="pgen.1009241.e005g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e005" xlink:type="simple"/><mml:math display="inline" id="M5"><mml:msubsup><mml:mi>θ</mml:mi><mml:mrow><mml:mi>j</mml:mi><mml:mi>k</mml:mi></mml:mrow><mml:mi>T</mml:mi></mml:msubsup></mml:math></alternatives></inline-formula>) parameters (section <bold>The kinship and coancestry models</bold>). We use these models to study the accuracy of <italic>F</italic><sub>ST</sub> and kinship method-of-moment estimators under arbitrary population structures. The “Indep. Subpop. <italic>F</italic><sub>ST</sub> Estimator” panel shows the bias resulting from the misapplication of <italic>F</italic><sub>ST</sub> estimators for independent subpopulations (<inline-formula id="pgen.1009241.e006"><alternatives><graphic id="pgen.1009241.e006g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e006" xlink:type="simple"/><mml:math display="inline" id="M6"><mml:msubsup><mml:mover accent="true"><mml:mi>F</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mtext>ST</mml:mtext></mml:mrow><mml:mtext>indep</mml:mtext></mml:msubsup></mml:math></alternatives></inline-formula>) to arbitrary structures (section <bold><italic>F</italic><sub>ST</sub> estimation based on the independent subpopulations model</bold>), as calculated under the coancestry model. The “Existing Kinship Estimator” panel shows the bias in the standard kinship model estimator (<inline-formula id="pgen.1009241.e007"><alternatives><graphic id="pgen.1009241.e007g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e007" xlink:type="simple"/><mml:math display="inline" id="M7"><mml:msubsup><mml:mover accent="true"><mml:mi>φ</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mi>j</mml:mi><mml:mi>k</mml:mi></mml:mrow><mml:mrow><mml:mi>T</mml:mi><mml:mo>,</mml:mo><mml:mtext>std</mml:mtext></mml:mrow></mml:msubsup></mml:math></alternatives></inline-formula>) and its resulting plug-in <italic>F</italic><sub>ST</sub> estimator (<inline-formula id="pgen.1009241.e008"><alternatives><graphic id="pgen.1009241.e008g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e008" xlink:type="simple"/><mml:math display="inline" id="M8"><mml:msubsup><mml:mover accent="true"><mml:mi>F</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mtext>ST</mml:mtext></mml:mrow><mml:mtext>std</mml:mtext></mml:msubsup></mml:math></alternatives></inline-formula>; section <bold>Characterizing a kinship estimator and its relationship to <italic>F</italic><sub>ST</sub></bold>), as calculated under the kinship model. The “New Kinship Estimator” panel presents a new statistic <italic>A</italic><sub><italic>jk</italic></sub> that estimates kinship with a uniform bias, which together with a consistent estimator of its minimum value (<inline-formula id="pgen.1009241.e009"><alternatives><graphic id="pgen.1009241.e009g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e009" xlink:type="simple"/><mml:math display="inline" id="M9"><mml:msub><mml:mover accent="true"><mml:mi>A</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mtext>min</mml:mtext></mml:msub></mml:math></alternatives></inline-formula>) results in our new kinship (<inline-formula id="pgen.1009241.e010"><alternatives><graphic id="pgen.1009241.e010g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e010" xlink:type="simple"/><mml:math display="inline" id="M10"><mml:msubsup><mml:mover accent="true"><mml:mi>φ</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mi>j</mml:mi><mml:mi>k</mml:mi></mml:mrow><mml:mrow><mml:mi>T</mml:mi><mml:mo>,</mml:mo><mml:mtext>new</mml:mtext></mml:mrow></mml:msubsup></mml:math></alternatives></inline-formula>) and <italic>F</italic><sub>ST</sub> (<inline-formula id="pgen.1009241.e011"><alternatives><graphic id="pgen.1009241.e011g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e011" xlink:type="simple"/><mml:math display="inline" id="M11"><mml:msubsup><mml:mover accent="true"><mml:mi>F</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mtext>ST</mml:mtext></mml:mrow><mml:mtext>new</mml:mtext></mml:msubsup></mml:math></alternatives></inline-formula>) estimators, which are consistent under arbitrary population structure (section <bold>A new approach for kinship and <italic>F</italic><sub>ST</sub> estimation</bold>).</p>
</caption>
<graphic mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pgen.1009241.g001" xlink:type="simple"/>
</fig>
<p>In section <bold>A new approach for kinship and <italic>F</italic><sub>ST</sub> estimation</bold> we introduce a new approach for kinship and <italic>F</italic><sub>ST</sub> estimation for arbitrary population structures, and demonstrate the improved performance using a simple implementation of these estimators (panel “New Kinship Estimator” in <xref ref-type="fig" rid="pgen.1009241.g001">Fig 1</xref>). There are two key innovations. First, based on the method of moments, we derive a statistic that estimates kinship coefficients up to a shared unknown scaling factor. Second, we propose a new condition, the identification of unrelated individual pairs in the data, which yields the value of the unknown scaling factor and enables the consistent estimation of kinship matrices and <italic>F</italic><sub>ST</sub>. We present a simple implementation of this second estimator, based on taking the minimum average statistic value between subpopulations, which in section <bold>Simulations evaluating <italic>F</italic><sub>ST</sub> and kinship estimators</bold> is shown to perform well under some misspecification, namely in an admixture scenario that does not actually have subpopulations [<xref ref-type="bibr" rid="pgen.1009241.ref063">63</xref>–<xref ref-type="bibr" rid="pgen.1009241.ref065">65</xref>]. Elsewhere, we analyze the Human Origins and 1000 Genomes Project datasets with our novel kinship and <italic>F</italic><sub>ST</sub> estimation approach, where we demonstrate its coherence with the African Origins model, and illustrate the shortcomings of previous approaches in these complex data [<xref ref-type="bibr" rid="pgen.1009241.ref059">59</xref>]. In summary, we identify a new approach for unbiased estimation of <italic>F</italic><sub>ST</sub> and kinship, and we provide new estimators that are nearly unbiased.</p>
</sec>
<sec id="sec002" sec-type="results">
<title>Results</title>
<sec id="sec003">
<title>The generalized <italic>F</italic><sub>ST</sub> for arbitrary population structures</title>
<p>The existing <italic>F</italic><sub>ST</sub> definition requires individuals to belong to discrete, non-overlapping subpopulations, so it must be generalized in order to apply to arbitrary population structures (such as the admixture model with individual-specific ancestry proportions considered in our simulations). Our generalized <italic>F</italic><sub>ST</sub> can be understood as a two-step strategy: (1) we define <italic>F</italic><sub>ST</sub> on a per-individual basis, and (2) we define <italic>F</italic><sub>ST</sub> for a group of individuals as a weighted average of the per-individual <italic>F</italic><sub>ST</sub> values [<xref ref-type="bibr" rid="pgen.1009241.ref057">57</xref>].</p>
<p>The inbreeding coefficient <inline-formula id="pgen.1009241.e012"><alternatives><graphic id="pgen.1009241.e012g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e012" xlink:type="simple"/><mml:math display="inline" id="M12"><mml:msubsup><mml:mi>f</mml:mi><mml:mrow><mml:mi>j</mml:mi></mml:mrow><mml:mi>T</mml:mi></mml:msubsup></mml:math></alternatives></inline-formula> of an individual <italic>j</italic> relative to an ancestral population <italic>T</italic> is defined as the probability that the two alleles at a random locus are <italic>identical by descent</italic> (IBD) [<xref ref-type="bibr" rid="pgen.1009241.ref037">37</xref>]. Note that the ancestral population <italic>T</italic> determines what is IBD: only relationships since <italic>T</italic> count toward IBD. This <italic>total</italic> inbreeding coefficient (<inline-formula id="pgen.1009241.e013"><alternatives><graphic id="pgen.1009241.e013g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e013" xlink:type="simple"/><mml:math display="inline" id="M13"><mml:msubsup><mml:mi>f</mml:mi><mml:mrow><mml:mi>j</mml:mi></mml:mrow><mml:mi>T</mml:mi></mml:msubsup></mml:math></alternatives></inline-formula>) is the individual analog of Wright’s total inbreeding coefficient <italic>F</italic><sub>IT</sub>, the latter of which is the mean <inline-formula id="pgen.1009241.e014"><alternatives><graphic id="pgen.1009241.e014g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e014" xlink:type="simple"/><mml:math display="inline" id="M14"><mml:msubsup><mml:mi>f</mml:mi><mml:mrow><mml:mi>j</mml:mi></mml:mrow><mml:mi>T</mml:mi></mml:msubsup></mml:math></alternatives></inline-formula> over a group of individuals [<xref ref-type="bibr" rid="pgen.1009241.ref002">2</xref>]. Wright partitioned <italic>total</italic> inbreeding (<italic>F</italic><sub>IT</sub>) into <italic>local</italic> (<italic>F</italic><sub>IS</sub>) and <italic>structural</italic> (<italic>F</italic><sub>ST</sub>) coefficients defined by a subpopulation <italic>S</italic> that contains all individuals in question and evolved from the ancestral population <italic>T</italic>, so that <italic>F</italic><sub>IS</sub> is the inbreeding of individuals relative to <italic>S</italic> (as opposed to <italic>T</italic>) and <italic>F</italic><sub>ST</sub> is inbreeding of the subpopulation <italic>S</italic> relative to <italic>T</italic>, and these coefficients satisfy (1 − <italic>F</italic><sub>IT</sub>) = (1 − <italic>F</italic><sub>IS</sub>)(1 − <italic>F</italic><sub>ST</sub>) [<xref ref-type="bibr" rid="pgen.1009241.ref002">2</xref>]. In our generalized definitions for one individual <italic>j</italic>, we restrict the subpopulation of interest (<italic>S</italic>) to be <italic>L</italic><sub><italic>j</italic></sub>, called the local subpopulation of <italic>j</italic>, which is the most recent subpopulation from which <italic>j</italic> drew its alleles. In this case, <inline-formula id="pgen.1009241.e015"><alternatives><graphic id="pgen.1009241.e015g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e015" xlink:type="simple"/><mml:math display="inline" id="M15"><mml:msubsup><mml:mi>f</mml:mi><mml:mrow><mml:mi>j</mml:mi></mml:mrow><mml:msub><mml:mi>L</mml:mi><mml:mi>j</mml:mi></mml:msub></mml:msubsup></mml:math></alternatives></inline-formula> is the <italic>local</italic> inbreeding coefficient of <italic>j</italic> (always relative to its local subpopulation <italic>L</italic><sub><italic>j</italic></sub>), and <inline-formula id="pgen.1009241.e016"><alternatives><graphic id="pgen.1009241.e016g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e016" xlink:type="simple"/><mml:math display="inline" id="M16"><mml:msubsup><mml:mi>f</mml:mi><mml:mrow><mml:msub><mml:mi>L</mml:mi><mml:mi>j</mml:mi></mml:msub></mml:mrow><mml:mi>T</mml:mi></mml:msubsup></mml:math></alternatives></inline-formula> is the <italic>structural</italic> inbreeding coefficient of <italic>j</italic> (equal to the inbreeding of the subpopulation <italic>L</italic><sub><italic>j</italic></sub> relative to <italic>T</italic>), and being a special case of Wright’s equation, they also satisfy [<xref ref-type="bibr" rid="pgen.1009241.ref057">57</xref>]
<disp-formula id="pgen.1009241.e017"><alternatives><graphic id="pgen.1009241.e017g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e017" xlink:type="simple"/><mml:math display="block" id="M17"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="right"><mml:mrow><mml:mo>(</mml:mo><mml:mn>1</mml:mn><mml:mo>-</mml:mo><mml:msubsup><mml:mi>f</mml:mi><mml:mrow><mml:mi>j</mml:mi></mml:mrow><mml:mi>T</mml:mi></mml:msubsup><mml:mo>)</mml:mo><mml:mo>=</mml:mo><mml:mo>(</mml:mo><mml:mn>1</mml:mn><mml:mo>-</mml:mo><mml:msubsup><mml:mi>f</mml:mi><mml:mrow><mml:mi>j</mml:mi></mml:mrow><mml:msub><mml:mi>L</mml:mi><mml:mi>j</mml:mi></mml:msub></mml:msubsup><mml:mo>)</mml:mo><mml:mo>(</mml:mo><mml:mn>1</mml:mn><mml:mo>-</mml:mo><mml:msubsup><mml:mi>f</mml:mi><mml:mrow><mml:msub><mml:mi>L</mml:mi><mml:mi>j</mml:mi></mml:msub></mml:mrow><mml:mi>T</mml:mi></mml:msubsup><mml:mo>)</mml:mo><mml:mo>.</mml:mo></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives> <label>(1)</label></disp-formula></p>
<p>Now we discuss estimating the three quantities we just introduced. First, the total inbreeding coefficient (<inline-formula id="pgen.1009241.e018"><alternatives><graphic id="pgen.1009241.e018g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e018" xlink:type="simple"/><mml:math display="inline" id="M18"><mml:msubsup><mml:mi>f</mml:mi><mml:mrow><mml:mi>j</mml:mi></mml:mrow><mml:mi>T</mml:mi></mml:msubsup></mml:math></alternatives></inline-formula>) should be estimated from the variance of genotypes, using the practically unbiased approach we introduce in this work. Second, note that the local inbreeding coefficient (<inline-formula id="pgen.1009241.e019"><alternatives><graphic id="pgen.1009241.e019g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e019" xlink:type="simple"/><mml:math display="inline" id="M19"><mml:msubsup><mml:mi>f</mml:mi><mml:mrow><mml:mi>j</mml:mi></mml:mrow><mml:msub><mml:mi>L</mml:mi><mml:mi>j</mml:mi></mml:msub></mml:msubsup></mml:math></alternatives></inline-formula>) corresponds to (non-population) family relatedness, so it can be taken to be the inbreeding calculated from a pedigree if it is available [<xref ref-type="bibr" rid="pgen.1009241.ref042">42</xref>]. Note that estimation of the various inbreeding coefficients from pedigrees was the only approach available to Wright when he studied cattle and defined inbreeding and <italic>F</italic><sub>ST</sub> [<xref ref-type="bibr" rid="pgen.1009241.ref002">2</xref>, <xref ref-type="bibr" rid="pgen.1009241.ref037">37</xref>]. Alternatively, in the absence of pedigrees, local inbreeding can be estimated from inferred self-IBD blocks or unusually-large runs of homozygosity [<xref ref-type="bibr" rid="pgen.1009241.ref066">66</xref>–<xref ref-type="bibr" rid="pgen.1009241.ref068">68</xref>]. Lastly, since the structural inbreeding coefficient (<inline-formula id="pgen.1009241.e020"><alternatives><graphic id="pgen.1009241.e020g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e020" xlink:type="simple"/><mml:math display="inline" id="M20"><mml:msubsup><mml:mi>f</mml:mi><mml:mrow><mml:msub><mml:mi>L</mml:mi><mml:mi>j</mml:mi></mml:msub></mml:mrow><mml:mi>T</mml:mi></mml:msubsup></mml:math></alternatives></inline-formula>) is given by the previous two quantities (solving from <xref ref-type="disp-formula" rid="pgen.1009241.e017">Eq (1)</xref>) by
<disp-formula id="pgen.1009241.e021"><alternatives><graphic id="pgen.1009241.e021g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e021" xlink:type="simple"/><mml:math display="block" id="M21"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="right"><mml:mrow><mml:msubsup><mml:mi>f</mml:mi><mml:mrow><mml:msub><mml:mi>L</mml:mi><mml:mi>j</mml:mi></mml:msub></mml:mrow><mml:mi>T</mml:mi></mml:msubsup><mml:mo>=</mml:mo><mml:mfrac><mml:mrow><mml:msubsup><mml:mi>f</mml:mi><mml:mrow><mml:mi>j</mml:mi></mml:mrow><mml:mi>T</mml:mi></mml:msubsup><mml:mo>-</mml:mo><mml:msubsup><mml:mi>f</mml:mi><mml:mrow><mml:mi>j</mml:mi></mml:mrow><mml:msub><mml:mi>L</mml:mi><mml:mi>j</mml:mi></mml:msub></mml:msubsup></mml:mrow><mml:mrow><mml:mn>1</mml:mn><mml:mo>-</mml:mo><mml:msubsup><mml:mi>f</mml:mi><mml:mrow><mml:mi>j</mml:mi></mml:mrow><mml:msub><mml:mi>L</mml:mi><mml:mi>j</mml:mi></mml:msub></mml:msubsup></mml:mrow></mml:mfrac><mml:mo>,</mml:mo></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives> <label>(2)</label></disp-formula>
then we propose estimating <inline-formula id="pgen.1009241.e022"><alternatives><graphic id="pgen.1009241.e022g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e022" xlink:type="simple"/><mml:math display="inline" id="M22"><mml:msubsup><mml:mi>f</mml:mi><mml:mrow><mml:msub><mml:mi>L</mml:mi><mml:mi>j</mml:mi></mml:msub></mml:mrow><mml:mi>T</mml:mi></mml:msubsup></mml:math></alternatives></inline-formula> using this equation, from the above estimates of <inline-formula id="pgen.1009241.e023"><alternatives><graphic id="pgen.1009241.e023g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e023" xlink:type="simple"/><mml:math display="inline" id="M23"><mml:msubsup><mml:mi>f</mml:mi><mml:mrow><mml:mi>j</mml:mi></mml:mrow><mml:mi>T</mml:mi></mml:msubsup></mml:math></alternatives></inline-formula> and <inline-formula id="pgen.1009241.e024"><alternatives><graphic id="pgen.1009241.e024g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e024" xlink:type="simple"/><mml:math display="inline" id="M24"><mml:msubsup><mml:mi>f</mml:mi><mml:mrow><mml:mi>j</mml:mi></mml:mrow><mml:msub><mml:mi>L</mml:mi><mml:mi>j</mml:mi></mml:msub></mml:msubsup></mml:math></alternatives></inline-formula>.</p>
<p>As a toy example, suppose we estimate a total inbreeding coefficient of <inline-formula id="pgen.1009241.e025"><alternatives><graphic id="pgen.1009241.e025g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e025" xlink:type="simple"/><mml:math display="inline" id="M25"><mml:mrow><mml:msubsup><mml:mi>f</mml:mi><mml:mrow><mml:mi>j</mml:mi></mml:mrow><mml:mi>T</mml:mi></mml:msubsup><mml:mo>=</mml:mo><mml:mn>0</mml:mn><mml:mo>.</mml:mo><mml:mn>15</mml:mn></mml:mrow></mml:math></alternatives></inline-formula> for a given individual whose parents are first cousins, then the pedigree expectation for its local inbreeding is <inline-formula id="pgen.1009241.e026"><alternatives><graphic id="pgen.1009241.e026g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e026" xlink:type="simple"/><mml:math display="inline" id="M26"><mml:mrow><mml:msubsup><mml:mi>f</mml:mi><mml:mrow><mml:mi>j</mml:mi></mml:mrow><mml:msub><mml:mi>L</mml:mi><mml:mi>j</mml:mi></mml:msub></mml:msubsup><mml:mo>=</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:mn>16</mml:mn></mml:mfrac><mml:mo>=</mml:mo><mml:mn>0</mml:mn><mml:mo>.</mml:mo><mml:mn>0625</mml:mn></mml:mrow></mml:math></alternatives></inline-formula>, and the structural inbreeding (i.e. the <italic>F</italic><sub>ST</sub> of this individual) using <xref ref-type="disp-formula" rid="pgen.1009241.e021">Eq (2)</xref> is <inline-formula id="pgen.1009241.e027"><alternatives><graphic id="pgen.1009241.e027g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e027" xlink:type="simple"/><mml:math display="inline" id="M27"><mml:mrow><mml:msubsup><mml:mi>f</mml:mi><mml:mrow><mml:msub><mml:mi>L</mml:mi><mml:mi>j</mml:mi></mml:msub></mml:mrow><mml:mi>T</mml:mi></mml:msubsup><mml:mo>≈</mml:mo><mml:mn>0</mml:mn><mml:mo>.</mml:mo><mml:mn>093</mml:mn></mml:mrow></mml:math></alternatives></inline-formula>. However, if in the same example (<inline-formula id="pgen.1009241.e028"><alternatives><graphic id="pgen.1009241.e028g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e028" xlink:type="simple"/><mml:math display="inline" id="M28"><mml:mrow><mml:msubsup><mml:mi>f</mml:mi><mml:mrow><mml:mi>j</mml:mi></mml:mrow><mml:mi>T</mml:mi></mml:msubsup><mml:mo>=</mml:mo><mml:mn>0</mml:mn><mml:mo>.</mml:mo><mml:mn>15</mml:mn></mml:mrow></mml:math></alternatives></inline-formula>) the individual instead had parents who were second cousins, then <inline-formula id="pgen.1009241.e029"><alternatives><graphic id="pgen.1009241.e029g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e029" xlink:type="simple"/><mml:math display="inline" id="M29"><mml:mrow><mml:msubsup><mml:mi>f</mml:mi><mml:mrow><mml:mi>j</mml:mi></mml:mrow><mml:msub><mml:mi>L</mml:mi><mml:mi>j</mml:mi></mml:msub></mml:msubsup><mml:mo>=</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:mn>64</mml:mn></mml:mfrac><mml:mo>≈</mml:mo><mml:mn>0</mml:mn><mml:mo>.</mml:mo><mml:mn>0156</mml:mn></mml:mrow></mml:math></alternatives></inline-formula>, then the structural estimate becomes <inline-formula id="pgen.1009241.e030"><alternatives><graphic id="pgen.1009241.e030g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e030" xlink:type="simple"/><mml:math display="inline" id="M30"><mml:mrow><mml:msubsup><mml:mi>f</mml:mi><mml:mrow><mml:msub><mml:mi>L</mml:mi><mml:mi>j</mml:mi></mml:msub></mml:mrow><mml:mi>T</mml:mi></mml:msubsup><mml:mo>≈</mml:mo><mml:mn>0</mml:mn><mml:mo>.</mml:mo><mml:mn>137</mml:mn></mml:mrow></mml:math></alternatives></inline-formula>, which is much closer to the total inbreeding value. Thus, when total inbreeding estimates are much larger than local inbreeding estimates, correcting for the latter via <xref ref-type="disp-formula" rid="pgen.1009241.e021">Eq (2)</xref> may not change the numerical estimate of structural inbreeding by a meaningful amount. Conversely, as the local inbreeding coefficient is reduced exponentially with the degree of relatedness of the parents (<inline-formula id="pgen.1009241.e031"><alternatives><graphic id="pgen.1009241.e031g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e031" xlink:type="simple"/><mml:math display="inline" id="M31"><mml:mrow><mml:msubsup><mml:mi>f</mml:mi><mml:mrow><mml:mi>j</mml:mi></mml:mrow><mml:msub><mml:mi>L</mml:mi><mml:mi>j</mml:mi></mml:msub></mml:msubsup><mml:mo>=</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:msup><mml:mn>4</mml:mn><mml:mrow><mml:mi>n</mml:mi><mml:mo>+</mml:mo><mml:mn>1</mml:mn></mml:mrow></mml:msup></mml:mfrac></mml:mrow></mml:math></alternatives></inline-formula> for <italic>n</italic>-th cousins), and as local inbreeding is required to be recent (to exclude population-level inbreeding), then sufficiently-accurate estimates of structural inbreeding can be obtained by estimating non-zero local inbreeding only for individuals with the most related parent pairs (above a certain degree of relatedness).</p>
<p>We define the generalized <italic>F</italic><sub>ST</sub> across <italic>n</italic> individuals as the weighted average of the per-individual structural inbreeding coefficients (<italic>i.e.</italic>, individual <italic>F</italic><sub>ST</sub> values) [<xref ref-type="bibr" rid="pgen.1009241.ref057">57</xref>],
<disp-formula id="pgen.1009241.e032"><alternatives><graphic id="pgen.1009241.e032g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e032" xlink:type="simple"/><mml:math display="block" id="M32"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="right"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mtext>ST</mml:mtext></mml:msub><mml:mo>=</mml:mo><mml:munderover><mml:mo>∑</mml:mo><mml:mrow><mml:mi>j</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>n</mml:mi></mml:munderover><mml:msub><mml:mi>w</mml:mi><mml:mi>j</mml:mi></mml:msub><mml:msubsup><mml:mi>f</mml:mi><mml:mrow><mml:msub><mml:mi>L</mml:mi><mml:mi>j</mml:mi></mml:msub></mml:mrow><mml:mi>T</mml:mi></mml:msubsup><mml:mo>,</mml:mo></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives> <label>(3)</label></disp-formula>
where <italic>w</italic><sub><italic>j</italic></sub> is the weight of individual <italic>j</italic> and the weights are required to sum to one and be non-negative. The above is a straightforward generalization of Wright’s <italic>F</italic><sub>ST</sub>: if every individual <italic>j</italic> has <italic>L</italic><sub><italic>j</italic></sub> = <italic>S</italic> as its local subpopulation, then <xref ref-type="disp-formula" rid="pgen.1009241.e032">Eq (3)</xref> becomes <inline-formula id="pgen.1009241.e033"><alternatives><graphic id="pgen.1009241.e033g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e033" xlink:type="simple"/><mml:math display="inline" id="M33"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mtext>ST</mml:mtext></mml:msub><mml:mo>=</mml:mo><mml:msubsup><mml:mo>∑</mml:mo><mml:mrow><mml:mi>j</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>n</mml:mi></mml:msubsup><mml:msub><mml:mi>w</mml:mi><mml:mi>j</mml:mi></mml:msub><mml:msubsup><mml:mi>f</mml:mi><mml:mrow><mml:mi>S</mml:mi></mml:mrow><mml:mi>T</mml:mi></mml:msubsup><mml:mo>=</mml:mo><mml:msubsup><mml:mi>f</mml:mi><mml:mrow><mml:mi>S</mml:mi></mml:mrow><mml:mi>T</mml:mi></mml:msubsup></mml:mrow></mml:math></alternatives></inline-formula>, where <inline-formula id="pgen.1009241.e034"><alternatives><graphic id="pgen.1009241.e034g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e034" xlink:type="simple"/><mml:math display="inline" id="M34"><mml:msubsup><mml:mi>f</mml:mi><mml:mrow><mml:mi>S</mml:mi></mml:mrow><mml:mi>T</mml:mi></mml:msubsup></mml:math></alternatives></inline-formula> is the inbreeding coefficient of subpopulation <italic>S</italic> relative to <italic>T</italic>, so it has the same meaning as Wright’s <italic>F</italic><sub>ST</sub> (the exact weights here do not matter as long as <inline-formula id="pgen.1009241.e035"><alternatives><graphic id="pgen.1009241.e035g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e035" xlink:type="simple"/><mml:math display="inline" id="M35"><mml:mrow><mml:msubsup><mml:mo>∑</mml:mo><mml:mrow><mml:mi>j</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>n</mml:mi></mml:msubsup><mml:msub><mml:mi>w</mml:mi><mml:mi>j</mml:mi></mml:msub><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow></mml:math></alternatives></inline-formula>, as required). Moreover, if each individual <italic>j</italic> belongs to one of <italic>K</italic> subpopulations <italic>S</italic><sub><italic>u</italic></sub> (<italic>u</italic> ∈ {1, …, <italic>K</italic>}) and if subpopulations are weighted equally (<inline-formula id="pgen.1009241.e036"><alternatives><graphic id="pgen.1009241.e036g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e036" xlink:type="simple"/><mml:math display="inline" id="M36"><mml:mrow><mml:msub><mml:mo>∑</mml:mo><mml:mrow><mml:mi>j</mml:mi><mml:mo>∈</mml:mo><mml:msub><mml:mi>S</mml:mi><mml:mi>u</mml:mi></mml:msub></mml:mrow></mml:msub><mml:msub><mml:mi>w</mml:mi><mml:mi>j</mml:mi></mml:msub><mml:mo>=</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:mi>K</mml:mi></mml:mfrac></mml:mrow></mml:math></alternatives></inline-formula> for every <italic>S</italic><sub><italic>u</italic></sub>), then <xref ref-type="disp-formula" rid="pgen.1009241.e032">Eq (3)</xref> becomes <inline-formula id="pgen.1009241.e037"><alternatives><graphic id="pgen.1009241.e037g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e037" xlink:type="simple"/><mml:math display="inline" id="M37"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mtext>ST</mml:mtext></mml:msub><mml:mo>=</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:mi>K</mml:mi></mml:mfrac><mml:msubsup><mml:mo>∑</mml:mo><mml:mrow><mml:mi>u</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>K</mml:mi></mml:msubsup><mml:msubsup><mml:mi>f</mml:mi><mml:mrow><mml:msub><mml:mi>S</mml:mi><mml:mi>u</mml:mi></mml:msub></mml:mrow><mml:mi>T</mml:mi></mml:msubsup></mml:mrow></mml:math></alternatives></inline-formula>, so it equals the (unweighted) average subpopulation-specific <italic>F</italic><sub>ST</sub> (<italic>i.e.</italic>, <inline-formula id="pgen.1009241.e038"><alternatives><graphic id="pgen.1009241.e038g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e038" xlink:type="simple"/><mml:math display="inline" id="M38"><mml:msubsup><mml:mi>f</mml:mi><mml:mrow><mml:msub><mml:mi>S</mml:mi><mml:mi>u</mml:mi></mml:msub></mml:mrow><mml:mi>T</mml:mi></mml:msubsup></mml:math></alternatives></inline-formula>), which is the <italic>F</italic><sub>ST</sub> definition for multiple subpopulations prevalent in modern work [<xref ref-type="bibr" rid="pgen.1009241.ref004">4</xref>, <xref ref-type="bibr" rid="pgen.1009241.ref021">21</xref>, <xref ref-type="bibr" rid="pgen.1009241.ref023">23</xref>]. The last case illustrates the need for weights, which above downweights individuals that belong to subpopulations with greater numbers of observations. In general, weights allow adjustment for skewed or unbalanced samples. However, in complicated scenarios without subpopulations and no obvious sampling biases, for simplicity we recommend using uniform weights (<inline-formula id="pgen.1009241.e039"><alternatives><graphic id="pgen.1009241.e039g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e039" xlink:type="simple"/><mml:math display="inline" id="M39"><mml:mrow><mml:msub><mml:mi>w</mml:mi><mml:mi>j</mml:mi></mml:msub><mml:mo>=</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:mi>n</mml:mi></mml:mfrac></mml:mrow></mml:math></alternatives></inline-formula>) for the target generalized <italic>F</italic><sub>ST</sub>.</p>
<p>In terms of total and local inbreeding coefficients (using <xref ref-type="disp-formula" rid="pgen.1009241.e021">Eq (2)</xref>), the generalized <italic>F</italic><sub>ST</sub> equals
<disp-formula id="pgen.1009241.e040"><alternatives><graphic id="pgen.1009241.e040g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e040" xlink:type="simple"/><mml:math display="block" id="M40"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="right"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mtext>ST</mml:mtext></mml:msub><mml:mo>=</mml:mo><mml:munderover><mml:mo>∑</mml:mo><mml:mrow><mml:mi>j</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>n</mml:mi></mml:munderover><mml:msub><mml:mi>w</mml:mi><mml:mi>j</mml:mi></mml:msub><mml:mfrac><mml:mrow><mml:msubsup><mml:mi>f</mml:mi><mml:mrow><mml:mi>j</mml:mi></mml:mrow><mml:mi>T</mml:mi></mml:msubsup><mml:mo>-</mml:mo><mml:msubsup><mml:mi>f</mml:mi><mml:mrow><mml:mi>j</mml:mi></mml:mrow><mml:msub><mml:mi>L</mml:mi><mml:mi>j</mml:mi></mml:msub></mml:msubsup></mml:mrow><mml:mrow><mml:mn>1</mml:mn><mml:mo>-</mml:mo><mml:msubsup><mml:mi>f</mml:mi><mml:mrow><mml:mi>j</mml:mi></mml:mrow><mml:msub><mml:mi>L</mml:mi><mml:mi>j</mml:mi></mml:msub></mml:msubsup></mml:mrow></mml:mfrac><mml:mo>,</mml:mo></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives></disp-formula>
which immediately suggests the estimation strategy when estimates of the total and local inbreeding coefficients are available. For simplicity, in the remainder of this work we shall consider only locally-outbred individuals (<inline-formula id="pgen.1009241.e041"><alternatives><graphic id="pgen.1009241.e041g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e041" xlink:type="simple"/><mml:math display="inline" id="M41"><mml:mrow><mml:msubsup><mml:mi>f</mml:mi><mml:mrow><mml:mi>j</mml:mi></mml:mrow><mml:msub><mml:mi>L</mml:mi><mml:mi>j</mml:mi></mml:msub></mml:msubsup><mml:mo>=</mml:mo><mml:mn>0</mml:mn></mml:mrow></mml:math></alternatives></inline-formula> for all <italic>j</italic>), for which the generalized <italic>F</italic><sub>ST</sub> simply equals the weighted mean total inbreeding coefficient:
<disp-formula id="pgen.1009241.e042"><alternatives><graphic id="pgen.1009241.e042g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e042" xlink:type="simple"/><mml:math display="block" id="M42"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="right"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mtext>ST</mml:mtext></mml:msub><mml:mo>=</mml:mo><mml:munderover><mml:mo>∑</mml:mo><mml:mrow><mml:mi>j</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>n</mml:mi></mml:munderover><mml:msub><mml:mi>w</mml:mi><mml:mi>j</mml:mi></mml:msub><mml:msubsup><mml:mi>f</mml:mi><mml:mrow><mml:mi>j</mml:mi></mml:mrow><mml:mi>T</mml:mi></mml:msubsup><mml:mo>.</mml:mo></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives> <label>(4)</label></disp-formula>
This greatly simplifies our discussion of bias for all of the <italic>F</italic><sub>ST</sub> estimators we analyzed; determining the statistical properties of local inbreeding estimators is beyond the scope of this work. Moreover, the assumption of locally-outbred individuals is satisfied in all of the simulations presented in this work.</p>
</sec>
<sec id="sec004">
<title>The kinship and coancestry models</title>
<p>The generalized <italic>F</italic><sub>ST</sub> above is given solely in terms of inbreeding coefficients. In order to establish our results and framework, it is necessary to consider kinship coefficients as well. The kinship coefficient is the extension of the inbreeding coefficient for a pair of individuals: the kinship coefficient <inline-formula id="pgen.1009241.e043"><alternatives><graphic id="pgen.1009241.e043g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e043" xlink:type="simple"/><mml:math display="inline" id="M43"><mml:msubsup><mml:mi>φ</mml:mi><mml:mrow><mml:mi>j</mml:mi><mml:mi>k</mml:mi></mml:mrow><mml:mi>T</mml:mi></mml:msubsup></mml:math></alternatives></inline-formula> of two individuals <italic>j</italic> and <italic>k</italic> relative to an ancestral population <italic>T</italic> is the probability that two alleles, chosen at random from each individual at a random locus, are IBD [<xref ref-type="bibr" rid="pgen.1009241.ref001">1</xref>]. Note that the self-kinship coefficient is related to the inbreeding coefficient by <inline-formula id="pgen.1009241.e044"><alternatives><graphic id="pgen.1009241.e044g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e044" xlink:type="simple"/><mml:math display="inline" id="M44"><mml:mrow><mml:msubsup><mml:mi>φ</mml:mi><mml:mrow><mml:mi>j</mml:mi><mml:mi>j</mml:mi></mml:mrow><mml:mi>T</mml:mi></mml:msubsup><mml:mo>=</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:mn>2</mml:mn></mml:mfrac><mml:mo>(</mml:mo><mml:mn>1</mml:mn><mml:mo>+</mml:mo><mml:msubsup><mml:mi>f</mml:mi><mml:mrow><mml:mi>j</mml:mi></mml:mrow><mml:mi>T</mml:mi></mml:msubsup><mml:mo>)</mml:mo></mml:mrow></mml:math></alternatives></inline-formula> [<xref ref-type="bibr" rid="pgen.1009241.ref016">16</xref>].</p>
<p>Kinship coefficients determine the covariance structure of genotypes, which is the key to estimating kinship and <italic>F</italic><sub>ST</sub> from genotype data. We shall concentrate on biallelic variants, which include single-nucleotide polymorphisms, and are the dominant data from genotyping microarrays and whole-genome sequencing studies. We shall also restrict our attention to diploid organisms in this present work. Genotypes are encoded into variables <italic>x</italic><sub><italic>ij</italic></sub> for each locus <italic>i</italic> and individual <italic>j</italic> that count the number of alleles (dosage) of a given reference type, so for diploid organisms <italic>x</italic><sub><italic>ij</italic></sub> = 2 is homozygous for the reference allele, <italic>x</italic><sub><italic>ij</italic></sub> = 0 is homozygous for the alternative allele, and <italic>x</italic><sub><italic>ij</italic></sub> = 1 is heterozygous. Based on the definition of the IBD probabilities, the kinship model determines the mean and covariance structure of the genotype random variables at neutral loci [<xref ref-type="bibr" rid="pgen.1009241.ref001">1</xref>, <xref ref-type="bibr" rid="pgen.1009241.ref002">2</xref>, <xref ref-type="bibr" rid="pgen.1009241.ref014">14</xref>, <xref ref-type="bibr" rid="pgen.1009241.ref016">16</xref>, <xref ref-type="bibr" rid="pgen.1009241.ref037">37</xref>]:
<disp-formula id="pgen.1009241.e045"><alternatives><graphic id="pgen.1009241.e045g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e045" xlink:type="simple"/><mml:math display="block" id="M45"><mml:mtable equalcolumns="true" equalrows="true"><mml:mtr><mml:mtd columnalign="right"><mml:mrow><mml:mtext>E</mml:mtext><mml:mo stretchy="false">[</mml:mo><mml:msub><mml:mi>x</mml:mi><mml:mrow><mml:mi>i</mml:mi><mml:mi>j</mml:mi></mml:mrow></mml:msub><mml:mo>|</mml:mo><mml:mi>T</mml:mi><mml:mo stretchy="false">]</mml:mo></mml:mrow></mml:mtd><mml:mtd columnalign="left"><mml:mrow><mml:mo>=</mml:mo><mml:mn>2</mml:mn><mml:msubsup><mml:mi>p</mml:mi><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup><mml:mo>,</mml:mo></mml:mrow></mml:mtd></mml:mtr><mml:mtr><mml:mtd columnalign="right"><mml:mrow><mml:mtext>Cov</mml:mtext><mml:mo stretchy="false">(</mml:mo><mml:msub><mml:mi>x</mml:mi><mml:mrow><mml:mi>i</mml:mi><mml:mi>j</mml:mi></mml:mrow></mml:msub><mml:mo>,</mml:mo><mml:msub><mml:mi>x</mml:mi><mml:mrow><mml:mi>i</mml:mi><mml:mi>k</mml:mi></mml:mrow></mml:msub><mml:mo>|</mml:mo><mml:mi>T</mml:mi><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:mtd><mml:mtd columnalign="left"><mml:mrow><mml:mo>=</mml:mo><mml:mn>4</mml:mn><mml:msubsup><mml:mi>p</mml:mi><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup><mml:mo>(</mml:mo><mml:mrow><mml:mn>1</mml:mn><mml:mo>−</mml:mo><mml:msubsup><mml:mi>p</mml:mi><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup></mml:mrow><mml:mo>)</mml:mo><mml:msubsup><mml:mi>φ</mml:mi><mml:mrow><mml:mi>j</mml:mi><mml:mi>k</mml:mi></mml:mrow><mml:mi>T</mml:mi></mml:msubsup><mml:mo>,</mml:mo></mml:mrow></mml:mtd></mml:mtr> </mml:mtable></mml:math></alternatives> <label>(5)</label></disp-formula>
where <inline-formula id="pgen.1009241.e046"><alternatives><graphic id="pgen.1009241.e046g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e046" xlink:type="simple"/><mml:math display="inline" id="M46"><mml:msubsup><mml:mi>p</mml:mi><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup></mml:math></alternatives></inline-formula> is the allele frequency at locus <italic>i</italic> in the ancestral population <italic>T</italic> and <inline-formula id="pgen.1009241.e047"><alternatives><graphic id="pgen.1009241.e047g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e047" xlink:type="simple"/><mml:math display="inline" id="M47"><mml:mrow><mml:mn>0</mml:mn><mml:mo>&lt;</mml:mo><mml:msubsup><mml:mi>p</mml:mi><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup><mml:mo>&lt;</mml:mo><mml:mn>1</mml:mn></mml:mrow></mml:math></alternatives></inline-formula>.</p>
<p>The coancestry model resembles the kinship model, but it is formulated in terms of allele frequencies, which simplifies our analysis of <italic>F</italic><sub>ST</sub> estimators for subpopulations as well as yielding kinship coefficients under the admixture model we simulate from in this work. Let <italic>π</italic><sub><italic>ij</italic></sub> be the <italic>individual-specific allele frequency</italic> (IAF) at locus <italic>i</italic> for individual <italic>j</italic>, which is a real number between zero and one [<xref ref-type="bibr" rid="pgen.1009241.ref060">60</xref>, <xref ref-type="bibr" rid="pgen.1009241.ref061">61</xref>]. Our coancestry model assumes that [<xref ref-type="bibr" rid="pgen.1009241.ref057">57</xref>]
<disp-formula id="pgen.1009241.e048"><alternatives><graphic id="pgen.1009241.e048g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e048" xlink:type="simple"/><mml:math display="block" id="M48"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="right"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="right"><mml:mrow><mml:mo form="prefix">E</mml:mo><mml:mo>[</mml:mo><mml:msub><mml:mi>π</mml:mi><mml:mrow><mml:mi>i</mml:mi><mml:mi>j</mml:mi></mml:mrow></mml:msub><mml:mo>|</mml:mo><mml:mi>T</mml:mi><mml:mo>]</mml:mo></mml:mrow></mml:mtd><mml:mtd columnalign="left"><mml:mrow><mml:mo>=</mml:mo><mml:msubsup><mml:mi>p</mml:mi><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup><mml:mo>,</mml:mo></mml:mrow></mml:mtd></mml:mtr><mml:mtr><mml:mtd columnalign="right"><mml:mrow><mml:mo form="prefix">Cov</mml:mo><mml:mo>(</mml:mo><mml:msub><mml:mi>π</mml:mi><mml:mrow><mml:mi>i</mml:mi><mml:mi>j</mml:mi></mml:mrow></mml:msub><mml:mo>,</mml:mo><mml:msub><mml:mi>π</mml:mi><mml:mrow><mml:mi>i</mml:mi><mml:mi>k</mml:mi></mml:mrow></mml:msub><mml:mo>|</mml:mo><mml:mi>T</mml:mi><mml:mo>)</mml:mo></mml:mrow></mml:mtd><mml:mtd columnalign="left"><mml:mrow><mml:mo>=</mml:mo><mml:msubsup><mml:mi>p</mml:mi><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup><mml:mo>(</mml:mo><mml:mn>1</mml:mn><mml:mo>-</mml:mo><mml:msubsup><mml:mi>p</mml:mi><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup><mml:mo>)</mml:mo><mml:msubsup><mml:mi>θ</mml:mi><mml:mrow><mml:mi>j</mml:mi><mml:mi>k</mml:mi></mml:mrow><mml:mi>T</mml:mi></mml:msubsup><mml:mo>,</mml:mo></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives> <label>(6)</label></disp-formula>
where <inline-formula id="pgen.1009241.e049"><alternatives><graphic id="pgen.1009241.e049g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e049" xlink:type="simple"/><mml:math display="inline" id="M49"><mml:msubsup><mml:mi>θ</mml:mi><mml:mrow><mml:mi>j</mml:mi><mml:mi>k</mml:mi></mml:mrow><mml:mi>T</mml:mi></mml:msubsup></mml:math></alternatives></inline-formula> is the coancestry coefficient between individuals <italic>j</italic> and <italic>k</italic> relative to the ancestral population <italic>T</italic>. This model is inspired by coancestry models for subpopulations common in the <italic>F</italic><sub>ST</sub> literature [<xref ref-type="bibr" rid="pgen.1009241.ref004">4</xref>, <xref ref-type="bibr" rid="pgen.1009241.ref005">5</xref>, <xref ref-type="bibr" rid="pgen.1009241.ref021">21</xref>, <xref ref-type="bibr" rid="pgen.1009241.ref023">23</xref>], and exactly equals those models when subpopulation sizes go to infinity, in which case <italic>j</italic> and <italic>k</italic> index subpopulations rather than individuals, and <italic>π</italic><sub><italic>ij</italic></sub> is interpreted as the true allele frequency at locus <italic>i</italic> for subpopulation <italic>j</italic>.</p>
<p>The coancestry model connects to the kinship model under the additional assumption that the alleles of an individual <italic>j</italic> are drawn independently from its IAF,
<disp-formula id="pgen.1009241.e050"><alternatives><graphic id="pgen.1009241.e050g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e050" xlink:type="simple"/><mml:math display="block" id="M50"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="right"><mml:mrow><mml:msub><mml:mi>x</mml:mi><mml:mrow><mml:mi>i</mml:mi><mml:mi>j</mml:mi></mml:mrow></mml:msub><mml:mrow><mml:mo>|</mml:mo></mml:mrow><mml:msub><mml:mi>π</mml:mi><mml:mrow><mml:mi>i</mml:mi><mml:mi>j</mml:mi></mml:mrow></mml:msub><mml:mo>∼</mml:mo><mml:mtext>Binomial</mml:mtext><mml:mrow><mml:mo>(</mml:mo><mml:mn>2</mml:mn><mml:mo>,</mml:mo><mml:msub><mml:mi>π</mml:mi><mml:mrow><mml:mi>i</mml:mi><mml:mi>j</mml:mi></mml:mrow></mml:msub><mml:mo>)</mml:mo></mml:mrow><mml:mo>.</mml:mo></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives> <label>(7)</label></disp-formula>
In this case, marginalizing the intermediate IAF random variables (<italic>π</italic><sub><italic>ij</italic></sub>) and matching the resulting genotype moments results in the following equivalence [<xref ref-type="bibr" rid="pgen.1009241.ref057">57</xref>]:
<disp-formula id="pgen.1009241.e051"><alternatives><graphic id="pgen.1009241.e051g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e051" xlink:type="simple"/><mml:math display="block" id="M51"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="right"><mml:mrow><mml:msubsup><mml:mi>θ</mml:mi><mml:mrow><mml:mi>j</mml:mi><mml:mi>k</mml:mi></mml:mrow><mml:mi>T</mml:mi></mml:msubsup><mml:mo>=</mml:mo><mml:mo>{</mml:mo><mml:mtable><mml:mtr><mml:mtd columnalign="left"><mml:msubsup><mml:mi>f</mml:mi><mml:mrow><mml:mi>j</mml:mi></mml:mrow><mml:mi>T</mml:mi></mml:msubsup></mml:mtd><mml:mtd columnalign="left"><mml:mrow><mml:mtext>if</mml:mtext><mml:mspace width="1em"/><mml:mi>j</mml:mi><mml:mo>=</mml:mo><mml:mi>k</mml:mi><mml:mo>,</mml:mo></mml:mrow></mml:mtd></mml:mtr><mml:mtr><mml:mtd columnalign="left"><mml:msubsup><mml:mi>φ</mml:mi><mml:mrow><mml:mi>j</mml:mi><mml:mi>k</mml:mi></mml:mrow><mml:mi>T</mml:mi></mml:msubsup></mml:mtd><mml:mtd columnalign="left"><mml:mrow><mml:mtext>if</mml:mtext><mml:mspace width="1em"/><mml:mi>j</mml:mi><mml:mo>≠</mml:mo><mml:mi>k</mml:mi><mml:mo>.</mml:mo></mml:mrow></mml:mtd></mml:mtr></mml:mtable><mml:mo/></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives> <label>(8)</label></disp-formula>
The coancestry coefficient equals the kinship coefficient between two different individuals, but the self-coancestry coefficient equals the inbreeding coefficient (rather than the self-kinship coefficient). However, since in the coancestry model alleles are drawn independently conditional on the IAF in <xref ref-type="disp-formula" rid="pgen.1009241.e050">Eq (7)</xref>, then the only structure present is the population structure, so these coancestry models cannot generate family structures, unlike the more general kinship model that also encompasses pedigrees. Therefore, despite <xref ref-type="disp-formula" rid="pgen.1009241.e051">Eq (8)</xref>, the kinship and coancestry are not equivalent models except under the more restrictive assumptions of the coancestry model. Thus, individuals drawn from this model are always locally-outbred, so <inline-formula id="pgen.1009241.e052"><alternatives><graphic id="pgen.1009241.e052g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e052" xlink:type="simple"/><mml:math display="inline" id="M52"><mml:mrow><mml:msubsup><mml:mi>θ</mml:mi><mml:mrow><mml:mi>j</mml:mi><mml:mi>j</mml:mi></mml:mrow><mml:mi>T</mml:mi></mml:msubsup><mml:mo>=</mml:mo><mml:msubsup><mml:mi>f</mml:mi><mml:mrow><mml:msub><mml:mi>L</mml:mi><mml:mi>j</mml:mi></mml:msub></mml:mrow><mml:mi>T</mml:mi></mml:msubsup></mml:mrow></mml:math></alternatives></inline-formula> also equals the structural inbreeding coefficient, and the generalized <italic>F</italic><sub>ST</sub> under the coancestry model is therefore
<disp-formula id="pgen.1009241.e053"><alternatives><graphic id="pgen.1009241.e053g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e053" xlink:type="simple"/><mml:math display="block" id="M53"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="right"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mtext>ST</mml:mtext></mml:msub><mml:mo>=</mml:mo><mml:munderover><mml:mo>∑</mml:mo><mml:mrow><mml:mi>j</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>n</mml:mi></mml:munderover><mml:msub><mml:mi>w</mml:mi><mml:mi>j</mml:mi></mml:msub><mml:msubsup><mml:mi>θ</mml:mi><mml:mrow><mml:mi>j</mml:mi><mml:mi>j</mml:mi></mml:mrow><mml:mi>T</mml:mi></mml:msubsup><mml:mo>,</mml:mo></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives> <label>(9)</label></disp-formula>
which also generalizes previous definitions of <italic>F</italic><sub>ST</sub> under coancestry for subpopulations [<xref ref-type="bibr" rid="pgen.1009241.ref004">4</xref>, <xref ref-type="bibr" rid="pgen.1009241.ref005">5</xref>, <xref ref-type="bibr" rid="pgen.1009241.ref021">21</xref>, <xref ref-type="bibr" rid="pgen.1009241.ref023">23</xref>]. The kinship and coancestry models, and their connection, is included in the overview <xref ref-type="fig" rid="pgen.1009241.g001">Fig 1</xref>.</p>
</sec>
<sec id="sec005">
<title>Assessing the accuracy of genome-wide ratio estimators</title>
<p>In this section we change gears to focus on theoretical convergence properties of two broad estimator families. The resulting theory will be applied repeatedly to various <italic>F</italic><sub>ST</sub> and kinship estimators of interest in later sections.</p>
<p>Many <italic>F</italic><sub>ST</sub> and kinship coefficient method-of-moments estimators are <italic>ratio estimators</italic>, a general class of estimators that tends to be biased and to have no closed-form expectation [<xref ref-type="bibr" rid="pgen.1009241.ref069">69</xref>]. In the <italic>F</italic><sub>ST</sub> literature, the expectation of a ratio is frequently approximated with a ratio of expectations [<xref ref-type="bibr" rid="pgen.1009241.ref004">4</xref>, <xref ref-type="bibr" rid="pgen.1009241.ref017">17</xref>, <xref ref-type="bibr" rid="pgen.1009241.ref023">23</xref>]. Specifically, ratio estimators are often called “unbiased” if the ratio of expectations is unbiased, even though the ratio estimator itself may be biased [<xref ref-type="bibr" rid="pgen.1009241.ref069">69</xref>]. Here we characterize the behavior of two ratio estimator families calculated from genome-wide data, known as “ratio-of-means” and “mean-of-ratios” estimators [<xref ref-type="bibr" rid="pgen.1009241.ref023">23</xref>], detailing conditions where the previous approximation is justified and providing additional criteria to assess the accuracy of such estimators.</p>
<sec id="sec006">
<title>Ratio estimators</title>
<p>The general problem of forming ratio estimators involves random variables <italic>a</italic><sub><italic>i</italic></sub> and <italic>b</italic><sub><italic>i</italic></sub> calculated from genotypes at each locus <italic>i</italic>, such that E[<italic>a</italic><sub><italic>i</italic></sub>] = <italic>Ac</italic><sub><italic>i</italic></sub> and E[<italic>b</italic><sub><italic>i</italic></sub>] = <italic>Bc</italic><sub><italic>i</italic></sub> and the goal is to estimate <inline-formula id="pgen.1009241.e054"><alternatives><graphic id="pgen.1009241.e054g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e054" xlink:type="simple"/><mml:math display="inline" id="M54"><mml:mfrac><mml:mi>A</mml:mi><mml:mi>B</mml:mi></mml:mfrac></mml:math></alternatives></inline-formula>. <italic>A</italic> and <italic>B</italic> are constants shared across loci (given by <italic>F</italic><sub>ST</sub> or <inline-formula id="pgen.1009241.e055"><alternatives><graphic id="pgen.1009241.e055g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e055" xlink:type="simple"/><mml:math display="inline" id="M55"><mml:msubsup><mml:mi>φ</mml:mi><mml:mrow><mml:mi>j</mml:mi><mml:mi>k</mml:mi></mml:mrow><mml:mi>T</mml:mi></mml:msubsup></mml:math></alternatives></inline-formula>), while <italic>c</italic><sub><italic>i</italic></sub> depends on the ancestral allele frequency <inline-formula id="pgen.1009241.e056"><alternatives><graphic id="pgen.1009241.e056g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e056" xlink:type="simple"/><mml:math display="inline" id="M56"><mml:msubsup><mml:mi>p</mml:mi><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup></mml:math></alternatives></inline-formula> and varies per locus. The problem is that the single-locus estimator <inline-formula id="pgen.1009241.e057"><alternatives><graphic id="pgen.1009241.e057g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e057" xlink:type="simple"/><mml:math display="inline" id="M57"><mml:mfrac><mml:msub><mml:mi>a</mml:mi><mml:mi>i</mml:mi></mml:msub><mml:msub><mml:mi>b</mml:mi><mml:mi>i</mml:mi></mml:msub></mml:mfrac></mml:math></alternatives></inline-formula> is biased, since <inline-formula id="pgen.1009241.e058"><alternatives><graphic id="pgen.1009241.e058g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e058" xlink:type="simple"/><mml:math display="inline" id="M58"><mml:mrow><mml:mo form="prefix">E</mml:mo><mml:mo>[</mml:mo><mml:mfrac><mml:msub><mml:mi>a</mml:mi><mml:mi>i</mml:mi></mml:msub><mml:msub><mml:mi>b</mml:mi><mml:mi>i</mml:mi></mml:msub></mml:mfrac><mml:mo>]</mml:mo><mml:mo>≠</mml:mo><mml:mfrac><mml:mrow><mml:mo form="prefix">E</mml:mo><mml:mo>[</mml:mo><mml:msub><mml:mi>a</mml:mi><mml:mi>i</mml:mi></mml:msub><mml:mo>]</mml:mo></mml:mrow><mml:mrow><mml:mo form="prefix">E</mml:mo><mml:mo>[</mml:mo><mml:msub><mml:mi>b</mml:mi><mml:mi>i</mml:mi></mml:msub><mml:mo>]</mml:mo></mml:mrow></mml:mfrac><mml:mo>=</mml:mo><mml:mfrac><mml:mi>A</mml:mi><mml:mi>B</mml:mi></mml:mfrac></mml:mrow></mml:math></alternatives></inline-formula>, which applies to ratio estimators in general [<xref ref-type="bibr" rid="pgen.1009241.ref069">69</xref>]. Below we study two estimator families that combine large numbers of loci to better estimate <inline-formula id="pgen.1009241.e059"><alternatives><graphic id="pgen.1009241.e059g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e059" xlink:type="simple"/><mml:math display="inline" id="M59"><mml:mfrac><mml:mi>A</mml:mi><mml:mi>B</mml:mi></mml:mfrac></mml:math></alternatives></inline-formula>.</p>
</sec>
<sec id="sec007">
<title>Convergence</title>
<p>The solution we recommend is the “ratio-of-means” estimator <inline-formula id="pgen.1009241.e060"><alternatives><graphic id="pgen.1009241.e060g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e060" xlink:type="simple"/><mml:math display="inline" id="M60"><mml:mfrac><mml:msub><mml:mover accent="true"><mml:mi>A</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>m</mml:mi></mml:msub><mml:msub><mml:mover accent="true"><mml:mi>B</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>m</mml:mi></mml:msub></mml:mfrac></mml:math></alternatives></inline-formula>, where <inline-formula id="pgen.1009241.e061"><alternatives><graphic id="pgen.1009241.e061g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e061" xlink:type="simple"/><mml:math display="inline" id="M61"><mml:mrow><mml:msub><mml:mover accent="true"><mml:mi>A</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>m</mml:mi></mml:msub><mml:mo>=</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:mi>m</mml:mi></mml:mfrac><mml:msubsup><mml:mo>∑</mml:mo><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>m</mml:mi></mml:msubsup><mml:msub><mml:mi>a</mml:mi><mml:mi>i</mml:mi></mml:msub></mml:mrow></mml:math></alternatives></inline-formula>, and <inline-formula id="pgen.1009241.e062"><alternatives><graphic id="pgen.1009241.e062g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e062" xlink:type="simple"/><mml:math display="inline" id="M62"><mml:mrow><mml:msub><mml:mover accent="true"><mml:mi>B</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>m</mml:mi></mml:msub><mml:mo>=</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:mi>m</mml:mi></mml:mfrac><mml:msubsup><mml:mo>∑</mml:mo><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>m</mml:mi></mml:msubsup><mml:msub><mml:mi>b</mml:mi><mml:mi>i</mml:mi></mml:msub></mml:mrow></mml:math></alternatives></inline-formula>, which is common for <italic>F</italic><sub>ST</sub> estimators [<xref ref-type="bibr" rid="pgen.1009241.ref004">4</xref>, <xref ref-type="bibr" rid="pgen.1009241.ref017">17</xref>, <xref ref-type="bibr" rid="pgen.1009241.ref019">19</xref>, <xref ref-type="bibr" rid="pgen.1009241.ref023">23</xref>, <xref ref-type="bibr" rid="pgen.1009241.ref070">70</xref>]. Note that <inline-formula id="pgen.1009241.e063"><alternatives><graphic id="pgen.1009241.e063g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e063" xlink:type="simple"/><mml:math display="inline" id="M63"><mml:mrow><mml:mo form="prefix">E</mml:mo><mml:mrow><mml:mo>[</mml:mo><mml:msub><mml:mover accent="true"><mml:mi>A</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>m</mml:mi></mml:msub><mml:mo>]</mml:mo></mml:mrow><mml:mo>=</mml:mo><mml:mi>A</mml:mi><mml:msub><mml:mover accent="true"><mml:mi>c</mml:mi><mml:mo>¯</mml:mo></mml:mover><mml:mi>m</mml:mi></mml:msub></mml:mrow></mml:math></alternatives></inline-formula> and <inline-formula id="pgen.1009241.e064"><alternatives><graphic id="pgen.1009241.e064g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e064" xlink:type="simple"/><mml:math display="inline" id="M64"><mml:mrow><mml:mo form="prefix">E</mml:mo><mml:mrow><mml:mo>[</mml:mo><mml:msub><mml:mover accent="true"><mml:mi>B</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>m</mml:mi></mml:msub><mml:mo>]</mml:mo></mml:mrow><mml:mo>=</mml:mo><mml:mi>B</mml:mi><mml:msub><mml:mover accent="true"><mml:mi>c</mml:mi><mml:mo>¯</mml:mo></mml:mover><mml:mi>m</mml:mi></mml:msub></mml:mrow></mml:math></alternatives></inline-formula>, where <inline-formula id="pgen.1009241.e065"><alternatives><graphic id="pgen.1009241.e065g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e065" xlink:type="simple"/><mml:math display="inline" id="M65"><mml:mrow><mml:msub><mml:mover accent="true"><mml:mi>c</mml:mi><mml:mo>¯</mml:mo></mml:mover><mml:mi>m</mml:mi></mml:msub><mml:mo>=</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:mi>m</mml:mi></mml:mfrac><mml:msubsup><mml:mo>∑</mml:mo><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>m</mml:mi></mml:msubsup><mml:msub><mml:mi>c</mml:mi><mml:mi>i</mml:mi></mml:msub></mml:mrow></mml:math></alternatives></inline-formula>. We will assume bounded terms (|<italic>a</italic><sub><italic>i</italic></sub>|, |<italic>b</italic><sub><italic>i</italic></sub>| ≤ <italic>C</italic> for some finite <italic>C</italic>), a convergent <inline-formula id="pgen.1009241.e066"><alternatives><graphic id="pgen.1009241.e066g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e066" xlink:type="simple"/><mml:math display="inline" id="M66"><mml:mrow><mml:msub><mml:mover accent="true"><mml:mi>c</mml:mi><mml:mo>¯</mml:mo></mml:mover><mml:mi>m</mml:mi></mml:msub><mml:mo>→</mml:mo><mml:mi>c</mml:mi></mml:mrow></mml:math></alternatives></inline-formula>, and <italic>Bc</italic> ≠ 0, which are satisfied by common estimators. Given independent loci, we prove almost sure convergence to the desired quantity (<xref ref-type="supplementary-material" rid="pgen.1009241.s001">S1 Text</xref>),
<disp-formula id="pgen.1009241.e067"><alternatives><graphic id="pgen.1009241.e067g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e067" xlink:type="simple"/><mml:math display="block" id="M67"><mml:mrow><mml:mtable equalcolumns="true" equalrows="true"><mml:mtr><mml:mtd><mml:mrow><mml:mfrac><mml:mrow><mml:msub><mml:mover accent="true"><mml:mi>A</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>m</mml:mi></mml:msub></mml:mrow><mml:mrow><mml:msub><mml:mover accent="true"><mml:mi>B</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>m</mml:mi></mml:msub></mml:mrow></mml:mfrac><mml:mo>=</mml:mo><mml:mfrac><mml:mrow><mml:mfrac><mml:mn>1</mml:mn><mml:mi>m</mml:mi></mml:mfrac><mml:mstyle displaystyle="true"><mml:munderover><mml:mo>∑</mml:mo><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>m</mml:mi></mml:munderover><mml:mrow><mml:msub><mml:mi>a</mml:mi><mml:mi>i</mml:mi></mml:msub></mml:mrow></mml:mstyle></mml:mrow><mml:mrow><mml:mfrac><mml:mn>1</mml:mn><mml:mi>m</mml:mi></mml:mfrac><mml:mstyle displaystyle="true"><mml:munderover><mml:mo>∑</mml:mo><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>m</mml:mi></mml:munderover><mml:mrow><mml:msub><mml:mi>b</mml:mi><mml:mi>i</mml:mi></mml:msub></mml:mrow></mml:mstyle></mml:mrow></mml:mfrac><mml:munderover><mml:mo>→</mml:mo><mml:mrow><mml:mi>m</mml:mi><mml:mo>→</mml:mo><mml:mi>∞</mml:mi></mml:mrow><mml:mrow><mml:mtext>a.s.</mml:mtext></mml:mrow></mml:munderover><mml:mfrac><mml:mi>A</mml:mi><mml:mi>B</mml:mi></mml:mfrac><mml:mo>,</mml:mo></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:mrow></mml:math></alternatives> <label>(10)</label></disp-formula>
a strong result that implies <inline-formula id="pgen.1009241.e068"><alternatives><graphic id="pgen.1009241.e068g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e068" xlink:type="simple"/><mml:math display="inline" id="M68"><mml:mrow><mml:mo form="prefix">E</mml:mo><mml:mo>[</mml:mo><mml:mfrac><mml:msub><mml:mover accent="true"><mml:mi>A</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>m</mml:mi></mml:msub><mml:msub><mml:mover accent="true"><mml:mi>B</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>m</mml:mi></mml:msub></mml:mfrac><mml:mo>]</mml:mo><mml:mo>→</mml:mo><mml:mfrac><mml:mi>A</mml:mi><mml:mi>B</mml:mi></mml:mfrac></mml:mrow></mml:math></alternatives></inline-formula>, justifying previous work [<xref ref-type="bibr" rid="pgen.1009241.ref004">4</xref>, <xref ref-type="bibr" rid="pgen.1009241.ref017">17</xref>, <xref ref-type="bibr" rid="pgen.1009241.ref023">23</xref>]. Moreover, the error between these expectations scales with <inline-formula id="pgen.1009241.e069"><alternatives><graphic id="pgen.1009241.e069g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e069" xlink:type="simple"/><mml:math display="inline" id="M69"><mml:mfrac><mml:mn>1</mml:mn><mml:mi>m</mml:mi></mml:mfrac></mml:math></alternatives></inline-formula> (<xref ref-type="supplementary-material" rid="pgen.1009241.s001">S1 Text</xref>), just as for standard ratio estimators [<xref ref-type="bibr" rid="pgen.1009241.ref069">69</xref>]. Although real loci are not independent due to genetic linkage, their dependence is very localized, so this estimator will perform well if the effective number of independent loci is large.</p>
<p>In order to test if a given ratio-of-means estimator converges to its ratio of expectations as in <xref ref-type="disp-formula" rid="pgen.1009241.e067">Eq (10)</xref>, the following three conditions can be tested. (i) The expected values of each term <italic>a</italic><sub><italic>i</italic></sub>, <italic>b</italic><sub><italic>i</italic></sub> must be calculated and shown to be of the form E[<italic>a</italic><sub><italic>i</italic></sub>] = <italic>Ac</italic><sub><italic>i</italic></sub> and E[<italic>b</italic><sub><italic>i</italic></sub>] = <italic>Bc</italic><sub><italic>i</italic></sub> for some <italic>A</italic> and <italic>B</italic> shared by all loci <italic>i</italic> and some <italic>c</italic><sub><italic>i</italic></sub> that may vary per locus <italic>i</italic> but must be shared by both E[<italic>a</italic><sub><italic>i</italic></sub>], E[<italic>b</italic><sub><italic>i</italic></sub>]. In the estimators we study, <italic>A</italic> and <italic>B</italic> are functions of IBD probabilities such as <inline-formula id="pgen.1009241.e070"><alternatives><graphic id="pgen.1009241.e070g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e070" xlink:type="simple"/><mml:math display="inline" id="M70"><mml:msubsup><mml:mi>φ</mml:mi><mml:mrow><mml:mi>j</mml:mi><mml:mi>k</mml:mi></mml:mrow><mml:mi>T</mml:mi></mml:msubsup></mml:math></alternatives></inline-formula> and <italic>F</italic><sub>ST</sub>, while <italic>c</italic><sub><italic>i</italic></sub> is a function of <inline-formula id="pgen.1009241.e071"><alternatives><graphic id="pgen.1009241.e071g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e071" xlink:type="simple"/><mml:math display="inline" id="M71"><mml:msubsup><mml:mi>p</mml:mi><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup></mml:math></alternatives></inline-formula> only. (ii) The mean <italic>c</italic><sub><italic>i</italic></sub> must converge to a non-zero value for infinite loci. (iii) Both |<italic>a</italic><sub><italic>i</italic></sub>|, |<italic>b</italic><sub><italic>i</italic></sub>| ≤ <italic>C</italic> must be bounded for all <italic>i</italic> by some finite <italic>C</italic> (the estimators we study usually have <italic>C</italic> = 1 or <italic>C</italic> = 4). If these conditions are satisfied, then <xref ref-type="disp-formula" rid="pgen.1009241.e067">Eq (10)</xref> holds for independent loci and the <italic>A</italic> and <italic>B</italic> found in the first step. See the next section for an example application of this procedure to an <italic>F</italic><sub>ST</sub> estimator.</p>
<p>Another approach is the “mean-of-ratios” estimator <inline-formula id="pgen.1009241.e072"><alternatives><graphic id="pgen.1009241.e072g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e072" xlink:type="simple"/><mml:math display="inline" id="M72"><mml:mrow><mml:mfrac><mml:mn>1</mml:mn><mml:mi>m</mml:mi></mml:mfrac><mml:msubsup><mml:mo>∑</mml:mo><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>m</mml:mi></mml:msubsup><mml:mfrac><mml:msub><mml:mi>a</mml:mi><mml:mi>i</mml:mi></mml:msub><mml:msub><mml:mi>b</mml:mi><mml:mi>i</mml:mi></mml:msub></mml:mfrac></mml:mrow></mml:math></alternatives></inline-formula>, used often to estimate kinship coefficients [<xref ref-type="bibr" rid="pgen.1009241.ref016">16</xref>, <xref ref-type="bibr" rid="pgen.1009241.ref027">27</xref>, <xref ref-type="bibr" rid="pgen.1009241.ref030">30</xref>–<xref ref-type="bibr" rid="pgen.1009241.ref035">35</xref>] and <italic>F</italic><sub>ST</sub> [<xref ref-type="bibr" rid="pgen.1009241.ref046">46</xref>]. If each <inline-formula id="pgen.1009241.e073"><alternatives><graphic id="pgen.1009241.e073g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e073" xlink:type="simple"/><mml:math display="inline" id="M73"><mml:mfrac><mml:msub><mml:mi>a</mml:mi><mml:mi>i</mml:mi></mml:msub><mml:msub><mml:mi>b</mml:mi><mml:mi>i</mml:mi></mml:msub></mml:mfrac></mml:math></alternatives></inline-formula> is biased, their average across loci will also be biased, even as <italic>m</italic> → ∞. However, if <inline-formula id="pgen.1009241.e074"><alternatives><graphic id="pgen.1009241.e074g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e074" xlink:type="simple"/><mml:math display="inline" id="M74"><mml:mrow><mml:mo form="prefix">E</mml:mo><mml:mrow><mml:mo>[</mml:mo><mml:mfrac><mml:msub><mml:mi>a</mml:mi><mml:mi>i</mml:mi></mml:msub><mml:msub><mml:mi>b</mml:mi><mml:mi>i</mml:mi></mml:msub></mml:mfrac><mml:mo>]</mml:mo></mml:mrow><mml:mo>→</mml:mo><mml:mfrac><mml:mi>A</mml:mi><mml:mi>B</mml:mi></mml:mfrac></mml:mrow></mml:math></alternatives></inline-formula> for all loci <italic>i</italic> = 1, …, <italic>m</italic> as the number of individuals <italic>n</italic> → ∞, and <inline-formula id="pgen.1009241.e075"><alternatives><graphic id="pgen.1009241.e075g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e075" xlink:type="simple"/><mml:math display="inline" id="M75"><mml:mrow><mml:mo form="prefix">Var</mml:mo><mml:mo>(</mml:mo><mml:mfrac><mml:msub><mml:mi>a</mml:mi><mml:mi>i</mml:mi></mml:msub><mml:msub><mml:mi>b</mml:mi><mml:mi>i</mml:mi></mml:msub></mml:mfrac><mml:mo>)</mml:mo></mml:mrow></mml:math></alternatives></inline-formula> is bounded, then
<disp-formula id="pgen.1009241.e076"><alternatives><graphic id="pgen.1009241.e076g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e076" xlink:type="simple"/><mml:math display="block" id="M76"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="right"><mml:mrow><mml:mfrac><mml:mn>1</mml:mn><mml:mi>m</mml:mi></mml:mfrac><mml:munderover><mml:mo>∑</mml:mo><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>m</mml:mi></mml:munderover><mml:mfrac><mml:msub><mml:mi>a</mml:mi><mml:mi>i</mml:mi></mml:msub><mml:msub><mml:mi>b</mml:mi><mml:mi>i</mml:mi></mml:msub></mml:mfrac><mml:munderover><mml:mo>→</mml:mo><mml:mrow><mml:mi>n</mml:mi><mml:mo>,</mml:mo><mml:mi>m</mml:mi><mml:mo>→</mml:mo><mml:mi>∞</mml:mi></mml:mrow><mml:mtext>a.s.</mml:mtext></mml:munderover><mml:mfrac><mml:mi>A</mml:mi><mml:mi>B</mml:mi></mml:mfrac><mml:mo>.</mml:mo></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives> <label>(11)</label></disp-formula>
Therefore, mean-of-ratios estimators must satisfy more restrictive conditions than ratio-of-means estimators, as well as large <italic>n</italic> (in addition to the large <italic>m</italic> needed by both estimators), to estimate <inline-formula id="pgen.1009241.e077"><alternatives><graphic id="pgen.1009241.e077g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e077" xlink:type="simple"/><mml:math display="inline" id="M77"><mml:mfrac><mml:mi>A</mml:mi><mml:mi>B</mml:mi></mml:mfrac></mml:math></alternatives></inline-formula> well. We do not provide a procedure to test whether a given mean-of-ratios estimator converges as shown above.</p>
</sec>
</sec>
<sec id="sec008">
<title><italic>F</italic><sub>ST</sub> estimation based on the independent subpopulations model</title>
<p>Now that we have detailed how ratio estimators may be evaluated for their accuracy, we turn to existing estimators and assess their accuracy under arbitrary population structures. We study the <italic>F</italic><sub>ST</sub> estimators Weir-Cockerham (WC) [<xref ref-type="bibr" rid="pgen.1009241.ref017">17</xref>], Weir-Hill [<xref ref-type="bibr" rid="pgen.1009241.ref004">4</xref>], “Hudson” [<xref ref-type="bibr" rid="pgen.1009241.ref023">23</xref>], and Weir-Goudet (equals HudsonK below for biallelic loci; <xref ref-type="supplementary-material" rid="pgen.1009241.s001">S1 Text</xref>) [<xref ref-type="bibr" rid="pgen.1009241.ref021">21</xref>]. The panel “Indep. Subpop. <italic>F</italic><sub>ST</sub> Estimator” in <xref ref-type="fig" rid="pgen.1009241.g001">Fig 1</xref> provides an overview of our results, which we detail in this section.</p>
<sec id="sec009">
<title>The <italic>F</italic><sub>ST</sub> estimator for independent subpopulations and infinite subpopulation sample sizes</title>
<p>The WC, Weir-Hill, and Hudson method-of-moments estimators have small sample size corrections that remarkably make them consistent (as the number of independent loci <italic>m</italic> goes to infinity) for finite numbers of individuals. However, these small sample corrections also make the estimators unnecessarily cumbersome for our purposes (see <xref ref-type="sec" rid="sec028">Methods</xref>, section <bold>Previous <italic>F</italic><sub>ST</sub> estimators for the independent subpopulations model</bold> for complete formulas). In order to illustrate clearly how these estimators behave, both under the independent subpopulations model and for arbitrary structure, here we construct simplified versions that assume infinite sample sizes per subpopulation (<xref ref-type="sec" rid="sec028">Methods</xref>, section <bold>Previous <italic>F</italic><sub>ST</sub> estimators for the independent subpopulations model</bold>). This simplification corresponds to eliminating statistical sampling, leaving only genetic sampling to analyze [<xref ref-type="bibr" rid="pgen.1009241.ref071">71</xref>]. Note that our simplified estimator nevertheless illustrates the general behavior of the WC, Weir-Hill, and Hudson estimators under arbitrary structure, and the results are equivalent to those we would obtain under finite sample sizes of individuals. While the Hudson <italic>F</italic><sub>ST</sub> estimator compares two subpopulations [<xref ref-type="bibr" rid="pgen.1009241.ref023">23</xref>], based on that work we derive a generalized “HudsonK” estimator for more than two subpopulations in <xref ref-type="sec" rid="sec028">Methods</xref>, section <bold>Generalized HudsonK <italic>F</italic><sub>ST</sub> estimator</bold>. Note that HudsonK, first derived in [<xref ref-type="bibr" rid="pgen.1009241.ref058">58</xref>], also equals the Weir-Goudet <italic>F</italic><sub>ST</sub> estimator for subpopulations [<xref ref-type="bibr" rid="pgen.1009241.ref021">21</xref>] when loci are biallelic, which was derived independently using allele matching (<xref ref-type="supplementary-material" rid="pgen.1009241.s001">S1 Text</xref>).</p>
<p>Under infinite subpopulation sample sizes, the allele frequencies at each locus and every subpopulation are known. Let <italic>j</italic> ∈ {1, …, <italic>n</italic>} index subpopulations rather than individuals and <italic>π</italic><sub><italic>ij</italic></sub> be the true allele frequency in subpopulation <italic>j</italic> at locus <italic>i</italic>. Note that <italic>π</italic><sub><italic>ij</italic></sub> are not estimated allele frequencies, but rather true subpopulation allele frequencies; this abstraction does not result in a practical estimation approach, but it greatly simplifies understanding of bias for subpopulations in a setting where there there is no statistical sampling. Although in this analysis of <italic>F</italic><sub>ST</sub> estimators the <italic>π</italic><sub><italic>ij</italic></sub> values are applied to subpopulations, for coherence with our previous work we shall call them “individual-specific allele frequencies” (IAF) [<xref ref-type="bibr" rid="pgen.1009241.ref060">60</xref>, <xref ref-type="bibr" rid="pgen.1009241.ref061">61</xref>]. Whether for individuals or subpopulations, the key assumption is that IAFs satisfy the coancestry model of <xref ref-type="disp-formula" rid="pgen.1009241.e048">Eq (6)</xref>. In this special case of infinite subpopulation sample sizes, all of WC, Weir-Hill, and HudsonK simplify to the following <italic>F</italic><sub>ST</sub> estimator for independent subpopulations (“indep”; derived in <xref ref-type="sec" rid="sec028">Methods</xref>, section <bold>Previous <italic>F</italic><sub>ST</sub> estimators for the independent subpopulations model</bold>): 
<disp-formula id="pgen.1009241.e078"><alternatives><graphic id="pgen.1009241.e078g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e078" xlink:type="simple"/><mml:math display="block" id="M78"><mml:msubsup><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup><mml:mrow><mml:mo>=</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:mi>n</mml:mi></mml:mfrac><mml:munderover><mml:mo>∑</mml:mo><mml:mrow><mml:mi>j</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>n</mml:mi></mml:munderover><mml:msub><mml:mi>π</mml:mi><mml:mrow><mml:mi>i</mml:mi><mml:mi>j</mml:mi></mml:mrow></mml:msub><mml:mo>,</mml:mo></mml:mrow></mml:math></alternatives> <label>(11)</label></disp-formula>
<disp-formula id="pgen.1009241.e079"><alternatives><graphic id="pgen.1009241.e079g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e079" xlink:type="simple"/><mml:math display="block" id="M79"><mml:msubsup><mml:mover accent="true"><mml:mi>σ</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>i</mml:mi><mml:mn>2</mml:mn></mml:msubsup><mml:mrow><mml:mo>=</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:mrow><mml:mi>n</mml:mi><mml:mo>-</mml:mo><mml:mn>1</mml:mn></mml:mrow></mml:mfrac><mml:munderover><mml:mo>∑</mml:mo><mml:mrow><mml:mi>j</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>n</mml:mi></mml:munderover><mml:mrow><mml:msup><mml:mrow><mml:mo>(</mml:mo><mml:msub><mml:mi>π</mml:mi><mml:mrow><mml:mi>i</mml:mi><mml:mi>j</mml:mi></mml:mrow></mml:msub><mml:mo>-</mml:mo><mml:msubsup><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup><mml:mo>)</mml:mo></mml:mrow><mml:mn>2</mml:mn></mml:msup></mml:mrow><mml:mo>,</mml:mo></mml:mrow></mml:math></alternatives> <label>(12)</label></disp-formula>
<disp-formula id="pgen.1009241.e080"><alternatives><graphic id="pgen.1009241.e080g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e080" xlink:type="simple"/><mml:math display="block" id="M80"><mml:mrow><mml:mrow><mml:msubsup><mml:mover accent="true"><mml:mi>F</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mtext>ST</mml:mtext></mml:mrow><mml:mrow><mml:mtext>indep</mml:mtext></mml:mrow></mml:msubsup></mml:mrow><mml:mrow><mml:mo>=</mml:mo><mml:mfrac><mml:mrow><mml:mstyle displaystyle="true"><mml:munderover><mml:mo>∑</mml:mo><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>m</mml:mi></mml:munderover><mml:mrow><mml:msubsup><mml:mover accent="true"><mml:mi>σ</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>i</mml:mi><mml:mn>2</mml:mn></mml:msubsup></mml:mrow></mml:mstyle></mml:mrow><mml:mrow><mml:mstyle displaystyle="true"><mml:munderover><mml:mo>∑</mml:mo><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>m</mml:mi></mml:munderover><mml:mrow><mml:msubsup><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup></mml:mrow></mml:mstyle><mml:mo>(</mml:mo><mml:mrow><mml:mn>1</mml:mn><mml:mo>−</mml:mo><mml:msubsup><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup></mml:mrow><mml:mo>)</mml:mo><mml:mo>+</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:mi>n</mml:mi></mml:mfrac><mml:msubsup><mml:mover accent="true"><mml:mi>σ</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>i</mml:mi><mml:mn>2</mml:mn></mml:msubsup></mml:mrow></mml:mfrac><mml:mo>.</mml:mo></mml:mrow></mml:mrow></mml:math></alternatives> <label>(13)</label></disp-formula>
The goal is to estimate <inline-formula id="pgen.1009241.e081"><alternatives><graphic id="pgen.1009241.e081g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e081" xlink:type="simple"/><mml:math display="inline" id="M81"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mtext>ST</mml:mtext></mml:msub><mml:mo>=</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:mi>n</mml:mi></mml:mfrac><mml:msubsup><mml:mo>∑</mml:mo><mml:mrow><mml:mi>j</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>n</mml:mi></mml:msubsup><mml:msubsup><mml:mi>θ</mml:mi><mml:mrow><mml:mi>j</mml:mi><mml:mi>j</mml:mi></mml:mrow><mml:mi>T</mml:mi></mml:msubsup></mml:mrow></mml:math></alternatives></inline-formula>, which is the special case of <xref ref-type="disp-formula" rid="pgen.1009241.e053">Eq (9)</xref> that weighs every subpopulation <italic>j</italic> equally (<inline-formula id="pgen.1009241.e082"><alternatives><graphic id="pgen.1009241.e082g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e082" xlink:type="simple"/><mml:math display="inline" id="M82"><mml:mrow><mml:msub><mml:mi>w</mml:mi><mml:mi>j</mml:mi></mml:msub><mml:mo>=</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:mi>n</mml:mi></mml:mfrac><mml:mspace width="0.277778em"/><mml:mo>∀</mml:mo><mml:mi>j</mml:mi></mml:mrow></mml:math></alternatives></inline-formula>).</p>
</sec>
<sec id="sec010">
<title><italic>F</italic><sub>ST</sub> estimation under the independent subpopulations model</title>
<p>Under the independent subpopulations model <inline-formula id="pgen.1009241.e083"><alternatives><graphic id="pgen.1009241.e083g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e083" xlink:type="simple"/><mml:math display="inline" id="M83"><mml:mrow><mml:msubsup><mml:mi>θ</mml:mi><mml:mrow><mml:mi>j</mml:mi><mml:mi>k</mml:mi></mml:mrow><mml:mi>T</mml:mi></mml:msubsup><mml:mo>=</mml:mo><mml:mn>0</mml:mn></mml:mrow></mml:math></alternatives></inline-formula> for <italic>j</italic> ≠ <italic>k</italic>, where <italic>T</italic> is the most recent common ancestor (MRCA) population of the set of subpopulations. Note that the estimator in <xref ref-type="disp-formula" rid="pgen.1009241.e080">Eq (13)</xref> can be derived directly from <xref ref-type="disp-formula" rid="pgen.1009241.e048">Eq (6)</xref> and these assumptions using the method of moments (ignoring the existence of previous <italic>F</italic><sub>ST</sub> estimators; <xref ref-type="supplementary-material" rid="pgen.1009241.s001">S1 Text</xref>). The expectations of the two recurrent terms in <xref ref-type="disp-formula" rid="pgen.1009241.e080">Eq (13)</xref> are
<disp-formula id="pgen.1009241.e084"><alternatives><graphic id="pgen.1009241.e084g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e084" xlink:type="simple"/><mml:math display="block" id="M84"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="right"><mml:mrow><mml:mo form="prefix">E</mml:mo><mml:mo>[</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:mi>m</mml:mi></mml:mfrac><mml:munderover><mml:mo>∑</mml:mo><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>m</mml:mi></mml:munderover><mml:msubsup><mml:mover accent="true"><mml:mi>σ</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>i</mml:mi><mml:mn>2</mml:mn></mml:msubsup><mml:mrow><mml:mo>|</mml:mo><mml:mi>T</mml:mi></mml:mrow><mml:mo>]</mml:mo></mml:mrow></mml:mtd><mml:mtd columnalign="left"><mml:mrow><mml:mo>=</mml:mo><mml:msup><mml:mover><mml:mrow><mml:mi>p</mml:mi><mml:mo>(</mml:mo><mml:mn>1</mml:mn><mml:mo>-</mml:mo><mml:mi>p</mml:mi><mml:mo>)</mml:mo></mml:mrow><mml:mo>¯</mml:mo></mml:mover><mml:mi>T</mml:mi></mml:msup><mml:msub><mml:mi>F</mml:mi><mml:mtext>ST</mml:mtext></mml:msub><mml:mo>,</mml:mo></mml:mrow></mml:mtd></mml:mtr><mml:mtr><mml:mtd columnalign="right"><mml:mrow><mml:mo form="prefix">E</mml:mo><mml:mo>[</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:mi>m</mml:mi></mml:mfrac><mml:munderover><mml:mo>∑</mml:mo><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>m</mml:mi></mml:munderover><mml:msubsup><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup><mml:mo>(</mml:mo><mml:mn>1</mml:mn><mml:mo>-</mml:mo><mml:msubsup><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup><mml:mo>)</mml:mo><mml:mrow><mml:mo>|</mml:mo><mml:mi>T</mml:mi></mml:mrow><mml:mo>]</mml:mo></mml:mrow></mml:mtd><mml:mtd columnalign="left"><mml:mrow><mml:mo>=</mml:mo><mml:msup><mml:mover><mml:mrow><mml:mi>p</mml:mi><mml:mo>(</mml:mo><mml:mn>1</mml:mn><mml:mo>-</mml:mo><mml:mi>p</mml:mi><mml:mo>)</mml:mo></mml:mrow><mml:mo>¯</mml:mo></mml:mover><mml:mi>T</mml:mi></mml:msup><mml:mo>(</mml:mo><mml:mn>1</mml:mn><mml:mo>-</mml:mo><mml:mfrac><mml:msub><mml:mi>F</mml:mi><mml:mtext>ST</mml:mtext></mml:msub><mml:mi>n</mml:mi></mml:mfrac><mml:mo>)</mml:mo><mml:mo>,</mml:mo><mml:mspace width="1em"/><mml:mtext>where</mml:mtext></mml:mrow></mml:mtd></mml:mtr><mml:mtr><mml:mtd columnalign="right"><mml:msup><mml:mover><mml:mrow><mml:mi>p</mml:mi><mml:mo>(</mml:mo><mml:mn>1</mml:mn><mml:mo>-</mml:mo><mml:mi>p</mml:mi><mml:mo>)</mml:mo></mml:mrow><mml:mo>¯</mml:mo></mml:mover><mml:mi>T</mml:mi></mml:msup></mml:mtd><mml:mtd columnalign="left"><mml:mrow><mml:mo>=</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:mi>m</mml:mi></mml:mfrac><mml:munderover><mml:mo>∑</mml:mo><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>m</mml:mi></mml:munderover><mml:msubsup><mml:mi>p</mml:mi><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup><mml:mo>(</mml:mo><mml:mn>1</mml:mn><mml:mo>-</mml:mo><mml:msubsup><mml:mi>p</mml:mi><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup><mml:mo>)</mml:mo><mml:mo>.</mml:mo></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives></disp-formula>
Eliminating <inline-formula id="pgen.1009241.e085"><alternatives><graphic id="pgen.1009241.e085g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e085" xlink:type="simple"/><mml:math display="inline" id="M85"><mml:msup><mml:mover><mml:mrow><mml:mi>p</mml:mi><mml:mo>(</mml:mo><mml:mn>1</mml:mn><mml:mo>-</mml:mo><mml:mi>p</mml:mi><mml:mo>)</mml:mo></mml:mrow><mml:mo>¯</mml:mo></mml:mover><mml:mi>T</mml:mi></mml:msup></mml:math></alternatives></inline-formula> and solving for <italic>F</italic><sub>ST</sub> in this system of equations recovers the estimator in <xref ref-type="disp-formula" rid="pgen.1009241.e080">Eq (13)</xref>.</p>
<p>Before applying the convergence result in <xref ref-type="disp-formula" rid="pgen.1009241.e067">Eq (10)</xref>, we test that the three conditions listed in section <bold>Assessing the accuracy of genome-wide ratio estimators</bold> are met. Condition (i): The locus <italic>i</italic> terms are <inline-formula id="pgen.1009241.e086"><alternatives><graphic id="pgen.1009241.e086g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e086" xlink:type="simple"/><mml:math display="inline" id="M86"><mml:mrow><mml:msub><mml:mi>a</mml:mi><mml:mi>i</mml:mi></mml:msub><mml:mo>=</mml:mo><mml:msubsup><mml:mover accent="true"><mml:mi>σ</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>i</mml:mi><mml:mn>2</mml:mn></mml:msubsup></mml:mrow></mml:math></alternatives></inline-formula> and <inline-formula id="pgen.1009241.e087"><alternatives><graphic id="pgen.1009241.e087g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e087" xlink:type="simple"/><mml:math display="inline" id="M87"><mml:mrow><mml:msub><mml:mi>b</mml:mi><mml:mi>i</mml:mi></mml:msub><mml:mo>=</mml:mo><mml:msubsup><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup><mml:mo>(</mml:mo><mml:mn>1</mml:mn><mml:mo>-</mml:mo><mml:msubsup><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup><mml:mo>)</mml:mo><mml:mo>+</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:mi>n</mml:mi></mml:mfrac><mml:msubsup><mml:mover accent="true"><mml:mi>σ</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>i</mml:mi><mml:mn>2</mml:mn></mml:msubsup></mml:mrow></mml:math></alternatives></inline-formula>, which satisfy E[<italic>a</italic><sub><italic>i</italic></sub>] = <italic>Ac</italic><sub><italic>i</italic></sub> and E[<italic>b</italic><sub><italic>i</italic></sub>] = <italic>Bc</italic><sub><italic>i</italic></sub> with <italic>A</italic> = <italic>F</italic><sub>ST</sub>, <italic>B</italic> = 1, and <inline-formula id="pgen.1009241.e088"><alternatives><graphic id="pgen.1009241.e088g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e088" xlink:type="simple"/><mml:math display="inline" id="M88"><mml:mrow><mml:msub><mml:mi>c</mml:mi><mml:mi>i</mml:mi></mml:msub><mml:mo>=</mml:mo><mml:msubsup><mml:mi>p</mml:mi><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup><mml:mo>(</mml:mo><mml:mn>1</mml:mn><mml:mo>-</mml:mo><mml:msubsup><mml:mi>p</mml:mi><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup><mml:mo>)</mml:mo></mml:mrow></mml:math></alternatives></inline-formula>. Condition (ii): <inline-formula id="pgen.1009241.e089"><alternatives><graphic id="pgen.1009241.e089g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e089" xlink:type="simple"/><mml:math display="inline" id="M89"><mml:mrow><mml:msub><mml:mover accent="true"><mml:mi>c</mml:mi><mml:mo>¯</mml:mo></mml:mover><mml:mi>m</mml:mi></mml:msub><mml:mo>→</mml:mo><mml:mi>c</mml:mi><mml:mo>=</mml:mo><mml:mo form="prefix">E</mml:mo><mml:mo>[</mml:mo><mml:msubsup><mml:mi>p</mml:mi><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup><mml:mo>(</mml:mo><mml:mn>1</mml:mn><mml:mo>-</mml:mo><mml:msubsup><mml:mi>p</mml:mi><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup><mml:mo>)</mml:mo><mml:mrow><mml:mo>|</mml:mo><mml:mi>T</mml:mi></mml:mrow><mml:mo>]</mml:mo><mml:mo>≠</mml:mo><mml:mn>0</mml:mn></mml:mrow></mml:math></alternatives></inline-formula> over the <inline-formula id="pgen.1009241.e090"><alternatives><graphic id="pgen.1009241.e090g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e090" xlink:type="simple"/><mml:math display="inline" id="M90"><mml:msubsup><mml:mi>p</mml:mi><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup></mml:math></alternatives></inline-formula> distribution across loci. Condition (iii): Since <inline-formula id="pgen.1009241.e091"><alternatives><graphic id="pgen.1009241.e091g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e091" xlink:type="simple"/><mml:math display="inline" id="M91"><mml:mrow><mml:mn>0</mml:mn><mml:mo>≤</mml:mo><mml:msub><mml:mi>π</mml:mi><mml:mrow><mml:mi>i</mml:mi><mml:mi>j</mml:mi></mml:mrow></mml:msub><mml:mo>,</mml:mo><mml:msubsup><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup><mml:mo>≤</mml:mo><mml:mn>1</mml:mn></mml:mrow></mml:math></alternatives></inline-formula>, then <inline-formula id="pgen.1009241.e092"><alternatives><graphic id="pgen.1009241.e092g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e092" xlink:type="simple"/><mml:math display="inline" id="M92"><mml:mrow><mml:mn>0</mml:mn><mml:mo>≤</mml:mo><mml:msubsup><mml:mover accent="true"><mml:mi>σ</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>i</mml:mi><mml:mn>2</mml:mn></mml:msubsup><mml:mo>≤</mml:mo><mml:mn>1</mml:mn></mml:mrow></mml:math></alternatives></inline-formula> and <inline-formula id="pgen.1009241.e093"><alternatives><graphic id="pgen.1009241.e093g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e093" xlink:type="simple"/><mml:math display="inline" id="M93"><mml:mrow><mml:mn>0</mml:mn><mml:mo>≤</mml:mo><mml:msubsup><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup><mml:mo>(</mml:mo><mml:mn>1</mml:mn><mml:mo>-</mml:mo><mml:msubsup><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup><mml:mo>)</mml:mo><mml:mo>≤</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:mn>4</mml:mn></mml:mfrac></mml:mrow></mml:math></alternatives></inline-formula>, and since <italic>n</italic> ≥ 2, <italic>C</italic> = 1 bounds both |<italic>a</italic><sub><italic>i</italic></sub>| and |<italic>b</italic><sub><italic>i</italic></sub>|. Therefore, for independent loci,
<disp-formula id="pgen.1009241.e094"><alternatives><graphic id="pgen.1009241.e094g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e094" xlink:type="simple"/><mml:math display="block" id="M94"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="right"><mml:mrow><mml:msubsup><mml:mover accent="true"><mml:mi>F</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mtext>ST</mml:mtext></mml:mrow><mml:mtext>indep</mml:mtext></mml:msubsup><mml:munderover><mml:mo>→</mml:mo><mml:mrow><mml:mi>m</mml:mi><mml:mo>→</mml:mo><mml:mi>∞</mml:mi></mml:mrow><mml:mtext>a.s.</mml:mtext></mml:munderover><mml:msub><mml:mi>F</mml:mi><mml:mtext>ST</mml:mtext></mml:msub><mml:mo>.</mml:mo></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives></disp-formula></p>
</sec>
<sec id="sec011">
<title><italic>F</italic><sub>ST</sub> estimation under arbitrary coancestry</title>
<p>Now we consider applying the independent subpopulations <italic>F</italic><sub>ST</sub> estimator to dependent subpopulations. The key difference is that now <inline-formula id="pgen.1009241.e095"><alternatives><graphic id="pgen.1009241.e095g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e095" xlink:type="simple"/><mml:math display="inline" id="M95"><mml:mrow><mml:msubsup><mml:mi>θ</mml:mi><mml:mrow><mml:mi>j</mml:mi><mml:mi>k</mml:mi></mml:mrow><mml:mi>T</mml:mi></mml:msubsup><mml:mo>≠</mml:mo><mml:mn>0</mml:mn></mml:mrow></mml:math></alternatives></inline-formula> for every (<italic>j</italic>, <italic>k</italic>) will be assumed in our coancestry model in <xref ref-type="disp-formula" rid="pgen.1009241.e048">Eq (6)</xref>, and now <italic>T</italic> may be either the MRCA population of all subpopulations or a more ancestral population. In this general setting, (<italic>j</italic>, <italic>k</italic>) may index either subpopulations or individuals. The two terms of <inline-formula id="pgen.1009241.e096"><alternatives><graphic id="pgen.1009241.e096g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e096" xlink:type="simple"/><mml:math display="inline" id="M96"><mml:msubsup><mml:mover accent="true"><mml:mi>F</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mtext>ST</mml:mtext></mml:mrow><mml:mtext>indep</mml:mtext></mml:msubsup></mml:math></alternatives></inline-formula> now satisfy
<disp-formula id="pgen.1009241.e097"><alternatives><graphic id="pgen.1009241.e097g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e097" xlink:type="simple"/><mml:math display="block" id="M97"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="right"><mml:mrow><mml:mo form="prefix">E</mml:mo><mml:mo>[</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:mi>m</mml:mi></mml:mfrac><mml:munderover><mml:mo>∑</mml:mo><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>m</mml:mi></mml:munderover><mml:msubsup><mml:mover accent="true"><mml:mi>σ</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>i</mml:mi><mml:mn>2</mml:mn></mml:msubsup><mml:mrow><mml:mo>|</mml:mo><mml:mi>T</mml:mi></mml:mrow><mml:mo>]</mml:mo></mml:mrow></mml:mtd><mml:mtd columnalign="left"><mml:mrow><mml:mo>=</mml:mo><mml:msup><mml:mover><mml:mrow><mml:mi>p</mml:mi><mml:mo>(</mml:mo><mml:mn>1</mml:mn><mml:mo>-</mml:mo><mml:mi>p</mml:mi><mml:mo>)</mml:mo></mml:mrow><mml:mo>¯</mml:mo></mml:mover><mml:mi>T</mml:mi></mml:msup><mml:mo>(</mml:mo><mml:msub><mml:mi>F</mml:mi><mml:mtext>ST</mml:mtext></mml:msub><mml:mo>-</mml:mo><mml:msup><mml:mover accent="true"><mml:mi>θ</mml:mi><mml:mo>¯</mml:mo></mml:mover><mml:mi>T</mml:mi></mml:msup><mml:mo>)</mml:mo><mml:mfrac><mml:mi>n</mml:mi><mml:mrow><mml:mi>n</mml:mi><mml:mo>-</mml:mo><mml:mn>1</mml:mn></mml:mrow></mml:mfrac><mml:mo>,</mml:mo></mml:mrow></mml:mtd></mml:mtr><mml:mtr><mml:mtd columnalign="right"><mml:mrow><mml:mo form="prefix">E</mml:mo><mml:mo>[</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:mi>m</mml:mi></mml:mfrac><mml:munderover><mml:mo>∑</mml:mo><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>m</mml:mi></mml:munderover><mml:msubsup><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup><mml:mo>(</mml:mo><mml:mn>1</mml:mn><mml:mo>-</mml:mo><mml:msubsup><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup><mml:mo>)</mml:mo><mml:mrow><mml:mo>|</mml:mo><mml:mi>T</mml:mi></mml:mrow><mml:mo>]</mml:mo></mml:mrow></mml:mtd><mml:mtd columnalign="left"><mml:mrow><mml:mo>=</mml:mo><mml:msup><mml:mover><mml:mrow><mml:mi>p</mml:mi><mml:mo>(</mml:mo><mml:mn>1</mml:mn><mml:mo>-</mml:mo><mml:mi>p</mml:mi><mml:mo>)</mml:mo></mml:mrow><mml:mo>¯</mml:mo></mml:mover><mml:mi>T</mml:mi></mml:msup><mml:mo>(</mml:mo><mml:mn>1</mml:mn><mml:mo>-</mml:mo><mml:msup><mml:mover accent="true"><mml:mi>θ</mml:mi><mml:mo>¯</mml:mo></mml:mover><mml:mi>T</mml:mi></mml:msup><mml:mo>)</mml:mo><mml:mo>,</mml:mo></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives></disp-formula>
where <inline-formula id="pgen.1009241.e098"><alternatives><graphic id="pgen.1009241.e098g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e098" xlink:type="simple"/><mml:math display="inline" id="M98"><mml:mrow><mml:msup><mml:mover accent="true"><mml:mi>θ</mml:mi><mml:mo>¯</mml:mo></mml:mover><mml:mi>T</mml:mi></mml:msup><mml:mo>=</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:msup><mml:mi>n</mml:mi><mml:mn>2</mml:mn></mml:msup></mml:mfrac><mml:msubsup><mml:mo>∑</mml:mo><mml:mrow><mml:mi>j</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>n</mml:mi></mml:msubsup><mml:msubsup><mml:mo>∑</mml:mo><mml:mrow><mml:mi>k</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>n</mml:mi></mml:msubsup><mml:msubsup><mml:mi>θ</mml:mi><mml:mrow><mml:mi>j</mml:mi><mml:mi>k</mml:mi></mml:mrow><mml:mi>T</mml:mi></mml:msubsup></mml:mrow></mml:math></alternatives></inline-formula> is the mean coancestry with uniform weights. There are two equations but three unknowns: <italic>F</italic><sub>ST</sub>, <inline-formula id="pgen.1009241.e099"><alternatives><graphic id="pgen.1009241.e099g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e099" xlink:type="simple"/><mml:math display="inline" id="M99"><mml:msup><mml:mover accent="true"><mml:mi>θ</mml:mi><mml:mo>¯</mml:mo></mml:mover><mml:mi>T</mml:mi></mml:msup></mml:math></alternatives></inline-formula>, and <inline-formula id="pgen.1009241.e100"><alternatives><graphic id="pgen.1009241.e100g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e100" xlink:type="simple"/><mml:math display="inline" id="M100"><mml:msup><mml:mover><mml:mrow><mml:mi>p</mml:mi><mml:mo>(</mml:mo><mml:mn>1</mml:mn><mml:mo>-</mml:mo><mml:mi>p</mml:mi><mml:mo>)</mml:mo></mml:mrow><mml:mo>¯</mml:mo></mml:mover><mml:mi>T</mml:mi></mml:msup></mml:math></alternatives></inline-formula>. The independent subpopulations model satisfies <inline-formula id="pgen.1009241.e101"><alternatives><graphic id="pgen.1009241.e101g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e101" xlink:type="simple"/><mml:math display="inline" id="M101"><mml:mrow><mml:msup><mml:mover accent="true"><mml:mi>θ</mml:mi><mml:mo>¯</mml:mo></mml:mover><mml:mi>T</mml:mi></mml:msup><mml:mo>=</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:mi>n</mml:mi></mml:mfrac><mml:msub><mml:mi>F</mml:mi><mml:mtext>ST</mml:mtext></mml:msub></mml:mrow></mml:math></alternatives></inline-formula>, which allows for the consistent estimation of <italic>F</italic><sub>ST</sub>. Therefore, the new unknown <inline-formula id="pgen.1009241.e102"><alternatives><graphic id="pgen.1009241.e102g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e102" xlink:type="simple"/><mml:math display="inline" id="M102"><mml:msup><mml:mover accent="true"><mml:mi>θ</mml:mi><mml:mo>¯</mml:mo></mml:mover><mml:mi>T</mml:mi></mml:msup></mml:math></alternatives></inline-formula> precludes consistent <italic>F</italic><sub>ST</sub> estimation without additional assumptions. As shown later, our additional assumption is that we can identify unrelated individuals in the data, which determines all unknowns. We defer our complete solution to this problem until kinship and its estimation challenges have been presented.</p>
<p>The <italic>F</italic><sub>ST</sub> estimator for independent subpopulations converges more generally to
<disp-formula id="pgen.1009241.e103"><alternatives><graphic id="pgen.1009241.e103g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e103" xlink:type="simple"/><mml:math display="block" id="M103"><mml:msubsup><mml:mover accent="true"><mml:mi>F</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mtext>ST</mml:mtext></mml:mrow><mml:mtext>indep</mml:mtext></mml:msubsup><mml:mrow><mml:munderover><mml:mo>→</mml:mo><mml:mrow><mml:mi>m</mml:mi><mml:mo>→</mml:mo><mml:mi>∞</mml:mi></mml:mrow><mml:mtext>a.s.</mml:mtext></mml:munderover><mml:mfrac><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mtext>ST</mml:mtext></mml:msub><mml:mo>-</mml:mo><mml:msup><mml:mover accent="true"><mml:mi>θ</mml:mi><mml:mo>˜</mml:mo></mml:mover><mml:mi>T</mml:mi></mml:msup></mml:mrow><mml:mrow><mml:mn>1</mml:mn><mml:mo>-</mml:mo><mml:msup><mml:mover accent="true"><mml:mi>θ</mml:mi><mml:mo>˜</mml:mo></mml:mover><mml:mi>T</mml:mi></mml:msup></mml:mrow></mml:mfrac><mml:mo>,</mml:mo></mml:mrow></mml:math></alternatives> <label>(14)</label></disp-formula>
(the conclusion of panel “Indep. Subpop. <italic>F</italic><sub>ST</sub> Estimator” in <xref ref-type="fig" rid="pgen.1009241.g001">Fig 1</xref>), where
<disp-formula id="pgen.1009241.e104"><alternatives><graphic id="pgen.1009241.e104g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e104" xlink:type="simple"/><mml:math display="block" id="M104"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="right"><mml:mrow><mml:msup><mml:mover accent="true"><mml:mi>θ</mml:mi><mml:mo>˜</mml:mo></mml:mover><mml:mi>T</mml:mi></mml:msup><mml:mo>=</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:mrow><mml:mi>n</mml:mi><mml:mo>-</mml:mo><mml:mn>1</mml:mn></mml:mrow></mml:mfrac><mml:mo>(</mml:mo><mml:mi>n</mml:mi><mml:msup><mml:mover accent="true"><mml:mi>θ</mml:mi><mml:mo>¯</mml:mo></mml:mover><mml:mi>T</mml:mi></mml:msup><mml:mo>-</mml:mo><mml:msub><mml:mi>F</mml:mi><mml:mtext>ST</mml:mtext></mml:msub><mml:mo>)</mml:mo><mml:mo>=</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:mrow><mml:mi>n</mml:mi><mml:mo>(</mml:mo><mml:mi>n</mml:mi><mml:mo>-</mml:mo><mml:mn>1</mml:mn><mml:mo>)</mml:mo></mml:mrow></mml:mfrac><mml:munder><mml:mo>∑</mml:mo><mml:mrow><mml:mi>j</mml:mi><mml:mo>≠</mml:mo><mml:mi>k</mml:mi></mml:mrow></mml:munder><mml:msubsup><mml:mi>θ</mml:mi><mml:mrow><mml:mi>j</mml:mi><mml:mi>k</mml:mi></mml:mrow><mml:mi>T</mml:mi></mml:msubsup></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives></disp-formula>
is the average of all between-subpopulation coancestry coefficients, in agreement with related calculations regarding the WC and Weir-Hill estimators [<xref ref-type="bibr" rid="pgen.1009241.ref004">4</xref>, <xref ref-type="bibr" rid="pgen.1009241.ref021">21</xref>]. Therefore, under arbitrary structure the independent subpopulations estimator’s bias is due to the coancestry between subpopulations. While the limit in <xref ref-type="disp-formula" rid="pgen.1009241.e103">Eq (14)</xref> appears to vary depending on the choice of <italic>T</italic>, it is in fact a constant with respect to <italic>T</italic> (proof in <xref ref-type="supplementary-material" rid="pgen.1009241.s001">S1 Text</xref>).</p>
<p>Since <inline-formula id="pgen.1009241.e105"><alternatives><graphic id="pgen.1009241.e105g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e105" xlink:type="simple"/><mml:math display="inline" id="M105"><mml:mrow><mml:mfrac><mml:mn>1</mml:mn><mml:mi>n</mml:mi></mml:mfrac><mml:msub><mml:mi>F</mml:mi><mml:mtext>ST</mml:mtext></mml:msub><mml:mo>≤</mml:mo><mml:msup><mml:mover accent="true"><mml:mi>θ</mml:mi><mml:mo>¯</mml:mo></mml:mover><mml:mi>T</mml:mi></mml:msup><mml:mo>≤</mml:mo><mml:msub><mml:mi>F</mml:mi><mml:mtext>ST</mml:mtext></mml:msub></mml:mrow></mml:math></alternatives></inline-formula> (<xref ref-type="supplementary-material" rid="pgen.1009241.s001">S1 Text</xref>), this estimator has a downward bias in the general setting: it is asymptotically unbiased (<inline-formula id="pgen.1009241.e106"><alternatives><graphic id="pgen.1009241.e106g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e106" xlink:type="simple"/><mml:math display="inline" id="M106"><mml:mrow><mml:msubsup><mml:mover accent="true"><mml:mi>F</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mtext>ST</mml:mtext></mml:mrow><mml:mtext>indep</mml:mtext></mml:msubsup><mml:munderover><mml:mo>→</mml:mo><mml:mrow><mml:mi>m</mml:mi><mml:mo>→</mml:mo><mml:mi>∞</mml:mi></mml:mrow><mml:mtext>a.s.</mml:mtext></mml:munderover><mml:msub><mml:mi>F</mml:mi><mml:mtext>ST</mml:mtext></mml:msub></mml:mrow></mml:math></alternatives></inline-formula>) only when <inline-formula id="pgen.1009241.e107"><alternatives><graphic id="pgen.1009241.e107g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e107" xlink:type="simple"/><mml:math display="inline" id="M107"><mml:mrow><mml:msup><mml:mover accent="true"><mml:mi>θ</mml:mi><mml:mo>¯</mml:mo></mml:mover><mml:mi>T</mml:mi></mml:msup><mml:mo>=</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:mi>n</mml:mi></mml:mfrac><mml:msub><mml:mi>F</mml:mi><mml:mtext>ST</mml:mtext></mml:msub></mml:mrow></mml:math></alternatives></inline-formula>, while bias is maximal when <inline-formula id="pgen.1009241.e108"><alternatives><graphic id="pgen.1009241.e108g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e108" xlink:type="simple"/><mml:math display="inline" id="M108"><mml:mrow><mml:msup><mml:mover accent="true"><mml:mi>θ</mml:mi><mml:mo>¯</mml:mo></mml:mover><mml:mi>T</mml:mi></mml:msup><mml:mo>=</mml:mo><mml:msub><mml:mi>F</mml:mi><mml:mtext>ST</mml:mtext></mml:msub></mml:mrow></mml:math></alternatives></inline-formula>, where <inline-formula id="pgen.1009241.e109"><alternatives><graphic id="pgen.1009241.e109g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e109" xlink:type="simple"/><mml:math display="inline" id="M109"><mml:mrow><mml:msubsup><mml:mover accent="true"><mml:mi>F</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mtext>ST</mml:mtext></mml:mrow><mml:mtext>indep</mml:mtext></mml:msubsup><mml:munderover><mml:mo>→</mml:mo><mml:mrow><mml:mi>m</mml:mi><mml:mo>→</mml:mo><mml:mi>∞</mml:mi></mml:mrow><mml:mtext>a.s.</mml:mtext></mml:munderover><mml:mn>0</mml:mn></mml:mrow></mml:math></alternatives></inline-formula>. For example, if <inline-formula id="pgen.1009241.e110"><alternatives><graphic id="pgen.1009241.e110g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e110" xlink:type="simple"/><mml:math display="inline" id="M110"><mml:mrow><mml:mo form="prefix" movablelimits="true">min</mml:mo><mml:mspace width="4pt"/><mml:msubsup><mml:mi>θ</mml:mi><mml:mrow><mml:mi>j</mml:mi><mml:mi>k</mml:mi></mml:mrow><mml:mi>T</mml:mi></mml:msubsup><mml:mo>=</mml:mo><mml:mn>0</mml:mn></mml:mrow></mml:math></alternatives></inline-formula> so the MRCA population <italic>T</italic> is fixed, but <italic>n</italic> is large and <inline-formula id="pgen.1009241.e111"><alternatives><graphic id="pgen.1009241.e111g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e111" xlink:type="simple"/><mml:math display="inline" id="M111"><mml:mrow><mml:msubsup><mml:mi>θ</mml:mi><mml:mrow><mml:mi>j</mml:mi><mml:mi>k</mml:mi></mml:mrow><mml:mi>T</mml:mi></mml:msubsup><mml:mo>≈</mml:mo><mml:msub><mml:mi>F</mml:mi><mml:mtext>ST</mml:mtext></mml:msub></mml:mrow></mml:math></alternatives></inline-formula> for most pairs of subpopulations, then <inline-formula id="pgen.1009241.e112"><alternatives><graphic id="pgen.1009241.e112g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e112" xlink:type="simple"/><mml:math display="inline" id="M112"><mml:mrow><mml:msup><mml:mover accent="true"><mml:mi>θ</mml:mi><mml:mo>¯</mml:mo></mml:mover><mml:mi>T</mml:mi></mml:msup><mml:mo>≈</mml:mo><mml:msub><mml:mi>F</mml:mi><mml:mtext>ST</mml:mtext></mml:msub></mml:mrow></mml:math></alternatives></inline-formula> as well, and <inline-formula id="pgen.1009241.e113"><alternatives><graphic id="pgen.1009241.e113g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e113" xlink:type="simple"/><mml:math display="inline" id="M113"><mml:mrow><mml:msubsup><mml:mover accent="true"><mml:mi>F</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mtext>ST</mml:mtext></mml:mrow><mml:mtext>indep</mml:mtext></mml:msubsup><mml:mo>≈</mml:mo><mml:mn>0</mml:mn></mml:mrow></mml:math></alternatives></inline-formula>. Therefore, the magnitude of the bias of <inline-formula id="pgen.1009241.e114"><alternatives><graphic id="pgen.1009241.e114g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e114" xlink:type="simple"/><mml:math display="inline" id="M114"><mml:msubsup><mml:mover accent="true"><mml:mi>F</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mtext>ST</mml:mtext></mml:mrow><mml:mtext>indep</mml:mtext></mml:msubsup></mml:math></alternatives></inline-formula> is unknown if <inline-formula id="pgen.1009241.e115"><alternatives><graphic id="pgen.1009241.e115g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e115" xlink:type="simple"/><mml:math display="inline" id="M115"><mml:msup><mml:mover accent="true"><mml:mi>θ</mml:mi><mml:mo>¯</mml:mo></mml:mover><mml:mi>T</mml:mi></mml:msup></mml:math></alternatives></inline-formula> is unknown, and small <inline-formula id="pgen.1009241.e116"><alternatives><graphic id="pgen.1009241.e116g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e116" xlink:type="simple"/><mml:math display="inline" id="M116"><mml:msubsup><mml:mover accent="true"><mml:mi>F</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mtext>ST</mml:mtext></mml:mrow><mml:mtext>indep</mml:mtext></mml:msubsup></mml:math></alternatives></inline-formula> estimates may arise even if <italic>F</italic><sub>ST</sub> is very large.</p>
</sec>
<sec id="sec012">
<title>Coancestry estimation as a method of moments</title>
<p>Since the generalized <italic>F</italic><sub>ST</sub> is given by coancestry coefficients <inline-formula id="pgen.1009241.e117"><alternatives><graphic id="pgen.1009241.e117g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e117" xlink:type="simple"/><mml:math display="inline" id="M117"><mml:msubsup><mml:mi>θ</mml:mi><mml:mrow><mml:mi>j</mml:mi><mml:mi>j</mml:mi></mml:mrow><mml:mi>T</mml:mi></mml:msubsup></mml:math></alternatives></inline-formula> in <xref ref-type="disp-formula" rid="pgen.1009241.e053">Eq (9)</xref>, a new <italic>F</italic><sub>ST</sub> estimator could be derived from estimates of <inline-formula id="pgen.1009241.e118"><alternatives><graphic id="pgen.1009241.e118g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e118" xlink:type="simple"/><mml:math display="inline" id="M118"><mml:msubsup><mml:mi>θ</mml:mi><mml:mrow><mml:mi>j</mml:mi><mml:mi>j</mml:mi></mml:mrow><mml:mi>T</mml:mi></mml:msubsup></mml:math></alternatives></inline-formula>. Here we attempt to define a method-of-moments estimator for <inline-formula id="pgen.1009241.e119"><alternatives><graphic id="pgen.1009241.e119g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e119" xlink:type="simple"/><mml:math display="inline" id="M119"><mml:msubsup><mml:mi>θ</mml:mi><mml:mrow><mml:mi>j</mml:mi><mml:mi>k</mml:mi></mml:mrow><mml:mi>T</mml:mi></mml:msubsup></mml:math></alternatives></inline-formula>, and find an underdetermined estimation problem, just as for <italic>F</italic><sub>ST</sub>. This is consistent with IBD parameters in general requiring a reference population to be determined [<xref ref-type="bibr" rid="pgen.1009241.ref040">40</xref>], whereas in this subsection this reference population is unspecified.</p>
<p>Given IAFs and the coancestry model of <xref ref-type="disp-formula" rid="pgen.1009241.e048">Eq (6)</xref>, the first and second moments that average across loci are
<disp-formula id="pgen.1009241.e120"><alternatives><graphic id="pgen.1009241.e120g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e120" xlink:type="simple"/><mml:math display="block" id="M120"><mml:mrow><mml:mo form="prefix">E</mml:mo><mml:mo>[</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:mi>m</mml:mi></mml:mfrac><mml:munderover><mml:mo>∑</mml:mo><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>m</mml:mi></mml:munderover><mml:msub><mml:mi>π</mml:mi><mml:mrow><mml:mi>i</mml:mi><mml:mi>j</mml:mi></mml:mrow></mml:msub><mml:mrow><mml:mo>|</mml:mo><mml:mi>T</mml:mi></mml:mrow><mml:mo>]</mml:mo></mml:mrow><mml:mrow><mml:mo>=</mml:mo><mml:msup><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>¯</mml:mo></mml:mover><mml:mi>T</mml:mi></mml:msup><mml:mo>,</mml:mo></mml:mrow></mml:math></alternatives> <label>(15)</label></disp-formula>
<disp-formula id="pgen.1009241.e121"><alternatives><graphic id="pgen.1009241.e121g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e121" xlink:type="simple"/><mml:math display="block" id="M121"><mml:mrow><mml:mo form="prefix">E</mml:mo><mml:mo>[</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:mi>m</mml:mi></mml:mfrac><mml:munderover><mml:mo>∑</mml:mo><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>m</mml:mi></mml:munderover><mml:msub><mml:mi>π</mml:mi><mml:mrow><mml:mi>i</mml:mi><mml:mi>j</mml:mi></mml:mrow></mml:msub><mml:msub><mml:mi>π</mml:mi><mml:mrow><mml:mi>i</mml:mi><mml:mi>k</mml:mi></mml:mrow></mml:msub><mml:mrow><mml:mo>|</mml:mo><mml:mi>T</mml:mi></mml:mrow><mml:mo>]</mml:mo></mml:mrow><mml:mrow><mml:mo>=</mml:mo><mml:msup><mml:mover><mml:msup><mml:mi>p</mml:mi><mml:mn>2</mml:mn></mml:msup><mml:mo>¯</mml:mo></mml:mover><mml:mi>T</mml:mi></mml:msup><mml:mo>+</mml:mo><mml:msup><mml:mover><mml:mrow><mml:mi>p</mml:mi><mml:mo>(</mml:mo><mml:mn>1</mml:mn><mml:mo>-</mml:mo><mml:mi>p</mml:mi><mml:mo>)</mml:mo></mml:mrow><mml:mo>¯</mml:mo></mml:mover><mml:mi>T</mml:mi></mml:msup><mml:msubsup><mml:mi>θ</mml:mi><mml:mrow><mml:mi>j</mml:mi><mml:mi>k</mml:mi></mml:mrow><mml:mi>T</mml:mi></mml:msubsup><mml:mo>,</mml:mo></mml:mrow></mml:math></alternatives> <label>(16)</label></disp-formula>
where <inline-formula id="pgen.1009241.e122"><alternatives><graphic id="pgen.1009241.e122g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e122" xlink:type="simple"/><mml:math display="inline" id="M122"><mml:mrow><mml:msup><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>¯</mml:mo></mml:mover><mml:mi>T</mml:mi></mml:msup><mml:mo>=</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:mi>m</mml:mi></mml:mfrac><mml:msubsup><mml:mo>∑</mml:mo><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>m</mml:mi></mml:msubsup><mml:msubsup><mml:mi>p</mml:mi><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup></mml:mrow></mml:math></alternatives></inline-formula>, <inline-formula id="pgen.1009241.e123"><alternatives><graphic id="pgen.1009241.e123g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e123" xlink:type="simple"/><mml:math display="inline" id="M123"><mml:mrow><mml:msup><mml:mrow><mml:mover accent="true"><mml:mrow><mml:msup><mml:mi>p</mml:mi><mml:mn>2</mml:mn></mml:msup></mml:mrow><mml:mo stretchy="true">¯</mml:mo></mml:mover></mml:mrow><mml:mi>T</mml:mi></mml:msup><mml:mo>=</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:mi>m</mml:mi></mml:mfrac><mml:msubsup><mml:mstyle displaystyle="true" mathsize="140%"><mml:mo>∑</mml:mo></mml:mstyle><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>m</mml:mi></mml:msubsup><mml:msup><mml:mrow><mml:mo>(</mml:mo><mml:mrow><mml:msubsup><mml:mi>p</mml:mi><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup></mml:mrow><mml:mo>)</mml:mo></mml:mrow><mml:mn>2</mml:mn></mml:msup></mml:mrow></mml:math></alternatives></inline-formula>, and <inline-formula id="pgen.1009241.e124"><alternatives><graphic id="pgen.1009241.e124g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e124" xlink:type="simple"/><mml:math display="inline" id="M124"><mml:msup><mml:mover><mml:mrow><mml:mi>p</mml:mi><mml:mo>(</mml:mo><mml:mn>1</mml:mn><mml:mo>-</mml:mo><mml:mi>p</mml:mi><mml:mo>)</mml:mo></mml:mrow><mml:mo>¯</mml:mo></mml:mover><mml:mi>T</mml:mi></mml:msup></mml:math></alternatives></inline-formula> is as before.</p>
<p>Suppose first that only <inline-formula id="pgen.1009241.e125"><alternatives><graphic id="pgen.1009241.e125g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e125" xlink:type="simple"/><mml:math display="inline" id="M125"><mml:msubsup><mml:mi>θ</mml:mi><mml:mrow><mml:mi>j</mml:mi><mml:mi>j</mml:mi></mml:mrow><mml:mi>T</mml:mi></mml:msubsup></mml:math></alternatives></inline-formula> are of interest. There are <italic>n</italic> estimators given by <xref ref-type="disp-formula" rid="pgen.1009241.e121">Eq (16)</xref> with <italic>j</italic> = <italic>k</italic>, each corresponding to an unknown <inline-formula id="pgen.1009241.e126"><alternatives><graphic id="pgen.1009241.e126g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e126" xlink:type="simple"/><mml:math display="inline" id="M126"><mml:msubsup><mml:mi>θ</mml:mi><mml:mrow><mml:mi>j</mml:mi><mml:mi>j</mml:mi></mml:mrow><mml:mi>T</mml:mi></mml:msubsup></mml:math></alternatives></inline-formula>. However, all these estimators share two nuisance parameters: <inline-formula id="pgen.1009241.e127"><alternatives><graphic id="pgen.1009241.e127g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e127" xlink:type="simple"/><mml:math display="inline" id="M127"><mml:msup><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>¯</mml:mo></mml:mover><mml:mi>T</mml:mi></mml:msup></mml:math></alternatives></inline-formula> and <inline-formula id="pgen.1009241.e128"><alternatives><graphic id="pgen.1009241.e128g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e128" xlink:type="simple"/><mml:math display="inline" id="M128"><mml:msup><mml:mover><mml:msup><mml:mi>p</mml:mi><mml:mn>2</mml:mn></mml:msup><mml:mo>¯</mml:mo></mml:mover><mml:mi>T</mml:mi></mml:msup></mml:math></alternatives></inline-formula>. While <inline-formula id="pgen.1009241.e129"><alternatives><graphic id="pgen.1009241.e129g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e129" xlink:type="simple"/><mml:math display="inline" id="M129"><mml:msup><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>¯</mml:mo></mml:mover><mml:mi>T</mml:mi></mml:msup></mml:math></alternatives></inline-formula> can be estimated from <xref ref-type="disp-formula" rid="pgen.1009241.e120">Eq (15)</xref>, there are no more equations left to estimate <inline-formula id="pgen.1009241.e130"><alternatives><graphic id="pgen.1009241.e130g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e130" xlink:type="simple"/><mml:math display="inline" id="M130"><mml:msup><mml:mover><mml:msup><mml:mi>p</mml:mi><mml:mn>2</mml:mn></mml:msup><mml:mo>¯</mml:mo></mml:mover><mml:mi>T</mml:mi></mml:msup></mml:math></alternatives></inline-formula>, so this system is underdetermined. The estimation problem remains underdetermined if all <inline-formula id="pgen.1009241.e131"><alternatives><graphic id="pgen.1009241.e131g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e131" xlink:type="simple"/><mml:math display="inline" id="M131"><mml:mfrac><mml:mrow><mml:mi>n</mml:mi><mml:mo>(</mml:mo><mml:mi>n</mml:mi><mml:mo>+</mml:mo><mml:mn>1</mml:mn><mml:mo>)</mml:mo></mml:mrow><mml:mn>2</mml:mn></mml:mfrac></mml:math></alternatives></inline-formula> estimators in <xref ref-type="disp-formula" rid="pgen.1009241.e121">Eq (16)</xref> are considered rather than only the <italic>j</italic> = <italic>k</italic> cases. Therefore, we cannot estimate coancestry coefficients consistently using only the first two moments without additional assumptions.</p>
</sec>
</sec>
<sec id="sec013">
<title>Characterizing a kinship estimator and its relationship to <italic>F</italic><sub>ST</sub></title>
<p>Given the biases we see for <inline-formula id="pgen.1009241.e132"><alternatives><graphic id="pgen.1009241.e132g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e132" xlink:type="simple"/><mml:math display="inline" id="M132"><mml:msubsup><mml:mover accent="true"><mml:mi>F</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mtext>ST</mml:mtext></mml:mrow><mml:mtext>indep</mml:mtext></mml:msubsup></mml:math></alternatives></inline-formula> under arbitrary structures in the previous section, we now turn to the generalized definition of <italic>F</italic><sub>ST</sub> and pursue an estimate of it. Recall that our generalized <italic>F</italic><sub>ST</sub> in <xref ref-type="disp-formula" rid="pgen.1009241.e032">Eq (3)</xref> is defined in terms of inbreeding coefficients, which are a special case of the kinship coefficient. Kinship coefficients also determine the bias of <inline-formula id="pgen.1009241.e133"><alternatives><graphic id="pgen.1009241.e133g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e133" xlink:type="simple"/><mml:math display="inline" id="M133"><mml:msubsup><mml:mover accent="true"><mml:mi>F</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mtext>ST</mml:mtext></mml:mrow><mml:mtext>indep</mml:mtext></mml:msubsup></mml:math></alternatives></inline-formula> in <xref ref-type="disp-formula" rid="pgen.1009241.e103">Eq (14)</xref> (since coancestry and kinship coefficients are closely related: see panel “Coancestry in Terms of Kinship” in <xref ref-type="fig" rid="pgen.1009241.g001">Fig 1</xref>). Therefore, we will consider estimates of kinship and inbreeding in this section. Estimating kinship is also important for GWAS approaches that control for population structure [<xref ref-type="bibr" rid="pgen.1009241.ref016">16</xref>, <xref ref-type="bibr" rid="pgen.1009241.ref024">24</xref>–<xref ref-type="bibr" rid="pgen.1009241.ref035">35</xref>, <xref ref-type="bibr" rid="pgen.1009241.ref072">72</xref>, <xref ref-type="bibr" rid="pgen.1009241.ref073">73</xref>].</p>
<p>In this section, we focus on a standard kinship method-of-moments estimator and calculate its limit for the first time (panel “Existing Kinship Estimator” in <xref ref-type="fig" rid="pgen.1009241.g001">Fig 1</xref>). We study estimators that use genotypes or IAFs, and construct <italic>F</italic><sub>ST</sub> estimators from their kinship estimates. We find biases comparable to those of <inline-formula id="pgen.1009241.e134"><alternatives><graphic id="pgen.1009241.e134g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e134" xlink:type="simple"/><mml:math display="inline" id="M134"><mml:msubsup><mml:mover accent="true"><mml:mi>F</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mtext>ST</mml:mtext></mml:mrow><mml:mtext>indep</mml:mtext></mml:msubsup></mml:math></alternatives></inline-formula> in the previous section, and define unbiased <italic>F</italic><sub>ST</sub> estimators that require knowing the mean kinship or coancestry, or its proportion relative to <italic>F</italic><sub>ST</sub>. The results of this section directly motivate and help construct our new kinship and <italic>F</italic><sub>ST</sub> estimation approach in the following section.</p>
<sec id="sec014">
<title>Characterization of the standard kinship estimator</title>
<p>Here we analyze a standard kinship estimator that is frequently used [<xref ref-type="bibr" rid="pgen.1009241.ref016">16</xref>, <xref ref-type="bibr" rid="pgen.1009241.ref027">27</xref>, <xref ref-type="bibr" rid="pgen.1009241.ref030">30</xref>–<xref ref-type="bibr" rid="pgen.1009241.ref036">36</xref>]. We generalize this estimator to use weights in estimating the ancestral allele frequencies, and we write it as a ratio-of-means estimator due to the favorable theoretical properties of this format as detailed in the earlier section <bold>Assessing the accuracy of genome-wide ratio estimators</bold>: 
<disp-formula id="pgen.1009241.e135"><alternatives><graphic id="pgen.1009241.e135g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e135" xlink:type="simple"/><mml:math display="block" id="M135"><mml:msubsup><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup><mml:mrow><mml:mo>=</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:mn>2</mml:mn></mml:mfrac><mml:munderover><mml:mo>∑</mml:mo><mml:mrow><mml:mi>j</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>n</mml:mi></mml:munderover><mml:msub><mml:mi>w</mml:mi><mml:mi>j</mml:mi></mml:msub><mml:msub><mml:mi>x</mml:mi><mml:mrow><mml:mi>i</mml:mi><mml:mi>j</mml:mi></mml:mrow></mml:msub><mml:mo>,</mml:mo></mml:mrow></mml:math></alternatives> <label>(17)</label></disp-formula>
<disp-formula id="pgen.1009241.e136"><alternatives><graphic id="pgen.1009241.e136g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e136" xlink:type="simple"/><mml:math display="block" id="M136"><mml:mrow><mml:mrow><mml:msubsup><mml:mover accent="true"><mml:mi>φ</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mi>j</mml:mi><mml:mi>k</mml:mi></mml:mrow><mml:mrow><mml:mi>T</mml:mi><mml:mo>,</mml:mo><mml:mtext>std</mml:mtext></mml:mrow></mml:msubsup></mml:mrow><mml:mrow><mml:mo>=</mml:mo><mml:mfrac><mml:mrow><mml:mstyle displaystyle="true"><mml:munderover><mml:mo>∑</mml:mo><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>m</mml:mi></mml:munderover><mml:mrow><mml:mo>(</mml:mo><mml:mrow><mml:msub><mml:mi>x</mml:mi><mml:mrow><mml:mi>i</mml:mi><mml:mi>j</mml:mi></mml:mrow></mml:msub><mml:mo>−</mml:mo><mml:mn>2</mml:mn><mml:msubsup><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup></mml:mrow><mml:mo>)</mml:mo><mml:mo>(</mml:mo><mml:mrow><mml:msub><mml:mi>x</mml:mi><mml:mrow><mml:mi>i</mml:mi><mml:mi>k</mml:mi></mml:mrow></mml:msub><mml:mo>−</mml:mo><mml:mn>2</mml:mn><mml:msubsup><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup></mml:mrow><mml:mo>)</mml:mo></mml:mrow></mml:mstyle></mml:mrow><mml:mrow><mml:mn>4</mml:mn><mml:mstyle displaystyle="true"><mml:munderover><mml:mo>∑</mml:mo><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>m</mml:mi></mml:munderover><mml:mrow><mml:msubsup><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup><mml:mo>(</mml:mo><mml:mrow><mml:mn>1</mml:mn><mml:mo>−</mml:mo><mml:msubsup><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup></mml:mrow><mml:mo>)</mml:mo></mml:mrow></mml:mstyle></mml:mrow></mml:mfrac><mml:mo>.</mml:mo></mml:mrow></mml:mrow></mml:math></alternatives> <label>(18)</label></disp-formula>
The estimator in <xref ref-type="disp-formula" rid="pgen.1009241.e136">Eq (18)</xref> resembles the sample covariance estimator applied to genotypes, but centers by locus <italic>i</italic> rather than by individuals <italic>j</italic> and <italic>k</italic>, and normalizes using estimates of <inline-formula id="pgen.1009241.e137"><alternatives><graphic id="pgen.1009241.e137g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e137" xlink:type="simple"/><mml:math display="inline" id="M137"><mml:mrow><mml:mn>4</mml:mn><mml:msubsup><mml:mi>p</mml:mi><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup><mml:mo>(</mml:mo><mml:mn>1</mml:mn><mml:mo>-</mml:mo><mml:msubsup><mml:mi>p</mml:mi><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup><mml:mo>)</mml:mo></mml:mrow></mml:math></alternatives></inline-formula>. We derive <xref ref-type="disp-formula" rid="pgen.1009241.e136">Eq (18)</xref> directly using the method of moments in <xref ref-type="supplementary-material" rid="pgen.1009241.s001">S1 Text</xref>. The weights in <xref ref-type="disp-formula" rid="pgen.1009241.e135">Eq (17)</xref> must satisfy <italic>w</italic><sub><italic>j</italic></sub> &gt; 0 and <inline-formula id="pgen.1009241.e138"><alternatives><graphic id="pgen.1009241.e138g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e138" xlink:type="simple"/><mml:math display="inline" id="M138"><mml:mrow><mml:msubsup><mml:mo>∑</mml:mo><mml:mrow><mml:mi>j</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>n</mml:mi></mml:msubsup><mml:msub><mml:mi>w</mml:mi><mml:mi>j</mml:mi></mml:msub><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow></mml:math></alternatives></inline-formula>, so that <inline-formula id="pgen.1009241.e139"><alternatives><graphic id="pgen.1009241.e139g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e139" xlink:type="simple"/><mml:math display="inline" id="M139"><mml:mrow><mml:mn>0</mml:mn><mml:mo>≤</mml:mo><mml:msubsup><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup><mml:mo>≤</mml:mo><mml:mn>1</mml:mn></mml:mrow></mml:math></alternatives></inline-formula> and <inline-formula id="pgen.1009241.e140"><alternatives><graphic id="pgen.1009241.e140g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e140" xlink:type="simple"/><mml:math display="inline" id="M140"><mml:mrow><mml:mo form="prefix">E</mml:mo><mml:mo>[</mml:mo><mml:msubsup><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup><mml:mrow><mml:mo>|</mml:mo><mml:mi>T</mml:mi></mml:mrow><mml:mo>]</mml:mo><mml:mo>=</mml:mo><mml:msubsup><mml:mi>p</mml:mi><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup></mml:mrow></mml:math></alternatives></inline-formula>.</p>
<p>Utilizing the kinship model for genotypes from <xref ref-type="disp-formula" rid="pgen.1009241.e045">Eq (5)</xref>, we find that <xref ref-type="disp-formula" rid="pgen.1009241.e136">Eq (18)</xref> converges to
<disp-formula id="pgen.1009241.e141"><alternatives><graphic id="pgen.1009241.e141g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e141" xlink:type="simple"/><mml:math display="block" id="M141"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="right"><mml:mrow><mml:msubsup><mml:mover accent="true"><mml:mi>φ</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mi>j</mml:mi><mml:mi>k</mml:mi></mml:mrow><mml:mrow><mml:mi>T</mml:mi><mml:mo>,</mml:mo><mml:mtext>std</mml:mtext></mml:mrow></mml:msubsup><mml:munderover><mml:mo>→</mml:mo><mml:mrow><mml:mi>m</mml:mi><mml:mo>→</mml:mo><mml:mi>∞</mml:mi></mml:mrow><mml:mtext>a.s.</mml:mtext></mml:munderover><mml:mfrac><mml:mrow><mml:msubsup><mml:mi>φ</mml:mi><mml:mrow><mml:mi>j</mml:mi><mml:mi>k</mml:mi></mml:mrow><mml:mi>T</mml:mi></mml:msubsup><mml:mo>-</mml:mo><mml:msubsup><mml:mover accent="true"><mml:mi>φ</mml:mi><mml:mo>¯</mml:mo></mml:mover><mml:mi>j</mml:mi><mml:mi>T</mml:mi></mml:msubsup><mml:mo>-</mml:mo><mml:msubsup><mml:mover accent="true"><mml:mi>φ</mml:mi><mml:mo>¯</mml:mo></mml:mover><mml:mi>k</mml:mi><mml:mi>T</mml:mi></mml:msubsup><mml:mo>+</mml:mo><mml:msup><mml:mover accent="true"><mml:mi>φ</mml:mi><mml:mo>¯</mml:mo></mml:mover><mml:mi>T</mml:mi></mml:msup></mml:mrow><mml:mrow><mml:mn>1</mml:mn><mml:mo>-</mml:mo><mml:msup><mml:mover accent="true"><mml:mi>φ</mml:mi><mml:mo>¯</mml:mo></mml:mover><mml:mi>T</mml:mi></mml:msup></mml:mrow></mml:mfrac><mml:mo>,</mml:mo></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives> <label>(19)</label></disp-formula>
where <inline-formula id="pgen.1009241.e142"><alternatives><graphic id="pgen.1009241.e142g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e142" xlink:type="simple"/><mml:math display="inline" id="M142"><mml:mrow><mml:msubsup><mml:mover accent="true"><mml:mi>φ</mml:mi><mml:mo>¯</mml:mo></mml:mover><mml:mi>j</mml:mi><mml:mi>T</mml:mi></mml:msubsup><mml:mo>=</mml:mo><mml:msubsup><mml:mo>∑</mml:mo><mml:mrow><mml:msup><mml:mi>k</mml:mi><mml:mo>′</mml:mo></mml:msup><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>n</mml:mi></mml:msubsup><mml:msub><mml:mi>w</mml:mi><mml:msup><mml:mi>k</mml:mi><mml:mo>′</mml:mo></mml:msup></mml:msub><mml:msubsup><mml:mi>φ</mml:mi><mml:mrow><mml:mi>j</mml:mi><mml:msup><mml:mi>k</mml:mi><mml:mo>′</mml:mo></mml:msup></mml:mrow><mml:mi>T</mml:mi></mml:msubsup></mml:mrow></mml:math></alternatives></inline-formula> and <inline-formula id="pgen.1009241.e143"><alternatives><graphic id="pgen.1009241.e143g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e143" xlink:type="simple"/><mml:math display="inline" id="M143"><mml:mrow><mml:msup><mml:mover accent="true"><mml:mi>φ</mml:mi><mml:mo>¯</mml:mo></mml:mover><mml:mi>T</mml:mi></mml:msup><mml:mo>=</mml:mo><mml:msubsup><mml:mo>∑</mml:mo><mml:mrow><mml:msup><mml:mi>j</mml:mi><mml:mo>′</mml:mo></mml:msup><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>n</mml:mi></mml:msubsup><mml:msubsup><mml:mo>∑</mml:mo><mml:mrow><mml:msup><mml:mi>k</mml:mi><mml:mo>′</mml:mo></mml:msup><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>n</mml:mi></mml:msubsup><mml:msub><mml:mi>w</mml:mi><mml:msup><mml:mi>j</mml:mi><mml:mo>′</mml:mo></mml:msup></mml:msub><mml:msub><mml:mi>w</mml:mi><mml:msup><mml:mi>k</mml:mi><mml:mo>′</mml:mo></mml:msup></mml:msub><mml:msubsup><mml:mi>φ</mml:mi><mml:mrow><mml:msup><mml:mi>j</mml:mi><mml:mo>′</mml:mo></mml:msup><mml:msup><mml:mi>k</mml:mi><mml:mo>′</mml:mo></mml:msup></mml:mrow><mml:mi>T</mml:mi></mml:msubsup></mml:mrow></mml:math></alternatives></inline-formula>, which agrees with related derivations [<xref ref-type="bibr" rid="pgen.1009241.ref021">21</xref>, <xref ref-type="bibr" rid="pgen.1009241.ref062">62</xref>]. (This is the conclusion of panel “Existing Kinship Estimator” in <xref ref-type="fig" rid="pgen.1009241.g001">Fig 1</xref>; see <xref ref-type="supplementary-material" rid="pgen.1009241.s001">S1 Text</xref> for intermediate calculations that lead to <xref ref-type="disp-formula" rid="pgen.1009241.e141">Eq (19)</xref>.) Therefore, the bias of <inline-formula id="pgen.1009241.e144"><alternatives><graphic id="pgen.1009241.e144g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e144" xlink:type="simple"/><mml:math display="inline" id="M144"><mml:msubsup><mml:mover accent="true"><mml:mi>φ</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mi>j</mml:mi><mml:mi>k</mml:mi></mml:mrow><mml:mrow><mml:mi>T</mml:mi><mml:mo>,</mml:mo><mml:mtext>std</mml:mtext></mml:mrow></mml:msubsup></mml:math></alternatives></inline-formula> varies per pair of individuals <italic>j</italic> and <italic>k</italic>. Analogous distortions have been observed for sample covariances of genotypes [<xref ref-type="bibr" rid="pgen.1009241.ref074">74</xref>]. The limit of <inline-formula id="pgen.1009241.e145"><alternatives><graphic id="pgen.1009241.e145g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e145" xlink:type="simple"/><mml:math display="inline" id="M145"><mml:msubsup><mml:mover accent="true"><mml:mi>φ</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mi>j</mml:mi><mml:mi>k</mml:mi></mml:mrow><mml:mrow><mml:mi>T</mml:mi><mml:mo>,</mml:mo><mml:mtext>std</mml:mtext></mml:mrow></mml:msubsup></mml:math></alternatives></inline-formula> in <xref ref-type="disp-formula" rid="pgen.1009241.e141">Eq (19)</xref> is constant with respect to <italic>T</italic> (proof in <xref ref-type="supplementary-material" rid="pgen.1009241.s001">S1 Text</xref>). Similarly, inbreeding coefficient estimates derived from <xref ref-type="disp-formula" rid="pgen.1009241.e136">Eq (18)</xref> converge to
<disp-formula id="pgen.1009241.e146"><alternatives><graphic id="pgen.1009241.e146g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e146" xlink:type="simple"/><mml:math display="block" id="M146"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="right"><mml:mrow><mml:msubsup><mml:mover accent="true"><mml:mi>f</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mi>j</mml:mi></mml:mrow><mml:mrow><mml:mi>T</mml:mi><mml:mo>,</mml:mo><mml:mtext>std</mml:mtext></mml:mrow></mml:msubsup><mml:mo>=</mml:mo><mml:mn>2</mml:mn><mml:msubsup><mml:mover accent="true"><mml:mi>φ</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mi>j</mml:mi><mml:mi>j</mml:mi></mml:mrow><mml:mi>T</mml:mi></mml:msubsup><mml:mo>-</mml:mo><mml:mn>1</mml:mn><mml:munderover><mml:mo>→</mml:mo><mml:mrow><mml:mi>m</mml:mi><mml:mo>→</mml:mo><mml:mi>∞</mml:mi></mml:mrow><mml:mtext>a.s.</mml:mtext></mml:munderover><mml:mfrac><mml:mrow><mml:msubsup><mml:mi>f</mml:mi><mml:mrow><mml:mi>j</mml:mi></mml:mrow><mml:mi>T</mml:mi></mml:msubsup><mml:mo>-</mml:mo><mml:mn>4</mml:mn><mml:msubsup><mml:mover accent="true"><mml:mi>φ</mml:mi><mml:mo>¯</mml:mo></mml:mover><mml:mi>j</mml:mi><mml:mi>T</mml:mi></mml:msubsup><mml:mo>+</mml:mo><mml:mn>3</mml:mn><mml:msup><mml:mover accent="true"><mml:mi>φ</mml:mi><mml:mo>¯</mml:mo></mml:mover><mml:mi>T</mml:mi></mml:msup></mml:mrow><mml:mrow><mml:mn>1</mml:mn><mml:mo>-</mml:mo><mml:msup><mml:mover accent="true"><mml:mi>φ</mml:mi><mml:mo>¯</mml:mo></mml:mover><mml:mi>T</mml:mi></mml:msup></mml:mrow></mml:mfrac><mml:mo>.</mml:mo></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives> <label>(20)</label></disp-formula>
The difference between the bias of <inline-formula id="pgen.1009241.e147"><alternatives><graphic id="pgen.1009241.e147g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e147" xlink:type="simple"/><mml:math display="inline" id="M147"><mml:msubsup><mml:mover accent="true"><mml:mi>φ</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mi>j</mml:mi><mml:mi>k</mml:mi></mml:mrow><mml:mrow><mml:mi>T</mml:mi><mml:mo>,</mml:mo><mml:mtext>std</mml:mtext></mml:mrow></mml:msubsup></mml:math></alternatives></inline-formula> for <italic>j</italic> ≠ <italic>k</italic> in <xref ref-type="disp-formula" rid="pgen.1009241.e141">Eq (19)</xref> and <inline-formula id="pgen.1009241.e148"><alternatives><graphic id="pgen.1009241.e148g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e148" xlink:type="simple"/><mml:math display="inline" id="M148"><mml:msubsup><mml:mover accent="true"><mml:mi>f</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mi>j</mml:mi></mml:mrow><mml:mrow><mml:mi>T</mml:mi><mml:mo>,</mml:mo><mml:mtext>std</mml:mtext></mml:mrow></mml:msubsup></mml:math></alternatives></inline-formula> in <xref ref-type="disp-formula" rid="pgen.1009241.e146">Eq (20)</xref> is visible in the kinship estimates shown toward the end of the results section. The limits of the ratio-of-means versions of two more <inline-formula id="pgen.1009241.e149"><alternatives><graphic id="pgen.1009241.e149g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e149" xlink:type="simple"/><mml:math display="inline" id="M149"><mml:msubsup><mml:mi>f</mml:mi><mml:mrow><mml:mi>j</mml:mi></mml:mrow><mml:mi>T</mml:mi></mml:msubsup></mml:math></alternatives></inline-formula> estimators [<xref ref-type="bibr" rid="pgen.1009241.ref032">32</xref>] are, if <inline-formula id="pgen.1009241.e150"><alternatives><graphic id="pgen.1009241.e150g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e150" xlink:type="simple"/><mml:math display="inline" id="M150"><mml:msubsup><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup></mml:math></alternatives></inline-formula> uses <xref ref-type="disp-formula" rid="pgen.1009241.e135">Eq (17)</xref>,
<disp-formula id="pgen.1009241.e151"><alternatives><graphic id="pgen.1009241.e151g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e151" xlink:type="simple"/><mml:math display="block" id="M151"><mml:mrow><mml:mtable equalcolumns="true" equalrows="true"><mml:mtr><mml:mtd><mml:mrow><mml:mtable equalcolumns="true" equalrows="true"><mml:mtr><mml:mtd><mml:mrow><mml:msubsup><mml:mover accent="true"><mml:mi>f</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>j</mml:mi><mml:mrow><mml:mi>T</mml:mi><mml:mo>,</mml:mo><mml:mtext>stdII</mml:mtext></mml:mrow></mml:msubsup></mml:mrow></mml:mtd><mml:mtd columnalign="left"><mml:mrow><mml:mo>=</mml:mo><mml:mn>1</mml:mn><mml:mo>−</mml:mo><mml:mfrac><mml:mrow><mml:mstyle displaystyle="true"><mml:munderover><mml:mo>∑</mml:mo><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>m</mml:mi></mml:munderover><mml:mrow><mml:msub><mml:mi>x</mml:mi><mml:mrow><mml:mi>i</mml:mi><mml:mi>j</mml:mi></mml:mrow></mml:msub><mml:mo>(</mml:mo><mml:mrow><mml:mn>2</mml:mn><mml:mo>−</mml:mo><mml:msub><mml:mi>x</mml:mi><mml:mrow><mml:mi>i</mml:mi><mml:mi>j</mml:mi></mml:mrow></mml:msub></mml:mrow><mml:mo>)</mml:mo></mml:mrow></mml:mstyle></mml:mrow><mml:mrow><mml:mn>2</mml:mn><mml:mstyle displaystyle="true"><mml:munderover><mml:mo>∑</mml:mo><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>m</mml:mi></mml:munderover><mml:mrow><mml:msubsup><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup><mml:mo>(</mml:mo><mml:mrow><mml:mn>1</mml:mn><mml:mo>−</mml:mo><mml:msubsup><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup></mml:mrow><mml:mo>)</mml:mo></mml:mrow></mml:mstyle></mml:mrow></mml:mfrac><mml:munderover><mml:mo>→</mml:mo><mml:mrow><mml:mi>m</mml:mi><mml:mo>→</mml:mo><mml:mi>∞</mml:mi></mml:mrow><mml:mrow><mml:mtext>a.s.</mml:mtext></mml:mrow></mml:munderover><mml:mfrac><mml:mrow><mml:msubsup><mml:mi>f</mml:mi><mml:mi>j</mml:mi><mml:mi>T</mml:mi></mml:msubsup><mml:mo>−</mml:mo><mml:msup><mml:mover accent="true"><mml:mi>φ</mml:mi><mml:mo>¯</mml:mo></mml:mover><mml:mi>T</mml:mi></mml:msup></mml:mrow><mml:mrow><mml:mn>1</mml:mn><mml:mo>−</mml:mo><mml:msup><mml:mover accent="true"><mml:mi>φ</mml:mi><mml:mo>¯</mml:mo></mml:mover><mml:mi>T</mml:mi></mml:msup></mml:mrow></mml:mfrac><mml:mo>,</mml:mo></mml:mrow></mml:mtd></mml:mtr><mml:mtr><mml:mtd><mml:mrow><mml:msubsup><mml:mover accent="true"><mml:mi>f</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>j</mml:mi><mml:mrow><mml:mi>T</mml:mi><mml:mo>,</mml:mo><mml:mtext>stdIII</mml:mtext></mml:mrow></mml:msubsup></mml:mrow></mml:mtd><mml:mtd columnalign="left"><mml:mrow><mml:mo>=</mml:mo><mml:mfrac><mml:mrow><mml:mstyle displaystyle="true"><mml:munderover><mml:mo>∑</mml:mo><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>m</mml:mi></mml:munderover><mml:mrow><mml:msubsup><mml:mi>x</mml:mi><mml:mrow><mml:mi>i</mml:mi><mml:mi>j</mml:mi></mml:mrow><mml:mn>2</mml:mn></mml:msubsup></mml:mrow></mml:mstyle><mml:mo>−</mml:mo><mml:mo>(</mml:mo><mml:mrow><mml:mn>1</mml:mn><mml:mo>+</mml:mo><mml:mn>2</mml:mn><mml:msubsup><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup></mml:mrow><mml:mo>)</mml:mo><mml:msub><mml:mi>x</mml:mi><mml:mrow><mml:mi>i</mml:mi><mml:mi>j</mml:mi></mml:mrow></mml:msub><mml:mo>+</mml:mo><mml:mn>2</mml:mn><mml:msup><mml:mrow><mml:mo>(</mml:mo><mml:mrow><mml:msubsup><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup></mml:mrow><mml:mo>)</mml:mo></mml:mrow><mml:mn>2</mml:mn></mml:msup></mml:mrow><mml:mrow><mml:mn>2</mml:mn><mml:mstyle displaystyle="true"><mml:munderover><mml:mo>∑</mml:mo><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>m</mml:mi></mml:munderover><mml:mrow><mml:msubsup><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup><mml:mo>(</mml:mo><mml:mrow><mml:mn>1</mml:mn><mml:mo>−</mml:mo><mml:msubsup><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup></mml:mrow><mml:mo>)</mml:mo></mml:mrow></mml:mstyle></mml:mrow></mml:mfrac><mml:munderover><mml:mo>→</mml:mo><mml:mrow><mml:mi>m</mml:mi><mml:mo>→</mml:mo><mml:mi>∞</mml:mi></mml:mrow><mml:mrow><mml:mtext>a.s.</mml:mtext></mml:mrow></mml:munderover><mml:mfrac><mml:mrow><mml:msubsup><mml:mi>f</mml:mi><mml:mi>j</mml:mi><mml:mi>T</mml:mi></mml:msubsup><mml:mo>+</mml:mo><mml:msup><mml:mover accent="true"><mml:mi>φ</mml:mi><mml:mo>¯</mml:mo></mml:mover><mml:mi>T</mml:mi></mml:msup><mml:mo>−</mml:mo><mml:mn>2</mml:mn><mml:msubsup><mml:mover accent="true"><mml:mi>φ</mml:mi><mml:mo>¯</mml:mo></mml:mover><mml:mi>j</mml:mi><mml:mi>T</mml:mi></mml:msubsup></mml:mrow><mml:mrow><mml:mn>1</mml:mn><mml:mo>−</mml:mo><mml:msup><mml:mover accent="true"><mml:mi>φ</mml:mi><mml:mo>¯</mml:mo></mml:mover><mml:mi>T</mml:mi></mml:msup></mml:mrow></mml:mfrac><mml:mo>.</mml:mo></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:mrow></mml:math></alternatives> <label>(21)</label></disp-formula></p>
<p>The estimators in Eqs <xref ref-type="disp-formula" rid="pgen.1009241.e136">(18)</xref> and <xref ref-type="disp-formula" rid="pgen.1009241.e151">(21)</xref> are unbiased when <inline-formula id="pgen.1009241.e152"><alternatives><graphic id="pgen.1009241.e152g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e152" xlink:type="simple"/><mml:math display="inline" id="M152"><mml:msubsup><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup></mml:math></alternatives></inline-formula> is replaced by <inline-formula id="pgen.1009241.e153"><alternatives><graphic id="pgen.1009241.e153g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e153" xlink:type="simple"/><mml:math display="inline" id="M153"><mml:msubsup><mml:mi>p</mml:mi><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup></mml:math></alternatives></inline-formula> [<xref ref-type="bibr" rid="pgen.1009241.ref016">16</xref>, <xref ref-type="bibr" rid="pgen.1009241.ref032">32</xref>, <xref ref-type="bibr" rid="pgen.1009241.ref036">36</xref>], and are consistent when <inline-formula id="pgen.1009241.e154"><alternatives><graphic id="pgen.1009241.e154g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e154" xlink:type="simple"/><mml:math display="inline" id="M154"><mml:msubsup><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup></mml:math></alternatives></inline-formula> is consistent [<xref ref-type="bibr" rid="pgen.1009241.ref060">60</xref>]. Surprisingly, <inline-formula id="pgen.1009241.e155"><alternatives><graphic id="pgen.1009241.e155g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e155" xlink:type="simple"/><mml:math display="inline" id="M155"><mml:msubsup><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup></mml:math></alternatives></inline-formula> in <xref ref-type="disp-formula" rid="pgen.1009241.e135">Eq (17)</xref> is not consistent (it does not converge almost surely to <inline-formula id="pgen.1009241.e156"><alternatives><graphic id="pgen.1009241.e156g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e156" xlink:type="simple"/><mml:math display="inline" id="M156"><mml:msubsup><mml:mi>p</mml:mi><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup></mml:math></alternatives></inline-formula>) for arbitrary population structures, which is at the root of the bias in Eqs <xref ref-type="disp-formula" rid="pgen.1009241.e141">(19)</xref> to <xref ref-type="disp-formula" rid="pgen.1009241.e151">(21)</xref>. In particular, although <inline-formula id="pgen.1009241.e157"><alternatives><graphic id="pgen.1009241.e157g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e157" xlink:type="simple"/><mml:math display="inline" id="M157"><mml:msubsup><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup></mml:math></alternatives></inline-formula> is unbiased, its variance (<xref ref-type="supplementary-material" rid="pgen.1009241.s001">S1 Text</xref>, and some special cases shown elsewhere, <italic>e.g.</italic>, [<xref ref-type="bibr" rid="pgen.1009241.ref019">19</xref>]),
<disp-formula id="pgen.1009241.e158"><alternatives><graphic id="pgen.1009241.e158g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e158" xlink:type="simple"/><mml:math display="block" id="M158"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="right"><mml:mrow><mml:mo form="prefix">Var</mml:mo><mml:mo>(</mml:mo><mml:msubsup><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup><mml:mrow><mml:mo>|</mml:mo><mml:mi>T</mml:mi></mml:mrow><mml:mo>)</mml:mo><mml:mo>=</mml:mo><mml:msubsup><mml:mi>p</mml:mi><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup><mml:mo>(</mml:mo><mml:mn>1</mml:mn><mml:mo>-</mml:mo><mml:msubsup><mml:mi>p</mml:mi><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup><mml:mo>)</mml:mo><mml:msup><mml:mover accent="true"><mml:mi>φ</mml:mi><mml:mo>¯</mml:mo></mml:mover><mml:mi>T</mml:mi></mml:msup><mml:mo>,</mml:mo></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives> <label>(22)</label></disp-formula>
may be asymptotically non-zero as <italic>n</italic> → ∞, since <inline-formula id="pgen.1009241.e159"><alternatives><graphic id="pgen.1009241.e159g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e159" xlink:type="simple"/><mml:math display="inline" id="M159"><mml:mrow><mml:msubsup><mml:mi>p</mml:mi><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup><mml:mo>∈</mml:mo><mml:mrow><mml:mo>(</mml:mo><mml:mn>0</mml:mn><mml:mo>,</mml:mo><mml:mn>1</mml:mn><mml:mo>)</mml:mo></mml:mrow></mml:mrow></mml:math></alternatives></inline-formula> is fixed and <inline-formula id="pgen.1009241.e160"><alternatives><graphic id="pgen.1009241.e160g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e160" xlink:type="simple"/><mml:math display="inline" id="M160"><mml:mrow><mml:msub><mml:mo form="prefix" movablelimits="true">lim</mml:mo><mml:mrow><mml:mi>n</mml:mi><mml:mo>→</mml:mo><mml:mi>∞</mml:mi></mml:mrow></mml:msub><mml:msup><mml:mover accent="true"><mml:mi>φ</mml:mi><mml:mo>¯</mml:mo></mml:mover><mml:mi>T</mml:mi></mml:msup></mml:mrow></mml:math></alternatives></inline-formula> may take on any value between zero and one for arbitrary population structures. Further, <inline-formula id="pgen.1009241.e161"><alternatives><graphic id="pgen.1009241.e161g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e161" xlink:type="simple"/><mml:math display="inline" id="M161"><mml:mrow><mml:msup><mml:mover accent="true"><mml:mi>φ</mml:mi><mml:mo>¯</mml:mo></mml:mover><mml:mi>T</mml:mi></mml:msup><mml:mo>→</mml:mo><mml:mn>0</mml:mn></mml:mrow></mml:math></alternatives></inline-formula> as <italic>n</italic> → ∞ if and only if <inline-formula id="pgen.1009241.e162"><alternatives><graphic id="pgen.1009241.e162g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e162" xlink:type="simple"/><mml:math display="inline" id="M162"><mml:mrow><mml:msubsup><mml:mi>φ</mml:mi><mml:mrow><mml:mi>j</mml:mi><mml:mi>k</mml:mi></mml:mrow><mml:mi>T</mml:mi></mml:msubsup><mml:mo>=</mml:mo><mml:mn>0</mml:mn></mml:mrow></mml:math></alternatives></inline-formula> for almost all pairs of individuals (<italic>j</italic>, <italic>k</italic>). These observations hold for any weights such that <inline-formula id="pgen.1009241.e163"><alternatives><graphic id="pgen.1009241.e163g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e163" xlink:type="simple"/><mml:math display="inline" id="M163"><mml:mrow><mml:msub><mml:mi>w</mml:mi><mml:mi>j</mml:mi></mml:msub><mml:mo>&gt;</mml:mo><mml:mn>0</mml:mn><mml:mo>,</mml:mo><mml:msubsup><mml:mo>∑</mml:mo><mml:mrow><mml:mi>j</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>n</mml:mi></mml:msubsup><mml:msub><mml:mi>w</mml:mi><mml:mi>j</mml:mi></mml:msub><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow></mml:math></alternatives></inline-formula>. An important consequence is that the plug-in estimate of <inline-formula id="pgen.1009241.e164"><alternatives><graphic id="pgen.1009241.e164g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e164" xlink:type="simple"/><mml:math display="inline" id="M164"><mml:mrow><mml:msubsup><mml:mi>p</mml:mi><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup><mml:mo>(</mml:mo><mml:mn>1</mml:mn><mml:mo>-</mml:mo><mml:msubsup><mml:mi>p</mml:mi><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup><mml:mo>)</mml:mo></mml:mrow></mml:math></alternatives></inline-formula> is biased (<xref ref-type="supplementary-material" rid="pgen.1009241.s001">S1 Text</xref>), 
<disp-formula id="pgen.1009241.e165"><alternatives><graphic id="pgen.1009241.e165g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e165" xlink:type="simple"/><mml:math display="block" id="M165"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="right"><mml:mrow><mml:mo form="prefix">E</mml:mo><mml:mo>[</mml:mo><mml:msubsup><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup><mml:mo>(</mml:mo><mml:mn>1</mml:mn><mml:mo>-</mml:mo><mml:msubsup><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup><mml:mo>)</mml:mo><mml:mrow><mml:mo>|</mml:mo><mml:mi>T</mml:mi></mml:mrow><mml:mo>]</mml:mo><mml:mo>=</mml:mo><mml:msubsup><mml:mi>p</mml:mi><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup><mml:mo>(</mml:mo><mml:mn>1</mml:mn><mml:mo>-</mml:mo><mml:msubsup><mml:mi>p</mml:mi><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup><mml:mo>)</mml:mo><mml:mo>(</mml:mo><mml:mn>1</mml:mn><mml:mo>-</mml:mo><mml:msup><mml:mover accent="true"><mml:mi>φ</mml:mi><mml:mo>¯</mml:mo></mml:mover><mml:mi>T</mml:mi></mml:msup><mml:mo>)</mml:mo><mml:mo>,</mml:mo></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives></disp-formula>
which is present in all estimators we have studied.</p>
</sec>
<sec id="sec015">
<title>Estimation of coancestry coefficients from IAFs</title>
<p>Here we form a coancestry coefficient estimator analogous to <xref ref-type="disp-formula" rid="pgen.1009241.e136">Eq (18)</xref> but using IAFs. Assuming the moments in <xref ref-type="disp-formula" rid="pgen.1009241.e048">Eq (6)</xref>, this estimator and its limit are 
<disp-formula id="pgen.1009241.e166"><alternatives><graphic id="pgen.1009241.e166g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e166" xlink:type="simple"/><mml:math display="block" id="M166"><mml:msubsup><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup><mml:mrow><mml:mo>=</mml:mo><mml:munderover><mml:mo>∑</mml:mo><mml:mrow><mml:mi>j</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>n</mml:mi></mml:munderover><mml:msub><mml:mi>w</mml:mi><mml:mi>j</mml:mi></mml:msub><mml:msub><mml:mi>π</mml:mi><mml:mrow><mml:mi>i</mml:mi><mml:mi>j</mml:mi></mml:mrow></mml:msub><mml:mo>,</mml:mo></mml:mrow></mml:math></alternatives> <label>(23)</label></disp-formula>
<disp-formula id="pgen.1009241.e400"><alternatives><graphic id="pgen.1009241.e400g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e400" xlink:type="simple"/><mml:math display="block" id="M400"><mml:msubsup><mml:mover accent="true"><mml:mi>θ</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mi>j</mml:mi><mml:mi>k</mml:mi></mml:mrow><mml:mrow><mml:mi>T</mml:mi><mml:mo>,</mml:mo><mml:mtext>std</mml:mtext></mml:mrow></mml:msubsup><mml:mrow><mml:mo>=</mml:mo><mml:mfrac><mml:mrow><mml:mstyle displaystyle="true"><mml:munderover><mml:mo>∑</mml:mo><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>m</mml:mi></mml:munderover></mml:mstyle><mml:mo>(</mml:mo><mml:msub><mml:mi>π</mml:mi><mml:mrow><mml:mi>i</mml:mi><mml:mi>j</mml:mi></mml:mrow></mml:msub><mml:mo>-</mml:mo><mml:msubsup><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup><mml:mo>)</mml:mo><mml:mo>(</mml:mo><mml:msub><mml:mi>π</mml:mi><mml:mrow><mml:mi>i</mml:mi><mml:mi>k</mml:mi></mml:mrow></mml:msub><mml:mo>-</mml:mo><mml:msubsup><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup><mml:mo>)</mml:mo></mml:mrow><mml:mrow><mml:mstyle displaystyle="true"><mml:munderover><mml:mo>∑</mml:mo><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>m</mml:mi></mml:munderover></mml:mstyle><mml:msubsup><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup><mml:mo>(</mml:mo><mml:mn>1</mml:mn><mml:mo>-</mml:mo><mml:msubsup><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup><mml:mo>)</mml:mo></mml:mrow></mml:mfrac><mml:munderover><mml:mo>→</mml:mo><mml:mrow><mml:mi>m</mml:mi><mml:mo>→</mml:mo><mml:mi>∞</mml:mi></mml:mrow><mml:mtext>a.s.</mml:mtext></mml:munderover><mml:mfrac><mml:mrow><mml:msubsup><mml:mi>θ</mml:mi><mml:mrow><mml:mi>j</mml:mi><mml:mi>k</mml:mi></mml:mrow><mml:mi>T</mml:mi></mml:msubsup><mml:mo>-</mml:mo><mml:msubsup><mml:mover accent="true"><mml:mi>θ</mml:mi><mml:mo>¯</mml:mo></mml:mover><mml:mi>j</mml:mi><mml:mi>T</mml:mi></mml:msubsup><mml:mo>-</mml:mo><mml:msubsup><mml:mover accent="true"><mml:mi>θ</mml:mi><mml:mo>¯</mml:mo></mml:mover><mml:mi>k</mml:mi><mml:mi>T</mml:mi></mml:msubsup><mml:mo>+</mml:mo><mml:msup><mml:mover accent="true"><mml:mi>θ</mml:mi><mml:mo>¯</mml:mo></mml:mover><mml:mi>T</mml:mi></mml:msup></mml:mrow><mml:mrow><mml:mn>1</mml:mn><mml:mo>-</mml:mo><mml:msup><mml:mover accent="true"><mml:mi>θ</mml:mi><mml:mo>¯</mml:mo></mml:mover><mml:mi>T</mml:mi></mml:msup></mml:mrow></mml:mfrac><mml:mo>,</mml:mo></mml:mrow></mml:math></alternatives> <label>(24)</label></disp-formula>
where <inline-formula id="pgen.1009241.e167"><alternatives><graphic id="pgen.1009241.e167g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e167" xlink:type="simple"/><mml:math display="inline" id="M167"><mml:mrow><mml:msubsup><mml:mover accent="true"><mml:mi>θ</mml:mi><mml:mo>¯</mml:mo></mml:mover><mml:mi>j</mml:mi><mml:mi>T</mml:mi></mml:msubsup><mml:mo>=</mml:mo><mml:msubsup><mml:mo>∑</mml:mo><mml:mrow><mml:mi>k</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>n</mml:mi></mml:msubsup><mml:msub><mml:mi>w</mml:mi><mml:mi>k</mml:mi></mml:msub><mml:msubsup><mml:mi>θ</mml:mi><mml:mrow><mml:mi>j</mml:mi><mml:mi>k</mml:mi></mml:mrow><mml:mi>T</mml:mi></mml:msubsup></mml:mrow></mml:math></alternatives></inline-formula> and <inline-formula id="pgen.1009241.e168"><alternatives><graphic id="pgen.1009241.e168g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e168" xlink:type="simple"/><mml:math display="inline" id="M168"><mml:mrow><mml:msup><mml:mover accent="true"><mml:mi>θ</mml:mi><mml:mo>¯</mml:mo></mml:mover><mml:mi>T</mml:mi></mml:msup><mml:mo>=</mml:mo><mml:msubsup><mml:mo>∑</mml:mo><mml:mrow><mml:mi>j</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>n</mml:mi></mml:msubsup><mml:msubsup><mml:mo>∑</mml:mo><mml:mrow><mml:mi>k</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>n</mml:mi></mml:msubsup><mml:msub><mml:mi>w</mml:mi><mml:mi>j</mml:mi></mml:msub><mml:msub><mml:mi>w</mml:mi><mml:mi>k</mml:mi></mml:msub><mml:msubsup><mml:mi>θ</mml:mi><mml:mrow><mml:mi>j</mml:mi><mml:mi>k</mml:mi></mml:mrow><mml:mi>T</mml:mi></mml:msubsup></mml:mrow></mml:math></alternatives></inline-formula> are analogous to <inline-formula id="pgen.1009241.e169"><alternatives><graphic id="pgen.1009241.e169g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e169" xlink:type="simple"/><mml:math display="inline" id="M169"><mml:msubsup><mml:mover accent="true"><mml:mi>φ</mml:mi><mml:mo>¯</mml:mo></mml:mover><mml:mi>j</mml:mi><mml:mi>T</mml:mi></mml:msubsup></mml:math></alternatives></inline-formula> and <inline-formula id="pgen.1009241.e170"><alternatives><graphic id="pgen.1009241.e170g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e170" xlink:type="simple"/><mml:math display="inline" id="M170"><mml:msup><mml:mover accent="true"><mml:mi>φ</mml:mi><mml:mo>¯</mml:mo></mml:mover><mml:mi>T</mml:mi></mml:msup></mml:math></alternatives></inline-formula>. <xref ref-type="disp-formula" rid="pgen.1009241.e166">Eq (23)</xref> generalizes <xref ref-type="disp-formula" rid="pgen.1009241.e078">Eq (11)</xref> for arbitrary weights. Thus, use of IAFs does not ameliorate the estimation problems we have identified for genotypes. Like <xref ref-type="disp-formula" rid="pgen.1009241.e158">Eq (22)</xref>, <inline-formula id="pgen.1009241.e171"><alternatives><graphic id="pgen.1009241.e171g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e171" xlink:type="simple"/><mml:math display="inline" id="M171"><mml:msubsup><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup></mml:math></alternatives></inline-formula> in <xref ref-type="disp-formula" rid="pgen.1009241.e166">Eq (23)</xref> is not consistent because <inline-formula id="pgen.1009241.e172"><alternatives><graphic id="pgen.1009241.e172g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e172" xlink:type="simple"/><mml:math display="inline" id="M172"><mml:mrow><mml:mtext>Var</mml:mtext><mml:mo>(</mml:mo><mml:mrow><mml:msubsup><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup><mml:mo>|</mml:mo><mml:mi>T</mml:mi></mml:mrow><mml:mo>)</mml:mo><mml:mo>=</mml:mo><mml:msubsup><mml:mi>p</mml:mi><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup><mml:mo>(</mml:mo><mml:mrow><mml:mn>1</mml:mn><mml:mo>−</mml:mo><mml:msubsup><mml:mi>p</mml:mi><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup></mml:mrow><mml:mo>)</mml:mo><mml:msup><mml:mover accent="true"><mml:mi>θ</mml:mi><mml:mo>¯</mml:mo></mml:mover><mml:mi>T</mml:mi></mml:msup></mml:mrow></mml:math></alternatives></inline-formula> may not converge to zero for arbitrary population structures, which causes the bias observed in <xref ref-type="disp-formula" rid="pgen.1009241.e400">Eq (24)</xref>.</p>
</sec>
<sec id="sec016">
<title><italic>F</italic><sub>ST</sub> estimator based on the standard kinship estimator</title>
<p>Since the generalized <italic>F</italic><sub>ST</sub> is defined as a mean inbreeding coefficient in <xref ref-type="disp-formula" rid="pgen.1009241.e032">Eq (3)</xref>, here we study the <italic>F</italic><sub>ST</sub> estimator constructed as <inline-formula id="pgen.1009241.e173"><alternatives><graphic id="pgen.1009241.e173g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e173" xlink:type="simple"/><mml:math display="inline" id="M173"><mml:mrow><mml:msubsup><mml:mover accent="true"><mml:mi>F</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mtext>ST</mml:mtext></mml:mrow><mml:mtext>std</mml:mtext></mml:msubsup><mml:mo>=</mml:mo><mml:msubsup><mml:mo>∑</mml:mo><mml:mrow><mml:mi>j</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>n</mml:mi></mml:msubsup><mml:msub><mml:mi>w</mml:mi><mml:mi>j</mml:mi></mml:msub><mml:msubsup><mml:mover accent="true"><mml:mi>f</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mi>j</mml:mi></mml:mrow><mml:mrow><mml:mi>T</mml:mi><mml:mo>,</mml:mo><mml:mtext>std</mml:mtext></mml:mrow></mml:msubsup></mml:mrow></mml:math></alternatives></inline-formula> where <inline-formula id="pgen.1009241.e174"><alternatives><graphic id="pgen.1009241.e174g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e174" xlink:type="simple"/><mml:math display="inline" id="M174"><mml:msubsup><mml:mover accent="true"><mml:mi>f</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mi>j</mml:mi></mml:mrow><mml:mrow><mml:mi>T</mml:mi><mml:mo>,</mml:mo><mml:mtext>std</mml:mtext></mml:mrow></mml:msubsup></mml:math></alternatives></inline-formula> is the inbreeding estimator derived from the standard kinship estimator. Although <inline-formula id="pgen.1009241.e175"><alternatives><graphic id="pgen.1009241.e175g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e175" xlink:type="simple"/><mml:math display="inline" id="M175"><mml:msubsup><mml:mover accent="true"><mml:mi>f</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mi>j</mml:mi></mml:mrow><mml:mrow><mml:mi>T</mml:mi><mml:mo>,</mml:mo><mml:mtext>std</mml:mtext></mml:mrow></mml:msubsup></mml:math></alternatives></inline-formula> is biased, we nevertheless plug it into our definition of <italic>F</italic><sub>ST</sub> so that we may study how bias manifests. Note that we do not recommend utilizing this <italic>F</italic><sub>ST</sub> estimator in practice, but we find these results informative for identifying how to proceed in deriving new estimators in the following section.</p>
<p>Remarkably, the three <inline-formula id="pgen.1009241.e176"><alternatives><graphic id="pgen.1009241.e176g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e176" xlink:type="simple"/><mml:math display="inline" id="M176"><mml:msubsup><mml:mi>f</mml:mi><mml:mrow><mml:mi>j</mml:mi></mml:mrow><mml:mi>T</mml:mi></mml:msubsup></mml:math></alternatives></inline-formula> estimators in Eqs <xref ref-type="disp-formula" rid="pgen.1009241.e146">(20)</xref> and <xref ref-type="disp-formula" rid="pgen.1009241.e151">(21)</xref> give exactly the same plug-in <inline-formula id="pgen.1009241.e177"><alternatives><graphic id="pgen.1009241.e177g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e177" xlink:type="simple"/><mml:math display="inline" id="M177"><mml:msubsup><mml:mover accent="true"><mml:mi>F</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mtext>ST</mml:mtext></mml:mrow><mml:mtext>std</mml:mtext></mml:msubsup></mml:math></alternatives></inline-formula> if the weights in <italic>F</italic><sub>ST</sub> and <inline-formula id="pgen.1009241.e178"><alternatives><graphic id="pgen.1009241.e178g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e178" xlink:type="simple"/><mml:math display="inline" id="M178"><mml:msubsup><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup></mml:math></alternatives></inline-formula> in <xref ref-type="disp-formula" rid="pgen.1009241.e135">Eq (17)</xref> match, namely
<disp-formula id="pgen.1009241.e179"><alternatives><graphic id="pgen.1009241.e179g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e179" xlink:type="simple"/><mml:math display="block" id="M179"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="right"><mml:mrow><mml:msubsup><mml:mover accent="true"><mml:mi>F</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mtext>ST</mml:mtext></mml:mrow><mml:mtext>std</mml:mtext></mml:msubsup><mml:mo>=</mml:mo><mml:mstyle displaystyle="true"><mml:munderover><mml:mo>∑</mml:mo><mml:mrow><mml:mi>j</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>n</mml:mi></mml:munderover></mml:mstyle><mml:msub><mml:mi>w</mml:mi><mml:mi>j</mml:mi></mml:msub><mml:msubsup><mml:mover accent="true"><mml:mi>f</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mi>j</mml:mi></mml:mrow><mml:mrow><mml:mi>T</mml:mi><mml:mo>,</mml:mo><mml:mtext>std</mml:mtext></mml:mrow></mml:msubsup><mml:mo>=</mml:mo><mml:mfrac><mml:mrow><mml:mstyle displaystyle="true"><mml:munderover><mml:mo>∑</mml:mo><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>m</mml:mi></mml:munderover></mml:mstyle><mml:mstyle displaystyle="true"><mml:munderover><mml:mo>∑</mml:mo><mml:mrow><mml:mi>j</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>n</mml:mi></mml:munderover></mml:mstyle><mml:msub><mml:mi>w</mml:mi><mml:mi>j</mml:mi></mml:msub><mml:msup><mml:mrow><mml:mo>(</mml:mo><mml:msub><mml:mi>x</mml:mi><mml:mrow><mml:mi>i</mml:mi><mml:mi>j</mml:mi></mml:mrow></mml:msub><mml:mo>-</mml:mo><mml:mn>2</mml:mn><mml:msubsup><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup><mml:mo>)</mml:mo></mml:mrow><mml:mn>2</mml:mn></mml:msup></mml:mrow><mml:mrow><mml:mn>2</mml:mn><mml:mstyle displaystyle="true"><mml:munderover><mml:mo>∑</mml:mo><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>m</mml:mi></mml:munderover></mml:mstyle><mml:msubsup><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup><mml:mo>(</mml:mo><mml:mn>1</mml:mn><mml:mo>-</mml:mo><mml:msubsup><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup><mml:mo>)</mml:mo></mml:mrow></mml:mfrac><mml:mo>-</mml:mo><mml:mn>1</mml:mn><mml:munderover><mml:mo>→</mml:mo><mml:mrow><mml:mi>m</mml:mi><mml:mo>→</mml:mo><mml:mi>∞</mml:mi></mml:mrow><mml:mtext>a.s.</mml:mtext></mml:munderover><mml:mfrac><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mtext>ST</mml:mtext></mml:msub><mml:mo>-</mml:mo><mml:msup><mml:mover accent="true"><mml:mi>φ</mml:mi><mml:mo>¯</mml:mo></mml:mover><mml:mi>T</mml:mi></mml:msup></mml:mrow><mml:mrow><mml:mn>1</mml:mn><mml:mo>-</mml:mo><mml:msup><mml:mover accent="true"><mml:mi>φ</mml:mi><mml:mo>¯</mml:mo></mml:mover><mml:mi>T</mml:mi></mml:msup></mml:mrow></mml:mfrac><mml:mo>,</mml:mo></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives> <label>(25)</label></disp-formula>
where the limit assumes locally-outbred individuals so <xref ref-type="disp-formula" rid="pgen.1009241.e042">Eq (4)</xref> holds. The analogous <italic>F</italic><sub>ST</sub> estimator for IAFs and its limit are
<disp-formula id="pgen.1009241.e180"><alternatives><graphic id="pgen.1009241.e180g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e180" xlink:type="simple"/><mml:math display="block" id="M180"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="right"><mml:mrow><mml:msubsup><mml:mover accent="true"><mml:mi>F</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mtext>ST</mml:mtext></mml:mrow><mml:mtext>std</mml:mtext></mml:msubsup><mml:mo>=</mml:mo><mml:mstyle displaystyle="true"><mml:munderover><mml:mo>∑</mml:mo><mml:mrow><mml:mi>j</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>n</mml:mi></mml:munderover></mml:mstyle><mml:msub><mml:mi>w</mml:mi><mml:mi>j</mml:mi></mml:msub><mml:msubsup><mml:mover accent="true"><mml:mi>θ</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mi>j</mml:mi><mml:mi>j</mml:mi></mml:mrow><mml:mrow><mml:mi>T</mml:mi><mml:mo>,</mml:mo><mml:mtext>std</mml:mtext></mml:mrow></mml:msubsup><mml:mo>=</mml:mo><mml:mfrac><mml:mrow><mml:mstyle displaystyle="true"><mml:munderover><mml:mo>∑</mml:mo><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>m</mml:mi></mml:munderover></mml:mstyle><mml:mstyle displaystyle="true"><mml:munderover><mml:mo>∑</mml:mo><mml:mrow><mml:mi>j</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>n</mml:mi></mml:munderover></mml:mstyle><mml:msub><mml:mi>w</mml:mi><mml:mi>j</mml:mi></mml:msub><mml:msup><mml:mrow><mml:mo>(</mml:mo><mml:msub><mml:mi>π</mml:mi><mml:mrow><mml:mi>i</mml:mi><mml:mi>j</mml:mi></mml:mrow></mml:msub><mml:mo>-</mml:mo><mml:msubsup><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup><mml:mo>)</mml:mo></mml:mrow><mml:mn>2</mml:mn></mml:msup></mml:mrow><mml:mrow><mml:mstyle displaystyle="true"><mml:munderover><mml:mo>∑</mml:mo><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>m</mml:mi></mml:munderover></mml:mstyle><mml:msubsup><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup><mml:mo>(</mml:mo><mml:mn>1</mml:mn><mml:mo>-</mml:mo><mml:msubsup><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup><mml:mo>)</mml:mo></mml:mrow></mml:mfrac><mml:munderover><mml:mo>→</mml:mo><mml:mrow><mml:mi>m</mml:mi><mml:mo>→</mml:mo><mml:mi>∞</mml:mi></mml:mrow><mml:mtext>a.s.</mml:mtext></mml:munderover><mml:mfrac><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mtext>ST</mml:mtext></mml:msub><mml:mo>-</mml:mo><mml:msup><mml:mover accent="true"><mml:mi>θ</mml:mi><mml:mo>¯</mml:mo></mml:mover><mml:mi>T</mml:mi></mml:msup></mml:mrow><mml:mrow><mml:mn>1</mml:mn><mml:mo>-</mml:mo><mml:msup><mml:mover accent="true"><mml:mi>θ</mml:mi><mml:mo>¯</mml:mo></mml:mover><mml:mi>T</mml:mi></mml:msup></mml:mrow></mml:mfrac><mml:mo>.</mml:mo></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives> <label>(26)</label></disp-formula>
The estimators in Eqs <xref ref-type="disp-formula" rid="pgen.1009241.e179">(25)</xref> and <xref ref-type="disp-formula" rid="pgen.1009241.e180">(26)</xref> for individuals and their limits resemble those of classical <italic>F</italic><sub>ST</sub> estimators for populations of the form <inline-formula id="pgen.1009241.e181"><alternatives><graphic id="pgen.1009241.e181g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e181" xlink:type="simple"/><mml:math display="inline" id="M181"><mml:mfrac><mml:msubsup><mml:mi>σ</mml:mi><mml:mi>p</mml:mi><mml:mn>2</mml:mn></mml:msubsup><mml:mrow><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>¯</mml:mo></mml:mover><mml:mrow><mml:mo>(</mml:mo><mml:mn>1</mml:mn><mml:mo>-</mml:mo><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>¯</mml:mo></mml:mover><mml:mo>)</mml:mo></mml:mrow></mml:mrow></mml:mfrac></mml:math></alternatives></inline-formula> [<xref ref-type="bibr" rid="pgen.1009241.ref004">4</xref>, <xref ref-type="bibr" rid="pgen.1009241.ref005">5</xref>]. <inline-formula id="pgen.1009241.e182"><alternatives><graphic id="pgen.1009241.e182g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e182" xlink:type="simple"/><mml:math display="inline" id="M182"><mml:msubsup><mml:mover accent="true"><mml:mi>F</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mtext>ST</mml:mtext></mml:mrow><mml:mtext>std</mml:mtext></mml:msubsup></mml:math></alternatives></inline-formula> in <xref ref-type="disp-formula" rid="pgen.1009241.e180">Eq (26)</xref> for subpopulations <italic>j</italic> with uniform weight and one locus is also <italic>G</italic><sub>ST</sub> for two alleles [<xref ref-type="bibr" rid="pgen.1009241.ref075">75</xref>]. Compared to <inline-formula id="pgen.1009241.e183"><alternatives><graphic id="pgen.1009241.e183g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e183" xlink:type="simple"/><mml:math display="inline" id="M183"><mml:msubsup><mml:mover accent="true"><mml:mi>F</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mtext>ST</mml:mtext></mml:mrow><mml:mtext>indep</mml:mtext></mml:msubsup></mml:math></alternatives></inline-formula> in <xref ref-type="disp-formula" rid="pgen.1009241.e080">Eq (13)</xref>, <inline-formula id="pgen.1009241.e184"><alternatives><graphic id="pgen.1009241.e184g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e184" xlink:type="simple"/><mml:math display="inline" id="M184"><mml:msubsup><mml:mover accent="true"><mml:mi>F</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mtext>ST</mml:mtext></mml:mrow><mml:mtext>std</mml:mtext></mml:msubsup></mml:math></alternatives></inline-formula> in <xref ref-type="disp-formula" rid="pgen.1009241.e180">Eq (26)</xref> admits arbitrary weights and, by forgoing bias correction under the independent subpopulations model, is a simpler target of study.</p>
<p>Like <inline-formula id="pgen.1009241.e185"><alternatives><graphic id="pgen.1009241.e185g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e185" xlink:type="simple"/><mml:math display="inline" id="M185"><mml:msubsup><mml:mover accent="true"><mml:mi>F</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mtext>ST</mml:mtext></mml:mrow><mml:mtext>indep</mml:mtext></mml:msubsup></mml:math></alternatives></inline-formula> in <xref ref-type="disp-formula" rid="pgen.1009241.e080">Eq (13)</xref>, <inline-formula id="pgen.1009241.e186"><alternatives><graphic id="pgen.1009241.e186g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e186" xlink:type="simple"/><mml:math display="inline" id="M186"><mml:msubsup><mml:mover accent="true"><mml:mi>F</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mtext>ST</mml:mtext></mml:mrow><mml:mtext>std</mml:mtext></mml:msubsup></mml:math></alternatives></inline-formula> in Eqs <xref ref-type="disp-formula" rid="pgen.1009241.e179">(25)</xref> and <xref ref-type="disp-formula" rid="pgen.1009241.e180">(26)</xref> are downwardly biased since <inline-formula id="pgen.1009241.e187"><alternatives><graphic id="pgen.1009241.e187g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e187" xlink:type="simple"/><mml:math display="inline" id="M187"><mml:mrow><mml:mn>0</mml:mn><mml:mo>≤</mml:mo><mml:msup><mml:mover accent="true"><mml:mi>φ</mml:mi><mml:mo>¯</mml:mo></mml:mover><mml:mi>T</mml:mi></mml:msup><mml:mo>,</mml:mo><mml:msup><mml:mover accent="true"><mml:mi>θ</mml:mi><mml:mo>¯</mml:mo></mml:mover><mml:mi>T</mml:mi></mml:msup></mml:mrow></mml:math></alternatives></inline-formula>. <inline-formula id="pgen.1009241.e188"><alternatives><graphic id="pgen.1009241.e188g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e188" xlink:type="simple"/><mml:math display="inline" id="M188"><mml:msubsup><mml:mover accent="true"><mml:mi>F</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mtext>ST</mml:mtext></mml:mrow><mml:mtext>std</mml:mtext></mml:msubsup></mml:math></alternatives></inline-formula> in <xref ref-type="disp-formula" rid="pgen.1009241.e180">Eq (26)</xref> may converge arbitrarily close to zero since <inline-formula id="pgen.1009241.e189"><alternatives><graphic id="pgen.1009241.e189g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e189" xlink:type="simple"/><mml:math display="inline" id="M189"><mml:msup><mml:mover accent="true"><mml:mi>θ</mml:mi><mml:mo>¯</mml:mo></mml:mover><mml:mi>T</mml:mi></mml:msup></mml:math></alternatives></inline-formula> can be arbitrarily close to <italic>F</italic><sub>ST</sub> (<xref ref-type="supplementary-material" rid="pgen.1009241.s001">S1 Text</xref>). Moreover, although <inline-formula id="pgen.1009241.e190"><alternatives><graphic id="pgen.1009241.e190g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e190" xlink:type="simple"/><mml:math display="inline" id="M190"><mml:mrow><mml:msup><mml:mover accent="true"><mml:mi>φ</mml:mi><mml:mo>¯</mml:mo></mml:mover><mml:mi>T</mml:mi></mml:msup><mml:mo>≈</mml:mo><mml:msup><mml:mover accent="true"><mml:mi>θ</mml:mi><mml:mo>¯</mml:mo></mml:mover><mml:mi>T</mml:mi></mml:msup></mml:mrow></mml:math></alternatives></inline-formula> for large <italic>n</italic> (see <xref ref-type="disp-formula" rid="pgen.1009241.e051">Eq (8)</xref> and panel “Coancestry in Terms of Kinship” in <xref ref-type="fig" rid="pgen.1009241.g001">Fig 1</xref>), in extreme cases <inline-formula id="pgen.1009241.e191"><alternatives><graphic id="pgen.1009241.e191g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e191" xlink:type="simple"/><mml:math display="inline" id="M191"><mml:msup><mml:mover accent="true"><mml:mi>φ</mml:mi><mml:mo>¯</mml:mo></mml:mover><mml:mi>T</mml:mi></mml:msup></mml:math></alternatives></inline-formula> can exceed <italic>F</italic><sub>ST</sub> under the coancestry model (where <inline-formula id="pgen.1009241.e192"><alternatives><graphic id="pgen.1009241.e192g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e192" xlink:type="simple"/><mml:math display="inline" id="M192"><mml:mrow><mml:msup><mml:mover accent="true"><mml:mi>θ</mml:mi><mml:mo>¯</mml:mo></mml:mover><mml:mi>T</mml:mi></mml:msup><mml:mo>≤</mml:mo><mml:msup><mml:mover accent="true"><mml:mi>φ</mml:mi><mml:mo>¯</mml:mo></mml:mover><mml:mi>T</mml:mi></mml:msup></mml:mrow></mml:math></alternatives></inline-formula>) and also under extreme local kinship, where <inline-formula id="pgen.1009241.e193"><alternatives><graphic id="pgen.1009241.e193g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e193" xlink:type="simple"/><mml:math display="inline" id="M193"><mml:msubsup><mml:mover accent="true"><mml:mi>F</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mtext>ST</mml:mtext></mml:mrow><mml:mtext>std</mml:mtext></mml:msubsup></mml:math></alternatives></inline-formula> in <xref ref-type="disp-formula" rid="pgen.1009241.e179">Eq (25)</xref> converges to a negative value.</p>
</sec>
<sec id="sec017">
<title>Adjusted consistent oracle <italic>F</italic><sub>ST</sub> estimators and the “bias coefficient”</title>
<p>Here we explore two adjustments to <inline-formula id="pgen.1009241.e194"><alternatives><graphic id="pgen.1009241.e194g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e194" xlink:type="simple"/><mml:math display="inline" id="M194"><mml:msubsup><mml:mover accent="true"><mml:mi>F</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mtext>ST</mml:mtext></mml:mrow><mml:mtext>std</mml:mtext></mml:msubsup></mml:math></alternatives></inline-formula> from IAFs in <xref ref-type="disp-formula" rid="pgen.1009241.e180">Eq (26)</xref> that rely on having minimal additional information needed to correct its bias. These “oracle” approaches require information that is not known in practice, but this exercise helps us understand the problem more deeply and finds further connections between the various <italic>F</italic><sub>ST</sub> estimators.</p>
<p>If <inline-formula id="pgen.1009241.e195"><alternatives><graphic id="pgen.1009241.e195g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e195" xlink:type="simple"/><mml:math display="inline" id="M195"><mml:msup><mml:mover accent="true"><mml:mi>θ</mml:mi><mml:mo>¯</mml:mo></mml:mover><mml:mi>T</mml:mi></mml:msup></mml:math></alternatives></inline-formula> is known, the bias in <xref ref-type="disp-formula" rid="pgen.1009241.e180">Eq (26)</xref> can be reversed, yielding the consistent estimator
<disp-formula id="pgen.1009241.e196"><alternatives><graphic id="pgen.1009241.e196g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e196" xlink:type="simple"/><mml:math display="block" id="M196"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="right"><mml:mrow><mml:msubsup><mml:mover accent="true"><mml:mi>F</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mtext>ST</mml:mtext></mml:mrow><mml:mo>′</mml:mo></mml:msubsup><mml:mo>=</mml:mo><mml:msubsup><mml:mover accent="true"><mml:mi>F</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mtext>ST</mml:mtext></mml:mrow><mml:mtext>std</mml:mtext></mml:msubsup><mml:mrow><mml:mo>(</mml:mo><mml:mn>1</mml:mn><mml:mo>-</mml:mo><mml:msup><mml:mover accent="true"><mml:mi>θ</mml:mi><mml:mo>¯</mml:mo></mml:mover><mml:mi>T</mml:mi></mml:msup><mml:mo>)</mml:mo></mml:mrow><mml:mo>+</mml:mo><mml:msup><mml:mover accent="true"><mml:mi>θ</mml:mi><mml:mo>¯</mml:mo></mml:mover><mml:mi>T</mml:mi></mml:msup><mml:munderover><mml:mo>→</mml:mo><mml:mrow><mml:mi>m</mml:mi><mml:mo>→</mml:mo><mml:mi>∞</mml:mi></mml:mrow><mml:mtext>a.s.</mml:mtext></mml:munderover><mml:msub><mml:mi>F</mml:mi><mml:mtext>ST</mml:mtext></mml:msub><mml:mo>.</mml:mo></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives> <label>(27)</label></disp-formula>
Consistent estimates are also possible if a scaled version of <inline-formula id="pgen.1009241.e197"><alternatives><graphic id="pgen.1009241.e197g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e197" xlink:type="simple"/><mml:math display="inline" id="M197"><mml:msup><mml:mover accent="true"><mml:mi>θ</mml:mi><mml:mo>¯</mml:mo></mml:mover><mml:mi>T</mml:mi></mml:msup></mml:math></alternatives></inline-formula> is known, namely
<disp-formula id="pgen.1009241.e198"><alternatives><graphic id="pgen.1009241.e198g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e198" xlink:type="simple"/><mml:math display="block" id="M198"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="right"><mml:mrow><mml:msup><mml:mi>s</mml:mi><mml:mi>T</mml:mi></mml:msup><mml:mo>=</mml:mo><mml:mfrac><mml:msup><mml:mover accent="true"><mml:mi>θ</mml:mi><mml:mo>¯</mml:mo></mml:mover><mml:mi>T</mml:mi></mml:msup><mml:msub><mml:mi>F</mml:mi><mml:mtext>ST</mml:mtext></mml:msub></mml:mfrac><mml:mo>=</mml:mo><mml:mfrac><mml:mrow><mml:mstyle displaystyle="true"><mml:munderover><mml:mo>∑</mml:mo><mml:mrow><mml:mi>j</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>n</mml:mi></mml:munderover></mml:mstyle><mml:mstyle displaystyle="true"><mml:munderover><mml:mo>∑</mml:mo><mml:mrow><mml:mi>k</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>n</mml:mi></mml:munderover></mml:mstyle><mml:msub><mml:mi>w</mml:mi><mml:mi>j</mml:mi></mml:msub><mml:msub><mml:mi>w</mml:mi><mml:mi>k</mml:mi></mml:msub><mml:msubsup><mml:mi>θ</mml:mi><mml:mrow><mml:mi>j</mml:mi><mml:mi>k</mml:mi></mml:mrow><mml:mi>T</mml:mi></mml:msubsup></mml:mrow><mml:mrow><mml:mstyle displaystyle="true"><mml:munderover><mml:mo>∑</mml:mo><mml:mrow><mml:mi>j</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>n</mml:mi></mml:munderover></mml:mstyle><mml:msub><mml:mi>w</mml:mi><mml:mi>j</mml:mi></mml:msub><mml:msubsup><mml:mi>θ</mml:mi><mml:mrow><mml:mi>j</mml:mi><mml:mi>j</mml:mi></mml:mrow><mml:mi>T</mml:mi></mml:msubsup></mml:mrow></mml:mfrac><mml:mo>,</mml:mo></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives> <label>(28)</label></disp-formula>
which we call the “bias coefficient” and which has interesting properties. The bias coefficient quantifies the departure from the independent subpopulations model by comparing the mean coancestry (<inline-formula id="pgen.1009241.e199"><alternatives><graphic id="pgen.1009241.e199g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e199" xlink:type="simple"/><mml:math display="inline" id="M199"><mml:msubsup><mml:mi>θ</mml:mi><mml:mrow><mml:mi>j</mml:mi><mml:mi>k</mml:mi></mml:mrow><mml:mi>T</mml:mi></mml:msubsup></mml:math></alternatives></inline-formula>) to the mean inbreeding coefficient (<inline-formula id="pgen.1009241.e200"><alternatives><graphic id="pgen.1009241.e200g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e200" xlink:type="simple"/><mml:math display="inline" id="M200"><mml:msubsup><mml:mi>θ</mml:mi><mml:mrow><mml:mi>j</mml:mi><mml:mi>j</mml:mi></mml:mrow><mml:mi>T</mml:mi></mml:msubsup></mml:math></alternatives></inline-formula>), and given <italic>F</italic><sub>ST</sub> &gt; 0 satisfies 0 &lt; <italic>s</italic><sup><italic>T</italic></sup> ≤ 1 (<xref ref-type="supplementary-material" rid="pgen.1009241.s001">S1 Text</xref>). The limit in <xref ref-type="disp-formula" rid="pgen.1009241.e180">Eq (26)</xref> in terms of <italic>s</italic><sup><italic>T</italic></sup> is
<disp-formula id="pgen.1009241.e201"><alternatives><graphic id="pgen.1009241.e201g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e201" xlink:type="simple"/><mml:math display="block" id="M201"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="right"><mml:mrow><mml:msubsup><mml:mover accent="true"><mml:mi>F</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mtext>ST</mml:mtext></mml:mrow><mml:mtext>std</mml:mtext></mml:msubsup><mml:munderover><mml:mo>→</mml:mo><mml:mrow><mml:mi>m</mml:mi><mml:mo>→</mml:mo><mml:mi>∞</mml:mi></mml:mrow><mml:mtext>a.s.</mml:mtext></mml:munderover><mml:msub><mml:mi>F</mml:mi><mml:mtext>ST</mml:mtext></mml:msub><mml:mfrac><mml:mrow><mml:mn>1</mml:mn><mml:mo>-</mml:mo><mml:msup><mml:mi>s</mml:mi><mml:mi>T</mml:mi></mml:msup></mml:mrow><mml:mrow><mml:mn>1</mml:mn><mml:mo>-</mml:mo><mml:msup><mml:mi>s</mml:mi><mml:mi>T</mml:mi></mml:msup><mml:msub><mml:mi>F</mml:mi><mml:mtext>ST</mml:mtext></mml:msub></mml:mrow></mml:mfrac><mml:mo>.</mml:mo></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives> <label>(29)</label></disp-formula>
Treating the limit as equality and solving for <italic>F</italic><sub>ST</sub> yields the following consistent estimator: 
<disp-formula id="pgen.1009241.e202"><alternatives><graphic id="pgen.1009241.e202g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e202" xlink:type="simple"/><mml:math display="block" id="M202"><mml:msubsup><mml:mover accent="true"><mml:mi>σ</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>i</mml:mi><mml:mn>2</mml:mn></mml:msubsup><mml:mrow><mml:mo>=</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:mrow><mml:mn>1</mml:mn><mml:mo>-</mml:mo><mml:msup><mml:mi>s</mml:mi><mml:mi>T</mml:mi></mml:msup></mml:mrow></mml:mfrac><mml:mstyle displaystyle="true"><mml:munderover><mml:mo>∑</mml:mo><mml:mrow><mml:mi>j</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>n</mml:mi></mml:munderover></mml:mstyle><mml:msub><mml:mi>w</mml:mi><mml:mi>j</mml:mi></mml:msub><mml:msup><mml:mrow><mml:mo>(</mml:mo><mml:msub><mml:mi>π</mml:mi><mml:mrow><mml:mi>i</mml:mi><mml:mi>j</mml:mi></mml:mrow></mml:msub><mml:mo>-</mml:mo><mml:msubsup><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup><mml:mo>)</mml:mo></mml:mrow><mml:mn>2</mml:mn></mml:msup><mml:mo>,</mml:mo></mml:mrow></mml:math></alternatives> <label>(30)</label></disp-formula>
<disp-formula id="pgen.1009241.e203"><alternatives><graphic id="pgen.1009241.e203g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e203" xlink:type="simple"/><mml:math display="block" id="M203"><mml:msubsup><mml:mover accent="true"><mml:mi>F</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mtext>ST</mml:mtext></mml:mrow><mml:mrow><mml:mo>′</mml:mo><mml:mo>′</mml:mo></mml:mrow></mml:msubsup><mml:mrow><mml:mo>=</mml:mo><mml:mfrac><mml:msubsup><mml:mover accent="true"><mml:mi>F</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mtext>ST</mml:mtext></mml:mrow><mml:mtext>std</mml:mtext></mml:msubsup><mml:mrow><mml:mn>1</mml:mn><mml:mo>-</mml:mo><mml:msup><mml:mi>s</mml:mi><mml:mi>T</mml:mi></mml:msup><mml:mrow><mml:mo>(</mml:mo><mml:mn>1</mml:mn><mml:mo>-</mml:mo><mml:msubsup><mml:mover accent="true"><mml:mi>F</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mtext>ST</mml:mtext></mml:mrow><mml:mtext>std</mml:mtext></mml:msubsup><mml:mo>)</mml:mo></mml:mrow></mml:mrow></mml:mfrac><mml:mo>=</mml:mo><mml:mfrac><mml:mrow><mml:mstyle displaystyle="true"><mml:munderover><mml:mo>∑</mml:mo><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>m</mml:mi></mml:munderover></mml:mstyle><mml:msubsup><mml:mover accent="true"><mml:mi>σ</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>i</mml:mi><mml:mn>2</mml:mn></mml:msubsup></mml:mrow><mml:mrow><mml:mstyle displaystyle="true"><mml:munderover><mml:mo>∑</mml:mo><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>m</mml:mi></mml:munderover></mml:mstyle><mml:msubsup><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup><mml:mo>(</mml:mo><mml:mn>1</mml:mn><mml:mo>-</mml:mo><mml:msubsup><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup><mml:mo>)</mml:mo><mml:mo>+</mml:mo><mml:msup><mml:mi>s</mml:mi><mml:mi>T</mml:mi></mml:msup><mml:msubsup><mml:mover accent="true"><mml:mi>σ</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>i</mml:mi><mml:mn>2</mml:mn></mml:msubsup></mml:mrow></mml:mfrac><mml:munderover><mml:mo>→</mml:mo><mml:mrow><mml:mi>m</mml:mi><mml:mo>→</mml:mo><mml:mi>∞</mml:mi></mml:mrow><mml:mtext>a.s.</mml:mtext></mml:munderover><mml:msub><mml:mi>F</mml:mi><mml:mtext>ST</mml:mtext></mml:msub><mml:mo>.</mml:mo></mml:mrow></mml:math></alternatives> <label>(31)</label></disp-formula>
Note that <inline-formula id="pgen.1009241.e204"><alternatives><graphic id="pgen.1009241.e204g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e204" xlink:type="simple"/><mml:math display="inline" id="M204"><mml:msubsup><mml:mover accent="true"><mml:mi>σ</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>i</mml:mi><mml:mn>2</mml:mn></mml:msubsup></mml:math></alternatives></inline-formula> and <inline-formula id="pgen.1009241.e205"><alternatives><graphic id="pgen.1009241.e205g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e205" xlink:type="simple"/><mml:math display="inline" id="M205"><mml:msubsup><mml:mover accent="true"><mml:mi>F</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mtext>ST</mml:mtext></mml:mrow><mml:mtext>indep</mml:mtext></mml:msubsup></mml:math></alternatives></inline-formula> from Eqs <xref ref-type="disp-formula" rid="pgen.1009241.e079">(12)</xref> and <xref ref-type="disp-formula" rid="pgen.1009241.e080">(13)</xref> are the special case of Eqs <xref ref-type="disp-formula" rid="pgen.1009241.e202">(30)</xref> and <xref ref-type="disp-formula" rid="pgen.1009241.e203">(31)</xref> for uniform weights and <inline-formula id="pgen.1009241.e206"><alternatives><graphic id="pgen.1009241.e206g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e206" xlink:type="simple"/><mml:math display="inline" id="M206"><mml:mrow><mml:msup><mml:mi>s</mml:mi><mml:mi>T</mml:mi></mml:msup><mml:mo>=</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:mi>n</mml:mi></mml:mfrac></mml:mrow></mml:math></alternatives></inline-formula>; hence, <inline-formula id="pgen.1009241.e207"><alternatives><graphic id="pgen.1009241.e207g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e207" xlink:type="simple"/><mml:math display="inline" id="M207"><mml:msubsup><mml:mover accent="true"><mml:mi>F</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mtext>ST</mml:mtext></mml:mrow><mml:mrow><mml:mo>′</mml:mo><mml:mo>′</mml:mo></mml:mrow></mml:msubsup></mml:math></alternatives></inline-formula> generalizes <inline-formula id="pgen.1009241.e208"><alternatives><graphic id="pgen.1009241.e208g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e208" xlink:type="simple"/><mml:math display="inline" id="M208"><mml:msubsup><mml:mover accent="true"><mml:mi>F</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mtext>ST</mml:mtext></mml:mrow><mml:mtext>indep</mml:mtext></mml:msubsup></mml:math></alternatives></inline-formula>.</p>
<p>Lastly, using either Eqs <xref ref-type="disp-formula" rid="pgen.1009241.e180">(26)</xref> or <xref ref-type="disp-formula" rid="pgen.1009241.e201">(29)</xref>, the relative error of <inline-formula id="pgen.1009241.e209"><alternatives><graphic id="pgen.1009241.e209g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e209" xlink:type="simple"/><mml:math display="inline" id="M209"><mml:msubsup><mml:mover accent="true"><mml:mi>F</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mtext>ST</mml:mtext></mml:mrow><mml:mtext>std</mml:mtext></mml:msubsup></mml:math></alternatives></inline-formula> converges to
<disp-formula id="pgen.1009241.e210"><alternatives><graphic id="pgen.1009241.e210g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e210" xlink:type="simple"/><mml:math display="block" id="M210"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="right"><mml:mrow><mml:mn>1</mml:mn><mml:mo>-</mml:mo><mml:mfrac><mml:msubsup><mml:mover accent="true"><mml:mi>F</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mtext>ST</mml:mtext></mml:mrow><mml:mtext>std</mml:mtext></mml:msubsup><mml:msub><mml:mi>F</mml:mi><mml:mtext>ST</mml:mtext></mml:msub></mml:mfrac><mml:munderover><mml:mo>→</mml:mo><mml:mrow><mml:mi>m</mml:mi><mml:mo>→</mml:mo><mml:mi>∞</mml:mi></mml:mrow><mml:mtext>a.s.</mml:mtext></mml:munderover><mml:mfrac><mml:mrow><mml:msup><mml:mover accent="true"><mml:mi>θ</mml:mi><mml:mo>¯</mml:mo></mml:mover><mml:mi>T</mml:mi></mml:msup><mml:mo>(</mml:mo><mml:mn>1</mml:mn><mml:mo>-</mml:mo><mml:msub><mml:mi>F</mml:mi><mml:mtext>ST</mml:mtext></mml:msub><mml:mo>)</mml:mo></mml:mrow><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mtext>ST</mml:mtext></mml:msub><mml:mo>(</mml:mo><mml:mn>1</mml:mn><mml:mo>-</mml:mo><mml:msup><mml:mover accent="true"><mml:mi>θ</mml:mi><mml:mo>¯</mml:mo></mml:mover><mml:mi>T</mml:mi></mml:msup><mml:mo>)</mml:mo></mml:mrow></mml:mfrac><mml:mo>=</mml:mo><mml:msup><mml:mi>s</mml:mi><mml:mi>T</mml:mi></mml:msup><mml:mfrac><mml:mrow><mml:mn>1</mml:mn><mml:mo>-</mml:mo><mml:msub><mml:mi>F</mml:mi><mml:mtext>ST</mml:mtext></mml:msub></mml:mrow><mml:mrow><mml:mn>1</mml:mn><mml:mo>-</mml:mo><mml:msup><mml:mi>s</mml:mi><mml:mi>T</mml:mi></mml:msup><mml:msub><mml:mi>F</mml:mi><mml:mtext>ST</mml:mtext></mml:msub></mml:mrow></mml:mfrac><mml:mo>,</mml:mo></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives> <label>(32)</label></disp-formula>
which is approximated by <italic>s</italic><sup><italic>T</italic></sup> if <italic>F</italic><sub>ST</sub> ≪ 1, hence the name “bias coefficient”. Note <italic>s</italic><sup><italic>T</italic></sup> varies depending on the choice of <italic>T</italic>, which is necessary since <italic>F</italic><sub>ST</sub> (and hence the relative bias of <inline-formula id="pgen.1009241.e211"><alternatives><graphic id="pgen.1009241.e211g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e211" xlink:type="simple"/><mml:math display="inline" id="M211"><mml:msubsup><mml:mover accent="true"><mml:mi>F</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mtext>ST</mml:mtext></mml:mrow><mml:mtext>std</mml:mtext></mml:msubsup></mml:math></alternatives></inline-formula> from <italic>F</italic><sub>ST</sub>) depends on the choice of <italic>T</italic>.</p>
</sec>
</sec>
<sec id="sec018">
<title>A new approach for kinship and <italic>F</italic><sub>ST</sub> estimation</title>
<p>Here, we propose a new estimation approach for kinship coefficients that has properties favorable for obtaining nearly unbiased estimates (panel “New Kinship Estimator” in <xref ref-type="fig" rid="pgen.1009241.g001">Fig 1</xref>). These new kinship estimates yield an improved <italic>F</italic><sub>ST</sub> estimator. We present the general approach and implement a simple version of one key estimator that results in the complete proof-of-principle estimator that is evaluated in the next section and applied to human data in [<xref ref-type="bibr" rid="pgen.1009241.ref059">59</xref>]. We also compare our approach to a related estimator of non-IBD linearly-transformed kinship values [<xref ref-type="bibr" rid="pgen.1009241.ref020">20</xref>–<xref ref-type="bibr" rid="pgen.1009241.ref022">22</xref>] that was proposed concurrently to ours [<xref ref-type="bibr" rid="pgen.1009241.ref058">58</xref>].</p>
<sec id="sec019">
<title>General approach</title>
<p>In this subsection we develop our new estimator in two steps. First, we compute a new statistic <italic>A</italic><sub><italic>jk</italic></sub> that is proportional in the limit of infinite loci to <inline-formula id="pgen.1009241.e212"><alternatives><graphic id="pgen.1009241.e212g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e212" xlink:type="simple"/><mml:math display="inline" id="M212"><mml:mrow><mml:msubsup><mml:mi>φ</mml:mi><mml:mrow><mml:mi>j</mml:mi><mml:mi>k</mml:mi></mml:mrow><mml:mi>T</mml:mi></mml:msubsup><mml:mo>-</mml:mo><mml:mn>1</mml:mn></mml:mrow></mml:math></alternatives></inline-formula> times a nuisance factor <italic>v</italic><sup><italic>T</italic></sup>. Second, we estimate and remove <italic>v</italic><sup><italic>T</italic></sup> to yield the proposed estimator <inline-formula id="pgen.1009241.e213"><alternatives><graphic id="pgen.1009241.e213g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e213" xlink:type="simple"/><mml:math display="inline" id="M213"><mml:msubsup><mml:mover accent="true"><mml:mi>φ</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mi>j</mml:mi><mml:mi>k</mml:mi></mml:mrow><mml:mrow><mml:mi>T</mml:mi><mml:mo>,</mml:mo><mml:mtext>new</mml:mtext></mml:mrow></mml:msubsup></mml:math></alternatives></inline-formula>. <inline-formula id="pgen.1009241.e214"><alternatives><graphic id="pgen.1009241.e214g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e214" xlink:type="simple"/><mml:math display="inline" id="M214"><mml:msub><mml:mover accent="true"><mml:mi>A</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mtext>min</mml:mtext></mml:msub></mml:math></alternatives></inline-formula>—an estimator of the limit of the minimum <italic>A</italic><sub><italic>jk</italic></sub>—yields <italic>v</italic><sup><italic>T</italic></sup> if the least related pair of individuals in the data has <inline-formula id="pgen.1009241.e215"><alternatives><graphic id="pgen.1009241.e215g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e215" xlink:type="simple"/><mml:math display="inline" id="M215"><mml:mrow><mml:msubsup><mml:mi>φ</mml:mi><mml:mrow><mml:mi>j</mml:mi><mml:mi>k</mml:mi></mml:mrow><mml:mi>T</mml:mi></mml:msubsup><mml:mo>=</mml:mo><mml:mn>0</mml:mn></mml:mrow></mml:math></alternatives></inline-formula>, which sets <italic>T</italic> to the MRCA population of all the individuals in the data. The new kinship estimator immediately results in new inbreeding (<inline-formula id="pgen.1009241.e216"><alternatives><graphic id="pgen.1009241.e216g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e216" xlink:type="simple"/><mml:math display="inline" id="M216"><mml:msubsup><mml:mover accent="true"><mml:mi>f</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mi>j</mml:mi></mml:mrow><mml:mrow><mml:mi>T</mml:mi><mml:mo>,</mml:mo><mml:mtext>new</mml:mtext></mml:mrow></mml:msubsup></mml:math></alternatives></inline-formula>) and <italic>F</italic><sub>ST</sub> (<inline-formula id="pgen.1009241.e217"><alternatives><graphic id="pgen.1009241.e217g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e217" xlink:type="simple"/><mml:math display="inline" id="M217"><mml:msubsup><mml:mover accent="true"><mml:mi>F</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mtext>ST</mml:mtext></mml:mrow><mml:mtext>new</mml:mtext></mml:msubsup></mml:math></alternatives></inline-formula>) estimators. This general approach leaves the implementation of <inline-formula id="pgen.1009241.e218"><alternatives><graphic id="pgen.1009241.e218g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e218" xlink:type="simple"/><mml:math display="inline" id="M218"><mml:msub><mml:mover accent="true"><mml:mi>A</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mtext>min</mml:mtext></mml:msub></mml:math></alternatives></inline-formula> open; the simple implementation applied in this work is described in subsection <bold>Proof-of-principle kinship estimator using subpopulation labels</bold>, but our method can be readily improved by substituting in a better <inline-formula id="pgen.1009241.e219"><alternatives><graphic id="pgen.1009241.e219g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e219" xlink:type="simple"/><mml:math display="inline" id="M219"><mml:msub><mml:mover accent="true"><mml:mi>A</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mtext>min</mml:mtext></mml:msub></mml:math></alternatives></inline-formula> in the future.</p>
<p>Applying the method of moments to <xref ref-type="disp-formula" rid="pgen.1009241.e045">Eq (5)</xref>, we derive the following statistic (<xref ref-type="supplementary-material" rid="pgen.1009241.s001">S1 Text</xref>), whose expectation is proportional to <inline-formula id="pgen.1009241.e220"><alternatives><graphic id="pgen.1009241.e220g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e220" xlink:type="simple"/><mml:math display="inline" id="M220"><mml:mrow><mml:msubsup><mml:mi>φ</mml:mi><mml:mrow><mml:mi>j</mml:mi><mml:mi>k</mml:mi></mml:mrow><mml:mi>T</mml:mi></mml:msubsup><mml:mo>-</mml:mo><mml:mn>1</mml:mn></mml:mrow></mml:math></alternatives></inline-formula>: 
<disp-formula id="pgen.1009241.e221"><alternatives><graphic id="pgen.1009241.e221g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e221" xlink:type="simple"/><mml:math display="block" id="M221"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="right"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="right"><mml:msub><mml:mi>A</mml:mi><mml:mrow><mml:mi>j</mml:mi><mml:mi>k</mml:mi></mml:mrow></mml:msub></mml:mtd><mml:mtd columnalign="left"><mml:mrow><mml:mo>=</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:mi>m</mml:mi></mml:mfrac><mml:mstyle displaystyle="true"><mml:munderover><mml:mo>∑</mml:mo><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>m</mml:mi></mml:munderover></mml:mstyle><mml:mrow><mml:mo>(</mml:mo><mml:msub><mml:mi>x</mml:mi><mml:mrow><mml:mi>i</mml:mi><mml:mi>j</mml:mi></mml:mrow></mml:msub><mml:mo>-</mml:mo><mml:mn>1</mml:mn><mml:mo>)</mml:mo></mml:mrow><mml:mrow><mml:mo>(</mml:mo><mml:msub><mml:mi>x</mml:mi><mml:mrow><mml:mi>i</mml:mi><mml:mi>k</mml:mi></mml:mrow></mml:msub><mml:mo>-</mml:mo><mml:mn>1</mml:mn><mml:mo>)</mml:mo></mml:mrow><mml:mo>-</mml:mo><mml:mn>1</mml:mn><mml:mo>,</mml:mo></mml:mrow></mml:mtd></mml:mtr><mml:mtr><mml:mtd columnalign="right"><mml:mrow><mml:mo form="prefix">E</mml:mo><mml:mo>[</mml:mo><mml:msub><mml:mi>A</mml:mi><mml:mrow><mml:mi>j</mml:mi><mml:mi>k</mml:mi></mml:mrow></mml:msub><mml:mrow><mml:mo>|</mml:mo><mml:mi>T</mml:mi></mml:mrow><mml:mo>]</mml:mo></mml:mrow></mml:mtd><mml:mtd columnalign="left"><mml:mrow><mml:mo>=</mml:mo><mml:mo>(</mml:mo><mml:msubsup><mml:mi>φ</mml:mi><mml:mrow><mml:mi>j</mml:mi><mml:mi>k</mml:mi></mml:mrow><mml:mi>T</mml:mi></mml:msubsup><mml:mo>-</mml:mo><mml:mn>1</mml:mn><mml:mo>)</mml:mo><mml:msubsup><mml:mi>v</mml:mi><mml:mi>m</mml:mi><mml:mi>T</mml:mi></mml:msubsup><mml:mo>,</mml:mo><mml:mspace width="1em"/><mml:mtext>where</mml:mtext></mml:mrow></mml:mtd></mml:mtr><mml:mtr><mml:mtd columnalign="right"><mml:msubsup><mml:mi>v</mml:mi><mml:mi>m</mml:mi><mml:mi>T</mml:mi></mml:msubsup></mml:mtd><mml:mtd columnalign="left"><mml:mrow><mml:mo>=</mml:mo><mml:mfrac><mml:mn>4</mml:mn><mml:mi>m</mml:mi></mml:mfrac><mml:mstyle displaystyle="true"><mml:munderover><mml:mo>∑</mml:mo><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>m</mml:mi></mml:munderover></mml:mstyle><mml:msubsup><mml:mi>p</mml:mi><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup><mml:mo>(</mml:mo><mml:mn>1</mml:mn><mml:mo>-</mml:mo><mml:msubsup><mml:mi>p</mml:mi><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup><mml:mo>)</mml:mo><mml:mo>.</mml:mo></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives> <label>(33)</label></disp-formula>
Compared to the standard kinship estimator in <xref ref-type="disp-formula" rid="pgen.1009241.e141">Eq (19)</xref>, which has a complex asymptotic bias determined by <italic>n</italic> parameters (<inline-formula id="pgen.1009241.e222"><alternatives><graphic id="pgen.1009241.e222g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e222" xlink:type="simple"/><mml:math display="inline" id="M222"><mml:msubsup><mml:mover accent="true"><mml:mi>φ</mml:mi><mml:mo>¯</mml:mo></mml:mover><mml:mi>j</mml:mi><mml:mi>T</mml:mi></mml:msubsup></mml:math></alternatives></inline-formula> for each <italic>j</italic> ∈ {1, …, <italic>n</italic>}), the <italic>A</italic><sub><italic>jk</italic></sub> statistics estimate kinship with a bias controlled by the sole unknown parameter <inline-formula id="pgen.1009241.e223"><alternatives><graphic id="pgen.1009241.e223g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e223" xlink:type="simple"/><mml:math display="inline" id="M223"><mml:msubsup><mml:mi>v</mml:mi><mml:mi>m</mml:mi><mml:mi>T</mml:mi></mml:msubsup></mml:math></alternatives></inline-formula> shared by all pairs of individuals. The key to estimating <inline-formula id="pgen.1009241.e224"><alternatives><graphic id="pgen.1009241.e224g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e224" xlink:type="simple"/><mml:math display="inline" id="M224"><mml:msubsup><mml:mi>v</mml:mi><mml:mi>m</mml:mi><mml:mi>T</mml:mi></mml:msubsup></mml:math></alternatives></inline-formula> is to notice that if <inline-formula id="pgen.1009241.e225"><alternatives><graphic id="pgen.1009241.e225g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e225" xlink:type="simple"/><mml:math display="inline" id="M225"><mml:mrow><mml:msubsup><mml:mi>φ</mml:mi><mml:mrow><mml:mi>j</mml:mi><mml:mi>k</mml:mi></mml:mrow><mml:mi>T</mml:mi></mml:msubsup><mml:mo>=</mml:mo><mml:mn>0</mml:mn></mml:mrow></mml:math></alternatives></inline-formula> then <inline-formula id="pgen.1009241.e226"><alternatives><graphic id="pgen.1009241.e226g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e226" xlink:type="simple"/><mml:math display="inline" id="M226"><mml:mrow><mml:mo form="prefix">E</mml:mo><mml:mrow><mml:mo>[</mml:mo><mml:msub><mml:mi>A</mml:mi><mml:mrow><mml:mi>j</mml:mi><mml:mi>k</mml:mi></mml:mrow></mml:msub><mml:mo>|</mml:mo><mml:mi>T</mml:mi><mml:mo>]</mml:mo></mml:mrow><mml:mo>=</mml:mo><mml:mo>-</mml:mo><mml:msubsup><mml:mi>v</mml:mi><mml:mi>m</mml:mi><mml:mi>T</mml:mi></mml:msubsup></mml:mrow></mml:math></alternatives></inline-formula>. Thus, assuming <inline-formula id="pgen.1009241.e227"><alternatives><graphic id="pgen.1009241.e227g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e227" xlink:type="simple"/><mml:math display="inline" id="M227"><mml:mrow><mml:msub><mml:mo form="prefix" movablelimits="true">min</mml:mo><mml:mrow><mml:mi>j</mml:mi><mml:mo>,</mml:mo><mml:mi>k</mml:mi></mml:mrow></mml:msub><mml:msubsup><mml:mi>φ</mml:mi><mml:mrow><mml:mi>j</mml:mi><mml:mi>k</mml:mi></mml:mrow><mml:mi>T</mml:mi></mml:msubsup><mml:mo>=</mml:mo><mml:mn>0</mml:mn></mml:mrow></mml:math></alternatives></inline-formula>, which sets <italic>T</italic> to the MRCA population, then the minimum <italic>A</italic><sub><italic>jk</italic></sub> yields the nuisance parameter. However, we recommend using a more stable estimate than the minimum <italic>A</italic><sub><italic>jk</italic></sub> to unbias all <italic>A</italic><sub><italic>jk</italic></sub>, such as the estimator presented in the next subsection.</p>
<p>In general, suppose <inline-formula id="pgen.1009241.e228"><alternatives><graphic id="pgen.1009241.e228g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e228" xlink:type="simple"/><mml:math display="inline" id="M228"><mml:msub><mml:mover accent="true"><mml:mi>A</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mtext>min</mml:mtext></mml:msub></mml:math></alternatives></inline-formula> is a consistent estimator of the limit of the minimum <italic>E</italic>[<italic>A</italic><sub><italic>jk</italic></sub>|<italic>T</italic>], or equivalently,
<disp-formula id="pgen.1009241.e229"><alternatives><graphic id="pgen.1009241.e229g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e229" xlink:type="simple"/><mml:math display="block" id="M229"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="right"><mml:mrow><mml:msub><mml:mover accent="true"><mml:mi>A</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mtext>min</mml:mtext></mml:msub><mml:munderover><mml:mo>→</mml:mo><mml:mrow><mml:mi>m</mml:mi><mml:mo>→</mml:mo><mml:mi>∞</mml:mi></mml:mrow><mml:mtext>a.s.</mml:mtext></mml:munderover><mml:mo>-</mml:mo><mml:msup><mml:mi>v</mml:mi><mml:mi>T</mml:mi></mml:msup><mml:mo>,</mml:mo></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives></disp-formula>
along with the assumption that <inline-formula id="pgen.1009241.e230"><alternatives><graphic id="pgen.1009241.e230g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e230" xlink:type="simple"/><mml:math display="inline" id="M230"><mml:mrow><mml:msubsup><mml:mi>v</mml:mi><mml:mi>m</mml:mi><mml:mi>T</mml:mi></mml:msubsup><mml:munder><mml:mo>→</mml:mo><mml:mrow><mml:mi>m</mml:mi><mml:mo>→</mml:mo><mml:mi>∞</mml:mi></mml:mrow></mml:munder><mml:msup><mml:mi>v</mml:mi><mml:mi>T</mml:mi></mml:msup></mml:mrow></mml:math></alternatives></inline-formula> for some <italic>v</italic><sup><italic>T</italic></sup> ≠ 0. Our new kinship estimator follows directly from replacing <inline-formula id="pgen.1009241.e231"><alternatives><graphic id="pgen.1009241.e231g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e231" xlink:type="simple"/><mml:math display="inline" id="M231"><mml:msubsup><mml:mi>v</mml:mi><mml:mi>m</mml:mi><mml:mi>T</mml:mi></mml:msubsup></mml:math></alternatives></inline-formula> with <inline-formula id="pgen.1009241.e232"><alternatives><graphic id="pgen.1009241.e232g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e232" xlink:type="simple"/><mml:math display="inline" id="M232"><mml:mrow><mml:mo>-</mml:mo><mml:msub><mml:mover accent="true"><mml:mi>A</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mtext>min</mml:mtext></mml:msub></mml:mrow></mml:math></alternatives></inline-formula> and solving for <inline-formula id="pgen.1009241.e233"><alternatives><graphic id="pgen.1009241.e233g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e233" xlink:type="simple"/><mml:math display="inline" id="M233"><mml:msubsup><mml:mi>φ</mml:mi><mml:mrow><mml:mi>j</mml:mi><mml:mi>k</mml:mi></mml:mrow><mml:mi>T</mml:mi></mml:msubsup></mml:math></alternatives></inline-formula> in <xref ref-type="disp-formula" rid="pgen.1009241.e221">Eq (33)</xref>, which results in a consistent kinship estimator (given the convergence proof of section <bold>Assessing the accuracy of genome-wide ratio estimators</bold>):
<disp-formula id="pgen.1009241.e234"><alternatives><graphic id="pgen.1009241.e234g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e234" xlink:type="simple"/><mml:math display="block" id="M234"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="right"><mml:mrow><mml:msubsup><mml:mover accent="true"><mml:mi>φ</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mi>j</mml:mi><mml:mi>k</mml:mi></mml:mrow><mml:mrow><mml:mi>T</mml:mi><mml:mo>,</mml:mo><mml:mtext>new</mml:mtext></mml:mrow></mml:msubsup><mml:mo>=</mml:mo><mml:mn>1</mml:mn><mml:mo>-</mml:mo><mml:mfrac><mml:msub><mml:mi>A</mml:mi><mml:mrow><mml:mi>j</mml:mi><mml:mi>k</mml:mi></mml:mrow></mml:msub><mml:msub><mml:mover accent="true"><mml:mi>A</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mtext>min</mml:mtext></mml:msub></mml:mfrac><mml:munderover><mml:mo>→</mml:mo><mml:mrow><mml:mi>m</mml:mi><mml:mo>→</mml:mo><mml:mi>∞</mml:mi></mml:mrow><mml:mtext>a.s.</mml:mtext></mml:munderover><mml:msubsup><mml:mi>φ</mml:mi><mml:mrow><mml:mi>j</mml:mi><mml:mi>k</mml:mi></mml:mrow><mml:mi>T</mml:mi></mml:msubsup><mml:mo>.</mml:mo></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives> <label>(34)</label></disp-formula>
The resulting new inbreeding coefficient estimator is
<disp-formula id="pgen.1009241.e235"><alternatives><graphic id="pgen.1009241.e235g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e235" xlink:type="simple"/><mml:math display="block" id="M235"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="right"><mml:mrow><mml:msubsup><mml:mover accent="true"><mml:mi>f</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mi>j</mml:mi></mml:mrow><mml:mrow><mml:mi>T</mml:mi><mml:mo>,</mml:mo><mml:mtext>new</mml:mtext></mml:mrow></mml:msubsup><mml:mo>=</mml:mo><mml:mn>2</mml:mn><mml:msubsup><mml:mover accent="true"><mml:mi>φ</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mi>j</mml:mi><mml:mi>j</mml:mi></mml:mrow><mml:mrow><mml:mi>T</mml:mi><mml:mo>,</mml:mo><mml:mtext>new</mml:mtext></mml:mrow></mml:msubsup><mml:mo>-</mml:mo><mml:mn>1</mml:mn><mml:munderover><mml:mo>→</mml:mo><mml:mrow><mml:mi>m</mml:mi><mml:mo>→</mml:mo><mml:mi>∞</mml:mi></mml:mrow><mml:mtext>a.s.</mml:mtext></mml:munderover><mml:msubsup><mml:mi>f</mml:mi><mml:mrow><mml:mi>j</mml:mi></mml:mrow><mml:mi>T</mml:mi></mml:msubsup><mml:mo>,</mml:mo></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives> <label>(35)</label></disp-formula>
and the new <italic>F</italic><sub>ST</sub> estimator is consistent for locally-outbred individuals (estimates <xref ref-type="disp-formula" rid="pgen.1009241.e042">Eq (4)</xref>):
<disp-formula id="pgen.1009241.e236"><alternatives><graphic id="pgen.1009241.e236g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e236" xlink:type="simple"/><mml:math display="block" id="M236"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="right"><mml:mrow><mml:msubsup><mml:mover accent="true"><mml:mi>F</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mtext>ST</mml:mtext></mml:mrow><mml:mtext>new</mml:mtext></mml:msubsup><mml:mo>=</mml:mo><mml:mstyle displaystyle="true"><mml:munderover><mml:mo>∑</mml:mo><mml:mrow><mml:mi>j</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>n</mml:mi></mml:munderover></mml:mstyle><mml:msub><mml:mi>w</mml:mi><mml:mi>j</mml:mi></mml:msub><mml:msubsup><mml:mover accent="true"><mml:mi>f</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mi>j</mml:mi></mml:mrow><mml:mrow><mml:mi>T</mml:mi><mml:mo>,</mml:mo><mml:mtext>new</mml:mtext></mml:mrow></mml:msubsup><mml:munderover><mml:mo>→</mml:mo><mml:mrow><mml:mi>m</mml:mi><mml:mo>→</mml:mo><mml:mi>∞</mml:mi></mml:mrow><mml:mtext>a.s.</mml:mtext></mml:munderover><mml:msub><mml:mi>F</mml:mi><mml:mtext>ST</mml:mtext></mml:msub><mml:mo>.</mml:mo></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives> <label>(36)</label></disp-formula>
Thus, only the implementation of <inline-formula id="pgen.1009241.e237"><alternatives><graphic id="pgen.1009241.e237g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e237" xlink:type="simple"/><mml:math display="inline" id="M237"><mml:msub><mml:mover accent="true"><mml:mi>A</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mtext>min</mml:mtext></mml:msub></mml:math></alternatives></inline-formula> is left unspecified from this general estimation approach of kinship and <italic>F</italic><sub>ST</sub>. The implementation of <inline-formula id="pgen.1009241.e238"><alternatives><graphic id="pgen.1009241.e238g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e238" xlink:type="simple"/><mml:math display="inline" id="M238"><mml:msub><mml:mover accent="true"><mml:mi>A</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mtext>min</mml:mtext></mml:msub></mml:math></alternatives></inline-formula> used in the analyses in this work is given in the next subsection.</p>
</sec>
<sec id="sec020">
<title>Proof-of-principle kinship estimator using subpopulation labels</title>
<p>To showcase the potential of the new estimators, we implement a simple proof-of-principle version of <inline-formula id="pgen.1009241.e239"><alternatives><graphic id="pgen.1009241.e239g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e239" xlink:type="simple"/><mml:math display="inline" id="M239"><mml:msub><mml:mover accent="true"><mml:mi>A</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mtext>min</mml:mtext></mml:msub></mml:math></alternatives></inline-formula> needed for our new kinship estimator (<inline-formula id="pgen.1009241.e240"><alternatives><graphic id="pgen.1009241.e240g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e240" xlink:type="simple"/><mml:math display="inline" id="M240"><mml:msubsup><mml:mover accent="true"><mml:mi>φ</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mi>j</mml:mi><mml:mi>k</mml:mi></mml:mrow><mml:mrow><mml:mi>T</mml:mi><mml:mo>,</mml:mo><mml:mtext>new</mml:mtext></mml:mrow></mml:msubsup></mml:math></alternatives></inline-formula> in <xref ref-type="disp-formula" rid="pgen.1009241.e234">Eq (34)</xref>). This <inline-formula id="pgen.1009241.e241"><alternatives><graphic id="pgen.1009241.e241g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e241" xlink:type="simple"/><mml:math display="inline" id="M241"><mml:msub><mml:mover accent="true"><mml:mi>A</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mtext>min</mml:mtext></mml:msub></mml:math></alternatives></inline-formula> relies on an appropriate partition of the <italic>n</italic> individuals into <italic>K</italic> subpopulations (denoted <italic>S</italic><sub><italic>u</italic></sub> for <italic>u</italic> ∈ {1, …, <italic>K</italic>}), where the only requirement is that the kinship coefficients between pairs of individuals across the two most unrelated subpopulations is zero, as detailed below. Note that, unlike the the independent subpopulations model of section <bold><italic>F</italic><sub>ST</sub> estimation based on the independent subpopulations model</bold>, these <italic>K</italic> subpopulations need not be independent nor unstructured. The desired estimator <inline-formula id="pgen.1009241.e242"><alternatives><graphic id="pgen.1009241.e242g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e242" xlink:type="simple"/><mml:math display="inline" id="M242"><mml:msub><mml:mover accent="true"><mml:mi>A</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mtext>min</mml:mtext></mml:msub></mml:math></alternatives></inline-formula> is the minimum average <italic>A</italic><sub><italic>jk</italic></sub> over all subpopulation pairs:
<disp-formula id="pgen.1009241.e243"><alternatives><graphic id="pgen.1009241.e243g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e243" xlink:type="simple"/><mml:math display="block" id="M243"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="right"><mml:mrow><mml:msub><mml:mover accent="true"><mml:mi>A</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mtext>min</mml:mtext></mml:msub><mml:mo>=</mml:mo><mml:munder><mml:mo form="prefix" movablelimits="true">min</mml:mo><mml:mrow><mml:mi>u</mml:mi><mml:mo>≠</mml:mo><mml:mi>v</mml:mi></mml:mrow></mml:munder><mml:mfrac><mml:mn>1</mml:mn><mml:mrow><mml:mrow><mml:mo>|</mml:mo></mml:mrow><mml:msub><mml:mi>S</mml:mi><mml:mi>u</mml:mi></mml:msub><mml:mrow><mml:mo>|</mml:mo><mml:mo>|</mml:mo></mml:mrow><mml:msub><mml:mi>S</mml:mi><mml:mi>v</mml:mi></mml:msub><mml:mrow><mml:mo>|</mml:mo></mml:mrow></mml:mrow></mml:mfrac><mml:munder><mml:mo>∑</mml:mo><mml:mrow><mml:mi>j</mml:mi><mml:mo>∈</mml:mo><mml:msub><mml:mi>S</mml:mi><mml:mi>u</mml:mi></mml:msub></mml:mrow></mml:munder><mml:munder><mml:mo>∑</mml:mo><mml:mrow><mml:mi>k</mml:mi><mml:mo>∈</mml:mo><mml:msub><mml:mi>S</mml:mi><mml:mi>v</mml:mi></mml:msub></mml:mrow></mml:munder><mml:msub><mml:mi>A</mml:mi><mml:mrow><mml:mi>j</mml:mi><mml:mi>k</mml:mi></mml:mrow></mml:msub><mml:mo>.</mml:mo></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives> <label>(37)</label></disp-formula>
This <inline-formula id="pgen.1009241.e244"><alternatives><graphic id="pgen.1009241.e244g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e244" xlink:type="simple"/><mml:math display="inline" id="M244"><mml:msub><mml:mover accent="true"><mml:mi>A</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mtext>min</mml:mtext></mml:msub></mml:math></alternatives></inline-formula> consistently estimates the limit of the minimum <italic>A</italic><sub><italic>jk</italic></sub> if <inline-formula id="pgen.1009241.e245"><alternatives><graphic id="pgen.1009241.e245g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e245" xlink:type="simple"/><mml:math display="inline" id="M245"><mml:mrow><mml:msubsup><mml:mi>φ</mml:mi><mml:mrow><mml:mi>j</mml:mi><mml:mi>k</mml:mi></mml:mrow><mml:mi>T</mml:mi></mml:msubsup><mml:mo>=</mml:mo><mml:mn>0</mml:mn><mml:mspace width="3.33333pt"/><mml:mo>∀</mml:mo><mml:mi>j</mml:mi><mml:mo>∈</mml:mo><mml:msub><mml:mi>S</mml:mi><mml:mi>u</mml:mi></mml:msub><mml:mo>,</mml:mo><mml:mo>∀</mml:mo><mml:mi>k</mml:mi><mml:mo>∈</mml:mo><mml:msub><mml:mi>S</mml:mi><mml:mi>v</mml:mi></mml:msub></mml:mrow></mml:math></alternatives></inline-formula> for the least related pair of subpopulations <italic>S</italic><sub><italic>u</italic></sub>, <italic>S</italic><sub><italic>v</italic></sub>.</p>
<p>This estimator should work well for individuals truly divided into subpopulations, but may be biased for a poor choice of subpopulations, in particular if the minimum mean <inline-formula id="pgen.1009241.e246"><alternatives><graphic id="pgen.1009241.e246g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e246" xlink:type="simple"/><mml:math display="inline" id="M246"><mml:msubsup><mml:mi>φ</mml:mi><mml:mrow><mml:mi>j</mml:mi><mml:mi>k</mml:mi></mml:mrow><mml:mi>T</mml:mi></mml:msubsup></mml:math></alternatives></inline-formula> between subpopulations is far greater than zero. For this reason, inspection of the kinship estimates is required and careful construction of appropriate subpopulations may be needed. See our analysis of human data for detailed examples [<xref ref-type="bibr" rid="pgen.1009241.ref059">59</xref>]. Future work could focus on a more general <inline-formula id="pgen.1009241.e247"><alternatives><graphic id="pgen.1009241.e247g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e247" xlink:type="simple"/><mml:math display="inline" id="M247"><mml:msub><mml:mover accent="true"><mml:mi>A</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mtext>min</mml:mtext></mml:msub></mml:math></alternatives></inline-formula> that circumvents the need for subpopulations of our proof-of-principle estimator.</p>
</sec>
<sec id="sec021">
<title>Comparison to the Weir-Goudet kinship estimator for individuals</title>
<p>Here we analyze the Weir-Goudet (WG) kinship estimator for individuals [<xref ref-type="bibr" rid="pgen.1009241.ref020">20</xref>–<xref ref-type="bibr" rid="pgen.1009241.ref022">22</xref>]. This has connections to our new estimator but differs in having the goal of estimating linearly-transformed kinship values. In our framework, the WG estimator is given by
<disp-formula id="pgen.1009241.e248"><alternatives><graphic id="pgen.1009241.e248g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e248" xlink:type="simple"/><mml:math display="block" id="M248"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="right"><mml:mrow><mml:msubsup><mml:mover accent="true"><mml:mi>φ</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mi>j</mml:mi><mml:mi>k</mml:mi></mml:mrow><mml:mrow><mml:mi>T</mml:mi><mml:mo>,</mml:mo><mml:mtext>WG</mml:mtext></mml:mrow></mml:msubsup><mml:mo>=</mml:mo><mml:mn>1</mml:mn><mml:mo>-</mml:mo><mml:mfrac><mml:msub><mml:mi>A</mml:mi><mml:mrow><mml:mi>j</mml:mi><mml:mi>k</mml:mi></mml:mrow></mml:msub><mml:msub><mml:mover accent="true"><mml:mi>A</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mtext>avg</mml:mtext></mml:msub></mml:mfrac><mml:mo>,</mml:mo><mml:mspace width="1em"/><mml:mtext>where</mml:mtext><mml:mspace width="1em"/><mml:msub><mml:mover accent="true"><mml:mi>A</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mtext>avg</mml:mtext></mml:msub><mml:mo>=</mml:mo><mml:mfrac><mml:mn>2</mml:mn><mml:mrow><mml:mi>n</mml:mi><mml:mo>(</mml:mo><mml:mi>n</mml:mi><mml:mo>-</mml:mo><mml:mn>1</mml:mn><mml:mo>)</mml:mo></mml:mrow></mml:mfrac><mml:mstyle displaystyle="true"><mml:munderover><mml:mo>∑</mml:mo><mml:mrow><mml:mi>j</mml:mi><mml:mo>=</mml:mo><mml:mn>2</mml:mn></mml:mrow><mml:mi>n</mml:mi></mml:munderover></mml:mstyle><mml:mstyle displaystyle="true"><mml:munderover><mml:mo>∑</mml:mo><mml:mrow><mml:mi>k</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mrow><mml:mi>j</mml:mi><mml:mo>-</mml:mo><mml:mn>1</mml:mn></mml:mrow></mml:munderover></mml:mstyle><mml:msub><mml:mi>A</mml:mi><mml:mrow><mml:mi>j</mml:mi><mml:mi>k</mml:mi></mml:mrow></mml:msub><mml:mo>.</mml:mo></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives></disp-formula>
Therefore, this estimator differs from our proposal [<xref ref-type="bibr" rid="pgen.1009241.ref058">58</xref>] by replacing our <inline-formula id="pgen.1009241.e249"><alternatives><graphic id="pgen.1009241.e249g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e249" xlink:type="simple"/><mml:math display="inline" id="M249"><mml:msub><mml:mover accent="true"><mml:mi>A</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mtext>min</mml:mtext></mml:msub></mml:math></alternatives></inline-formula> with <inline-formula id="pgen.1009241.e250"><alternatives><graphic id="pgen.1009241.e250g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e250" xlink:type="simple"/><mml:math display="inline" id="M250"><mml:msub><mml:mover accent="true"><mml:mi>A</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mtext>avg</mml:mtext></mml:msub></mml:math></alternatives></inline-formula>. Under the kinship model, the expectation of <inline-formula id="pgen.1009241.e251"><alternatives><graphic id="pgen.1009241.e251g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e251" xlink:type="simple"/><mml:math display="inline" id="M251"><mml:msub><mml:mover accent="true"><mml:mi>A</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mtext>avg</mml:mtext></mml:msub></mml:math></alternatives></inline-formula> is
<disp-formula id="pgen.1009241.e252"><alternatives><graphic id="pgen.1009241.e252g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e252" xlink:type="simple"/><mml:math display="block" id="M252"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="right"><mml:mrow><mml:mo form="prefix">E</mml:mo><mml:mo>[</mml:mo><mml:msub><mml:mover accent="true"><mml:mi>A</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mtext>avg</mml:mtext></mml:msub><mml:mrow><mml:mo>|</mml:mo><mml:mi>T</mml:mi></mml:mrow><mml:mo>]</mml:mo><mml:mo>=</mml:mo><mml:mo>(</mml:mo><mml:msup><mml:mover accent="true"><mml:mi>φ</mml:mi><mml:mo>˜</mml:mo></mml:mover><mml:mi>T</mml:mi></mml:msup><mml:mo>-</mml:mo><mml:mn>1</mml:mn><mml:mo>)</mml:mo><mml:msubsup><mml:mi>v</mml:mi><mml:mi>m</mml:mi><mml:mi>T</mml:mi></mml:msubsup><mml:mo>,</mml:mo><mml:mspace width="1em"/><mml:mtext>where</mml:mtext><mml:mspace width="1em"/><mml:msup><mml:mover accent="true"><mml:mi>φ</mml:mi><mml:mo>˜</mml:mo></mml:mover><mml:mi>T</mml:mi></mml:msup><mml:mo>=</mml:mo><mml:mfrac><mml:mn>2</mml:mn><mml:mrow><mml:mi>n</mml:mi><mml:mo>(</mml:mo><mml:mi>n</mml:mi><mml:mo>-</mml:mo><mml:mn>1</mml:mn><mml:mo>)</mml:mo></mml:mrow></mml:mfrac><mml:mstyle displaystyle="true"><mml:munderover><mml:mo>∑</mml:mo><mml:mrow><mml:mi>j</mml:mi><mml:mo>=</mml:mo><mml:mn>2</mml:mn></mml:mrow><mml:mi>n</mml:mi></mml:munderover></mml:mstyle><mml:mstyle displaystyle="true"><mml:munderover><mml:mo>∑</mml:mo><mml:mrow><mml:mi>k</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mrow><mml:mi>j</mml:mi><mml:mo>-</mml:mo><mml:mn>1</mml:mn></mml:mrow></mml:munderover></mml:mstyle><mml:msubsup><mml:mi>φ</mml:mi><mml:mrow><mml:mi>j</mml:mi><mml:mi>k</mml:mi></mml:mrow><mml:mi>T</mml:mi></mml:msubsup><mml:mo>.</mml:mo></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives></disp-formula>
Therefore, the limit of this estimator is
<disp-formula id="pgen.1009241.e253"><alternatives><graphic id="pgen.1009241.e253g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e253" xlink:type="simple"/><mml:math display="block" id="M253"><mml:mrow><mml:msubsup><mml:mover accent="true"><mml:mi>φ</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mi>j</mml:mi><mml:mi>k</mml:mi></mml:mrow><mml:mrow><mml:mi>T</mml:mi><mml:mo>,</mml:mo><mml:mtext>WG</mml:mtext></mml:mrow></mml:msubsup><mml:munderover><mml:mo>→</mml:mo><mml:mrow><mml:mi>m</mml:mi><mml:mo>→</mml:mo><mml:mi>∞</mml:mi></mml:mrow><mml:mrow><mml:mtext>a.s.</mml:mtext></mml:mrow></mml:munderover><mml:mfrac><mml:mrow><mml:msubsup><mml:mi>φ</mml:mi><mml:mrow><mml:mi>j</mml:mi><mml:mi>k</mml:mi></mml:mrow><mml:mi>T</mml:mi></mml:msubsup><mml:mo>−</mml:mo><mml:msup><mml:mover accent="true"><mml:mi>φ</mml:mi><mml:mo>˜</mml:mo></mml:mover><mml:mi>T</mml:mi></mml:msup></mml:mrow><mml:mrow><mml:mn>1</mml:mn><mml:mo>−</mml:mo><mml:msup><mml:mover accent="true"><mml:mi>φ</mml:mi><mml:mo>˜</mml:mo></mml:mover><mml:mi>T</mml:mi></mml:msup></mml:mrow></mml:mfrac><mml:mo>,</mml:mo></mml:mrow></mml:math></alternatives> <label>(38)</label></disp-formula>
which agrees with calculations in the original WG work [<xref ref-type="bibr" rid="pgen.1009241.ref020">20</xref>–<xref ref-type="bibr" rid="pgen.1009241.ref022">22</xref>]. Note that, assuming that kinship coefficients must be non-negative, the above estimator recovers the kinship IBD probabilities if and only if <inline-formula id="pgen.1009241.e254"><alternatives><graphic id="pgen.1009241.e254g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e254" xlink:type="simple"/><mml:math display="inline" id="M254"><mml:mrow><mml:msup><mml:mover accent="true"><mml:mi>φ</mml:mi><mml:mo>˜</mml:mo></mml:mover><mml:mi>T</mml:mi></mml:msup><mml:mo>=</mml:mo><mml:mn>0</mml:mn></mml:mrow></mml:math></alternatives></inline-formula> which holds if and only if <inline-formula id="pgen.1009241.e255"><alternatives><graphic id="pgen.1009241.e255g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e255" xlink:type="simple"/><mml:math display="inline" id="M255"><mml:mrow><mml:msubsup><mml:mi>φ</mml:mi><mml:mrow><mml:mi>j</mml:mi><mml:mi>k</mml:mi></mml:mrow><mml:mi>T</mml:mi></mml:msubsup><mml:mo>=</mml:mo><mml:mn>0</mml:mn></mml:mrow></mml:math></alternatives></inline-formula> for every pair of individuals <italic>j</italic> ≠ <italic>k</italic>. The resulting WG inbreeding coefficient estimator is
<disp-formula id="pgen.1009241.e256"><alternatives><graphic id="pgen.1009241.e256g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e256" xlink:type="simple"/><mml:math display="block" id="M256"><mml:mrow><mml:msubsup><mml:mover accent="true"><mml:mi>f</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mi>j</mml:mi><mml:mi>k</mml:mi></mml:mrow><mml:mrow><mml:mi>T</mml:mi><mml:mo>,</mml:mo><mml:mtext>WG</mml:mtext></mml:mrow></mml:msubsup><mml:mo>=</mml:mo><mml:mn>2</mml:mn><mml:msubsup><mml:mover accent="true"><mml:mi>φ</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mi>j</mml:mi><mml:mi>k</mml:mi></mml:mrow><mml:mrow><mml:mi>T</mml:mi><mml:mo>,</mml:mo><mml:mtext>WG</mml:mtext></mml:mrow></mml:msubsup><mml:mo>−</mml:mo><mml:mn>1</mml:mn><mml:munderover><mml:mo>→</mml:mo><mml:mrow><mml:mi>m</mml:mi><mml:mo>→</mml:mo><mml:mi>∞</mml:mi></mml:mrow><mml:mrow><mml:mtext>a.s.</mml:mtext></mml:mrow></mml:munderover><mml:mfrac><mml:mrow><mml:msubsup><mml:mi>f</mml:mi><mml:mi>j</mml:mi><mml:mi>T</mml:mi></mml:msubsup><mml:mo>−</mml:mo><mml:msup><mml:mover accent="true"><mml:mi>φ</mml:mi><mml:mo>˜</mml:mo></mml:mover><mml:mi>T</mml:mi></mml:msup></mml:mrow><mml:mrow><mml:mn>1</mml:mn><mml:mo>−</mml:mo><mml:msup><mml:mover accent="true"><mml:mi>φ</mml:mi><mml:mo>˜</mml:mo></mml:mover><mml:mi>T</mml:mi></mml:msup></mml:mrow></mml:mfrac><mml:mo>,</mml:mo></mml:mrow></mml:math></alternatives></disp-formula>
which estimates linearly-transformed inbreeding values [<xref ref-type="bibr" rid="pgen.1009241.ref021">21</xref>]. Therefore, the resulting WG <italic>F</italic><sub>ST</sub> estimator (for individuals) also targets a linearly-transformed <italic>F</italic><sub>ST</sub> value (under locally-outbred individuals, where <italic>F</italic><sub>ST</sub> is given by <xref ref-type="disp-formula" rid="pgen.1009241.e042">Eq (4)</xref>), namely
<disp-formula id="pgen.1009241.e257"><alternatives><graphic id="pgen.1009241.e257g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e257" xlink:type="simple"/><mml:math display="block" id="M257"><mml:mrow><mml:msubsup><mml:mover accent="true"><mml:mi>F</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mtext>ST</mml:mtext></mml:mrow><mml:mrow><mml:mtext>WG</mml:mtext></mml:mrow></mml:msubsup><mml:mo>=</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:mi>n</mml:mi></mml:mfrac><mml:mstyle displaystyle="true"><mml:mstyle displaystyle="true"><mml:munderover><mml:mo>∑</mml:mo><mml:mrow><mml:mi>j</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>n</mml:mi></mml:munderover></mml:mstyle><mml:mrow><mml:msubsup><mml:mover accent="true"><mml:mi>f</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>j</mml:mi><mml:mrow><mml:mi>T</mml:mi><mml:mo>,</mml:mo><mml:mtext>WG</mml:mtext></mml:mrow></mml:msubsup></mml:mrow></mml:mstyle><mml:munderover><mml:mo>→</mml:mo><mml:mrow><mml:mi>m</mml:mi><mml:mo>→</mml:mo><mml:mi>∞</mml:mi></mml:mrow><mml:mrow><mml:mtext>a.s.</mml:mtext></mml:mrow></mml:munderover><mml:mfrac><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mrow><mml:mtext>ST</mml:mtext></mml:mrow></mml:msub><mml:mo>−</mml:mo><mml:msup><mml:mover accent="true"><mml:mi>φ</mml:mi><mml:mo>˜</mml:mo></mml:mover><mml:mi>T</mml:mi></mml:msup></mml:mrow><mml:mrow><mml:mn>1</mml:mn><mml:mo>−</mml:mo><mml:msup><mml:mover accent="true"><mml:mi>φ</mml:mi><mml:mo>˜</mml:mo></mml:mover><mml:mi>T</mml:mi></mml:msup></mml:mrow></mml:mfrac><mml:mo>.</mml:mo></mml:mrow></mml:math></alternatives></disp-formula>
The WG authors also briefly consider a variant of their kinship estimator that is normalized using the minimum kinship value as we did, developed concurrently with our approach [<xref ref-type="bibr" rid="pgen.1009241.ref058">58</xref>], but was largely dismissed as an unnecessary correction [<xref ref-type="bibr" rid="pgen.1009241.ref021">21</xref>, <xref ref-type="bibr" rid="pgen.1009241.ref076">76</xref>]. See <xref ref-type="supplementary-material" rid="pgen.1009241.s001">S1 Text</xref> for a detailed proof that the general estimator framework we propose here (Eqs <xref ref-type="disp-formula" rid="pgen.1009241.e221">(33)</xref> and <xref ref-type="disp-formula" rid="pgen.1009241.e234">(34)</xref>) is algebraically equivalent to our original formulation in [<xref ref-type="bibr" rid="pgen.1009241.ref058">58</xref>].</p>
<p>Note that the original WG does not estimate <italic>F</italic><sub>ST</sub> from individuals as considered above; instead, <italic>F</italic><sub>ST</sub> is estimated from coancestry estimates for subpopulations (which equals our HudsonK for biallelic loci, <xref ref-type="supplementary-material" rid="pgen.1009241.s001">S1 Text</xref>) [<xref ref-type="bibr" rid="pgen.1009241.ref020">20</xref>–<xref ref-type="bibr" rid="pgen.1009241.ref022">22</xref>]. For completeness, we consider both kinds of <italic>F</italic><sub>ST</sub> estimates in the evaluations that follow.</p>
</sec>
</sec>
<sec id="sec022">
<title>Simulations evaluating <italic>F</italic><sub>ST</sub> and kinship estimators</title>
<sec id="sec023">
<title>Overview of simulations</title>
<p>We simulate genotypes from two models to illustrate our results when the true population structure parameters are known. Both simulations have clearly-defined IBD probability parameters in terms of the MRCA population. The first simulation satisfies the independent subpopulations model that existing <italic>F</italic><sub>ST</sub> estimators assume. The second simulation is from an admixture model with no independent subpopulations and pervasive kinship designed to induce large downward biases in existing kinship and <italic>F</italic><sub>ST</sub> estimators (<xref ref-type="fig" rid="pgen.1009241.g002">Fig 2</xref>). This admixture scenario resembles the population structure we estimated for Hispanics in the 1000 Genomes Project [<xref ref-type="bibr" rid="pgen.1009241.ref059">59</xref>]: compare the simulated kinship matrix (<xref ref-type="fig" rid="pgen.1009241.g002">Fig 2B</xref>) and admixture proportions (<xref ref-type="fig" rid="pgen.1009241.g003">Fig 3C</xref>) to our estimates on the real data [<xref ref-type="bibr" rid="pgen.1009241.ref059">59</xref>]. Both simulations have <italic>n</italic> = 1000 individuals, <italic>m</italic> = 300, 000 loci, and <italic>K</italic> = 10 subpopulations or intermediate subpopulations. These simulations have <italic>F</italic><sub>ST</sub> = 0.1, comparable to previous estimates between human populations (in 1000 Genomes, the estimated <italic>F</italic><sub>ST</sub> between CEU (European-Americans) and CHB (Chinese) is 0.106, between CEU and YRI (Yoruba from Nigeria) it is 0.139, and between CHB and YRI it is 0.161 [<xref ref-type="bibr" rid="pgen.1009241.ref023">23</xref>]).</p>
<fig id="pgen.1009241.g002" position="float">
<object-id pub-id-type="doi">10.1371/journal.pgen.1009241.g002</object-id>
<label>Fig 2</label>
<caption>
<title>Coancestry matrices of simulations.</title>
<p>Both panels have <italic>n</italic> = 1000 individuals along both axes, <italic>K</italic> = 10 subpopulations (final or intermediate), and <italic>F</italic><sub>ST</sub> = 0.1. Color corresponds to <inline-formula id="pgen.1009241.e258"><alternatives><graphic id="pgen.1009241.e258g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e258" xlink:type="simple"/><mml:math display="inline" id="M258"><mml:msubsup><mml:mi>θ</mml:mi><mml:mrow><mml:mi>j</mml:mi><mml:mi>k</mml:mi></mml:mrow><mml:mi>T</mml:mi></mml:msubsup></mml:math></alternatives></inline-formula> between individuals <italic>j</italic> and <italic>k</italic> (equal to <inline-formula id="pgen.1009241.e259"><alternatives><graphic id="pgen.1009241.e259g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e259" xlink:type="simple"/><mml:math display="inline" id="M259"><mml:msubsup><mml:mi>φ</mml:mi><mml:mrow><mml:mi>j</mml:mi><mml:mi>k</mml:mi></mml:mrow><mml:mi>T</mml:mi></mml:msubsup></mml:math></alternatives></inline-formula> off-diagonal, <inline-formula id="pgen.1009241.e260"><alternatives><graphic id="pgen.1009241.e260g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e260" xlink:type="simple"/><mml:math display="inline" id="M260"><mml:msubsup><mml:mi>f</mml:mi><mml:mrow><mml:mi>j</mml:mi></mml:mrow><mml:mi>T</mml:mi></mml:msubsup></mml:math></alternatives></inline-formula> along the diagonal). (A) The independent subpopulations model has <inline-formula id="pgen.1009241.e261"><alternatives><graphic id="pgen.1009241.e261g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e261" xlink:type="simple"/><mml:math display="inline" id="M261"><mml:mrow><mml:msubsup><mml:mi>θ</mml:mi><mml:mrow><mml:mi>j</mml:mi><mml:mi>k</mml:mi></mml:mrow><mml:mi>T</mml:mi></mml:msubsup><mml:mo>=</mml:mo><mml:mn>0</mml:mn></mml:mrow></mml:math></alternatives></inline-formula> between subpopulations, and varying <inline-formula id="pgen.1009241.e262"><alternatives><graphic id="pgen.1009241.e262g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e262" xlink:type="simple"/><mml:math display="inline" id="M262"><mml:msubsup><mml:mi>θ</mml:mi><mml:mrow><mml:mi>j</mml:mi><mml:mi>j</mml:mi></mml:mrow><mml:mi>T</mml:mi></mml:msubsup></mml:math></alternatives></inline-formula> per subpopulation, resulting in a block-diagonal coancestry matrix. (B) Our admixture scenario models a 1D geography with extensive admixture and intermediate subpopulation differentiation that increases with distance, resulting in a smooth coancestry matrix with no independent subpopulations (no <inline-formula id="pgen.1009241.e263"><alternatives><graphic id="pgen.1009241.e263g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e263" xlink:type="simple"/><mml:math display="inline" id="M263"><mml:mrow><mml:msubsup><mml:mi>θ</mml:mi><mml:mrow><mml:mi>j</mml:mi><mml:mi>k</mml:mi></mml:mrow><mml:mi>T</mml:mi></mml:msubsup><mml:mo>=</mml:mo><mml:mn>0</mml:mn></mml:mrow></mml:math></alternatives></inline-formula> between blocks). Individuals are ordered along each axis by geographical position.</p>
</caption>
<graphic mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pgen.1009241.g002" xlink:type="simple"/>
</fig>
<fig id="pgen.1009241.g003" position="float">
<object-id pub-id-type="doi">10.1371/journal.pgen.1009241.g003</object-id>
<label>Fig 3</label>
<caption>
<title>1D admixture scenario.</title>
<p>We model a 1D geography population that departs strongly from the independent subpopulations model. (A) <italic>K</italic> = 10 intermediate subpopulations, evenly spaced on a line, evolved independently in the past with <italic>F</italic><sub>ST</sub> increasing with distance, which models a sequence of increasing founder effects (from left to right) to mimic the global human population. (B) Once differentiated, individuals in these intermediate subpopulations spread by random walk modeled by Normal densities. (C) <italic>n</italic> = 1000 individuals, sampled evenly in the same geographical range, are admixed proportionally to the previous Normal densities. Thus, each individual draws most of its alleles from the closest intermediate subpopulation, and draws the fewest alleles from the most distant populations. Long-distance random walks of intermediate subpopulation individuals results in kinship for admixed individuals that decays smoothly with distance in <xref ref-type="fig" rid="pgen.1009241.g002">Fig 2B</xref>. (D) For <italic>F</italic><sub>ST</sub> estimators that require a partition of individuals into subpopulations, individuals are clustered by geographical position (<italic>K</italic> = 10).</p>
</caption>
<graphic mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pgen.1009241.g003" xlink:type="simple"/>
</fig>
<p>The independent subpopulations simulation satisfies the HudsonK and BayeScan estimator assumptions: each independent subpopulation <italic>S</italic><sub><italic>u</italic></sub> has a different <italic>F</italic><sub>ST</sub> value of <inline-formula id="pgen.1009241.e264"><alternatives><graphic id="pgen.1009241.e264g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e264" xlink:type="simple"/><mml:math display="inline" id="M264"><mml:msubsup><mml:mi>f</mml:mi><mml:mrow><mml:msub><mml:mi>S</mml:mi><mml:mi>u</mml:mi></mml:msub></mml:mrow><mml:mi>T</mml:mi></mml:msubsup></mml:math></alternatives></inline-formula> relative to the MRCA population <italic>T</italic> (<xref ref-type="fig" rid="pgen.1009241.g002">Fig 2A</xref>). Ancestral allele frequencies <inline-formula id="pgen.1009241.e265"><alternatives><graphic id="pgen.1009241.e265g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e265" xlink:type="simple"/><mml:math display="inline" id="M265"><mml:msubsup><mml:mi>p</mml:mi><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup></mml:math></alternatives></inline-formula> are drawn uniformly between 0.01 and 0.5. Allele frequencies <inline-formula id="pgen.1009241.e266"><alternatives><graphic id="pgen.1009241.e266g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e266" xlink:type="simple"/><mml:math display="inline" id="M266"><mml:msubsup><mml:mi>p</mml:mi><mml:mi>i</mml:mi><mml:msub><mml:mi>S</mml:mi><mml:mi>u</mml:mi></mml:msub></mml:msubsup></mml:math></alternatives></inline-formula> for <italic>S</italic><sub><italic>u</italic></sub> and locus <italic>i</italic> are drawn independently from the Balding-Nichols (BN) distribution [<xref ref-type="bibr" rid="pgen.1009241.ref003">3</xref>] with parameters <inline-formula id="pgen.1009241.e267"><alternatives><graphic id="pgen.1009241.e267g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e267" xlink:type="simple"/><mml:math display="inline" id="M267"><mml:msubsup><mml:mi>p</mml:mi><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup></mml:math></alternatives></inline-formula> and <inline-formula id="pgen.1009241.e268"><alternatives><graphic id="pgen.1009241.e268g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e268" xlink:type="simple"/><mml:math display="inline" id="M268"><mml:msubsup><mml:mi>f</mml:mi><mml:mrow><mml:msub><mml:mi>S</mml:mi><mml:mi>u</mml:mi></mml:msub></mml:mrow><mml:mi>T</mml:mi></mml:msubsup></mml:math></alternatives></inline-formula>. Every individual <italic>j</italic> in subpopulation <italic>S</italic><sub><italic>u</italic></sub> draws alleles randomly with probability <inline-formula id="pgen.1009241.e269"><alternatives><graphic id="pgen.1009241.e269g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e269" xlink:type="simple"/><mml:math display="inline" id="M269"><mml:msubsup><mml:mi>p</mml:mi><mml:mi>i</mml:mi><mml:msub><mml:mi>S</mml:mi><mml:mi>u</mml:mi></mml:msub></mml:msubsup></mml:math></alternatives></inline-formula>. Subpopulation sample sizes are drawn randomly (<xref ref-type="sec" rid="sec028">Methods</xref>, section <bold>Simulations</bold>).</p>
<p>The admixture simulation corresponds to a “BN-PSD” model [<xref ref-type="bibr" rid="pgen.1009241.ref006">6</xref>, <xref ref-type="bibr" rid="pgen.1009241.ref027">27</xref>, <xref ref-type="bibr" rid="pgen.1009241.ref034">34</xref>, <xref ref-type="bibr" rid="pgen.1009241.ref060">60</xref>, <xref ref-type="bibr" rid="pgen.1009241.ref077">77</xref>]: the intermediate subpopulations are independent subpopulations that draw <inline-formula id="pgen.1009241.e270"><alternatives><graphic id="pgen.1009241.e270g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e270" xlink:type="simple"/><mml:math display="inline" id="M270"><mml:msubsup><mml:mi>p</mml:mi><mml:mi>i</mml:mi><mml:msub><mml:mi>S</mml:mi><mml:mi>u</mml:mi></mml:msub></mml:msubsup></mml:math></alternatives></inline-formula> from the BN model, then each individual <italic>j</italic> constructs its allele frequencies as <inline-formula id="pgen.1009241.e271"><alternatives><graphic id="pgen.1009241.e271g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e271" xlink:type="simple"/><mml:math display="inline" id="M271"><mml:mrow><mml:msub><mml:mi>π</mml:mi><mml:mrow><mml:mi>i</mml:mi><mml:mi>j</mml:mi></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:msubsup><mml:mo>∑</mml:mo><mml:mrow><mml:mi>u</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>K</mml:mi></mml:msubsup><mml:msubsup><mml:mi>p</mml:mi><mml:mi>i</mml:mi><mml:msub><mml:mi>S</mml:mi><mml:mi>u</mml:mi></mml:msub></mml:msubsup><mml:msub><mml:mi>q</mml:mi><mml:mrow><mml:mi>j</mml:mi><mml:mi>u</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:math></alternatives></inline-formula>, which is a weighted average of the subpopulation allele frequencies <inline-formula id="pgen.1009241.e272"><alternatives><graphic id="pgen.1009241.e272g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e272" xlink:type="simple"/><mml:math display="inline" id="M272"><mml:msubsup><mml:mi>p</mml:mi><mml:mi>i</mml:mi><mml:msub><mml:mi>S</mml:mi><mml:mi>u</mml:mi></mml:msub></mml:msubsup></mml:math></alternatives></inline-formula> with the admixture proportions <italic>q</italic><sub><italic>ju</italic></sub> of individual <italic>j</italic> and subpopulation <italic>u</italic> as weights (which satisfy <inline-formula id="pgen.1009241.e273"><alternatives><graphic id="pgen.1009241.e273g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e273" xlink:type="simple"/><mml:math display="inline" id="M273"><mml:mrow><mml:msubsup><mml:mo>∑</mml:mo><mml:mrow><mml:mi>u</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>K</mml:mi></mml:msubsup><mml:msub><mml:mi>q</mml:mi><mml:mrow><mml:mi>j</mml:mi><mml:mi>u</mml:mi></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow></mml:math></alternatives></inline-formula>), as in the Pritchard-Stephens-Donnelly (PSD) admixture model [<xref ref-type="bibr" rid="pgen.1009241.ref063">63</xref>–<xref ref-type="bibr" rid="pgen.1009241.ref065">65</xref>]. We constructed <italic>q</italic><sub><italic>ju</italic></sub> that model admixture resulting from spread by random walk of the intermediate subpopulations along a one-dimensional geography, as follows. Intermediate subpopulations <italic>S</italic><sub><italic>u</italic></sub> are placed on a line with differentiation <inline-formula id="pgen.1009241.e274"><alternatives><graphic id="pgen.1009241.e274g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e274" xlink:type="simple"/><mml:math display="inline" id="M274"><mml:msubsup><mml:mi>f</mml:mi><mml:mrow><mml:msub><mml:mi>S</mml:mi><mml:mi>u</mml:mi></mml:msub></mml:mrow><mml:mi>T</mml:mi></mml:msubsup></mml:math></alternatives></inline-formula> that grows with distance, which corresponds to a serial founder effect (<xref ref-type="fig" rid="pgen.1009241.g003">Fig 3A</xref>). Upon differentiation, individuals in each <italic>S</italic><sub><italic>u</italic></sub> spread by random walk, a process modeled by Normal densities (<xref ref-type="fig" rid="pgen.1009241.g003">Fig 3B</xref>). Admixed individuals derive their ancestry proportional from these Normal densities, resulting in a genetic structure governed by geography (Figs <xref ref-type="fig" rid="pgen.1009241.g003">3C</xref> and <xref ref-type="fig" rid="pgen.1009241.g002">2B</xref>) and departing strongly from the independent subpopulations model (<xref ref-type="fig" rid="pgen.1009241.g003">Fig 3D</xref>). The amount of spread—which sets the mean kinship across all individuals—was chosen to give a bias coefficient of <inline-formula id="pgen.1009241.e275"><alternatives><graphic id="pgen.1009241.e275g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e275" xlink:type="simple"/><mml:math display="inline" id="M275"><mml:mrow><mml:msup><mml:mi>s</mml:mi><mml:mi>T</mml:mi></mml:msup><mml:mo>=</mml:mo><mml:mfrac><mml:msup><mml:mover accent="true"><mml:mi>θ</mml:mi><mml:mo>¯</mml:mo></mml:mover><mml:mi>T</mml:mi></mml:msup><mml:msub><mml:mi>F</mml:mi><mml:mtext>ST</mml:mtext></mml:msub></mml:mfrac><mml:mo>=</mml:mo><mml:mn>0</mml:mn><mml:mo>.</mml:mo><mml:mn>5</mml:mn></mml:mrow></mml:math></alternatives></inline-formula>, which by <xref ref-type="disp-formula" rid="pgen.1009241.e210">Eq (32)</xref> results in a large downward bias for <inline-formula id="pgen.1009241.e276"><alternatives><graphic id="pgen.1009241.e276g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e276" xlink:type="simple"/><mml:math display="inline" id="M276"><mml:msubsup><mml:mover accent="true"><mml:mi>F</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mtext>ST</mml:mtext></mml:mrow><mml:mtext>std</mml:mtext></mml:msubsup></mml:math></alternatives></inline-formula> (in contrast, the independent subpopulations simulation has <italic>s</italic><sup><italic>T</italic></sup> = 0.1). The true coancestry and <italic>F</italic><sub>ST</sub> parameters of this simulation are given by the <inline-formula id="pgen.1009241.e277"><alternatives><graphic id="pgen.1009241.e277g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e277" xlink:type="simple"/><mml:math display="inline" id="M277"><mml:msubsup><mml:mi>f</mml:mi><mml:mrow><mml:msub><mml:mi>S</mml:mi><mml:mi>u</mml:mi></mml:msub></mml:mrow><mml:mi>T</mml:mi></mml:msubsup></mml:math></alternatives></inline-formula> values of the intermediate subpopulations and the admixture coefficients <italic>q</italic><sub><italic>ju</italic></sub> of the individuals via the following equations [<xref ref-type="bibr" rid="pgen.1009241.ref057">57</xref>]:
<disp-formula id="pgen.1009241.e278"><alternatives><graphic id="pgen.1009241.e278g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e278" xlink:type="simple"/><mml:math display="block" id="M278"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="right"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="right"><mml:msubsup><mml:mi>θ</mml:mi><mml:mrow><mml:mi>j</mml:mi><mml:mi>k</mml:mi></mml:mrow><mml:mi>T</mml:mi></mml:msubsup></mml:mtd><mml:mtd columnalign="left"><mml:mrow><mml:mo>=</mml:mo><mml:mstyle displaystyle="true"><mml:munderover><mml:mo>∑</mml:mo><mml:mrow><mml:mi>u</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>K</mml:mi></mml:munderover></mml:mstyle><mml:msub><mml:mi>q</mml:mi><mml:mrow><mml:mi>j</mml:mi><mml:mi>u</mml:mi></mml:mrow></mml:msub><mml:msub><mml:mi>q</mml:mi><mml:mrow><mml:mi>k</mml:mi><mml:mi>u</mml:mi></mml:mrow></mml:msub><mml:msubsup><mml:mi>f</mml:mi><mml:mrow><mml:msub><mml:mi>S</mml:mi><mml:mi>u</mml:mi></mml:msub></mml:mrow><mml:mi>T</mml:mi></mml:msubsup><mml:mo>,</mml:mo></mml:mrow></mml:mtd></mml:mtr><mml:mtr><mml:mtd columnalign="right"><mml:msub><mml:mi>F</mml:mi><mml:mtext>ST</mml:mtext></mml:msub></mml:mtd><mml:mtd columnalign="left"><mml:mrow><mml:mo>=</mml:mo><mml:mstyle displaystyle="true"><mml:munderover><mml:mo>∑</mml:mo><mml:mrow><mml:mi>j</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>n</mml:mi></mml:munderover></mml:mstyle><mml:mstyle displaystyle="true"><mml:munderover><mml:mo>∑</mml:mo><mml:mrow><mml:mi>u</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>K</mml:mi></mml:munderover></mml:mstyle><mml:msub><mml:mi>w</mml:mi><mml:mi>j</mml:mi></mml:msub><mml:msubsup><mml:mi>q</mml:mi><mml:mrow><mml:mi>j</mml:mi><mml:mi>u</mml:mi></mml:mrow><mml:mn>2</mml:mn></mml:msubsup><mml:msubsup><mml:mi>f</mml:mi><mml:mrow><mml:msub><mml:mi>S</mml:mi><mml:mi>u</mml:mi></mml:msub></mml:mrow><mml:mi>T</mml:mi></mml:msubsup><mml:mo>.</mml:mo></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives> <label>(39)</label></disp-formula>
The first equation above connecting coancestry to admixture proportions was derived independently in other work [<xref ref-type="bibr" rid="pgen.1009241.ref062">62</xref>], but the <italic>F</italic><sub>ST</sub> for the admixed individuals was absent and instead follows from our generalized <italic>F</italic><sub>ST</sub> definition given in <xref ref-type="disp-formula" rid="pgen.1009241.e053">Eq (9)</xref>. See <xref ref-type="sec" rid="sec028">Methods</xref>, section <bold>Simulations</bold> for additional details regarding these simulations.</p>
</sec>
<sec id="sec024">
<title>Evaluation of <italic>F</italic><sub>ST</sub> estimators</title>
<p>Our admixture simulation illustrates the large biases that can arise if existing <italic>F</italic><sub>ST</sub> estimators that require independent subpopulations or <italic>F</italic><sub>ST</sub> estimates derived from existing kinship estimators are misapplied to arbitrary population structures to estimate the generalized <italic>F</italic><sub>ST</sub>, and demonstrate the higher accuracy of our new <italic>F</italic><sub>ST</sub> estimator (<inline-formula id="pgen.1009241.e279"><alternatives><graphic id="pgen.1009241.e279g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e279" xlink:type="simple"/><mml:math display="inline" id="M279"><mml:msubsup><mml:mover accent="true"><mml:mi>F</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mtext>ST</mml:mtext></mml:mrow><mml:mtext>new</mml:mtext></mml:msubsup></mml:math></alternatives></inline-formula> given by the combination of Eqs <xref ref-type="disp-formula" rid="pgen.1009241.e236">(36)</xref> and <xref ref-type="disp-formula" rid="pgen.1009241.e243">(37)</xref>). The WC <italic>F</italic><sub>IT</sub> (total inbreeding) estimator was also evaluated.</p>
<p>First, we test these estimators in our independent subpopulations simulation. The HudsonK (<xref ref-type="sec" rid="sec028">Methods</xref>, section <bold>Generalized HudsonK <italic>F</italic><sub>ST</sub> estimator</bold>) and BayeScan <italic>F</italic><sub>ST</sub> estimators are consistent in this simulation, since their assumptions are satisfied (<xref ref-type="fig" rid="pgen.1009241.g004">Fig 4A</xref>). The WC <italic>F</italic><sub>ST</sub> estimator assumes that <inline-formula id="pgen.1009241.e280"><alternatives><graphic id="pgen.1009241.e280g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e280" xlink:type="simple"/><mml:math display="inline" id="M280"><mml:mrow><mml:msubsup><mml:mi>f</mml:mi><mml:mrow><mml:msub><mml:mi>S</mml:mi><mml:mi>u</mml:mi></mml:msub></mml:mrow><mml:mi>T</mml:mi></mml:msubsup><mml:mo>=</mml:mo><mml:msub><mml:mi>F</mml:mi><mml:mtext>ST</mml:mtext></mml:msub></mml:mrow></mml:math></alternatives></inline-formula> for all subpopulations <italic>S</italic><sub><italic>u</italic></sub>, which does not hold; nevertheless, WC has only a small bias (<xref ref-type="fig" rid="pgen.1009241.g004">Fig 4A</xref>). The WC <italic>F</italic><sub>IT</sub> estimator arrives at similar estimates, as it should since there is no local inbreeding, so the true <italic>F</italic><sub>IT</sub> also equals <italic>F</italic><sub>ST</sub>. The Weir-Hill estimator permits different <inline-formula id="pgen.1009241.e281"><alternatives><graphic id="pgen.1009241.e281g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e281" xlink:type="simple"/><mml:math display="inline" id="M281"><mml:msubsup><mml:mi>f</mml:mi><mml:mrow><mml:msub><mml:mi>S</mml:mi><mml:mi>u</mml:mi></mml:msub></mml:mrow><mml:mi>T</mml:mi></mml:msubsup></mml:math></alternatives></inline-formula> values per subpopulation, but assigns equal weight to individuals rather than subpopulations (<xref ref-type="sec" rid="sec028">Methods</xref>, section <bold>The Weir-Hill <italic>F</italic><sub>ST</sub> estimator</bold>), resulting in a slightly different target <italic>F</italic><sub>ST</sub> (we verified that these estimates are unbiased for this <italic>F</italic><sub>ST</sub>). For comparison, we show the standard kinship-based <inline-formula id="pgen.1009241.e282"><alternatives><graphic id="pgen.1009241.e282g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e282" xlink:type="simple"/><mml:math display="inline" id="M282"><mml:msubsup><mml:mover accent="true"><mml:mi>F</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mtext>ST</mml:mtext></mml:mrow><mml:mtext>std</mml:mtext></mml:msubsup></mml:math></alternatives></inline-formula> in <xref ref-type="disp-formula" rid="pgen.1009241.e179">Eq (25)</xref> (weights from <xref ref-type="sec" rid="sec028">Methods</xref>, section <bold>Simulations</bold>) and <inline-formula id="pgen.1009241.e283"><alternatives><graphic id="pgen.1009241.e283g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e283" xlink:type="simple"/><mml:math display="inline" id="M283"><mml:msubsup><mml:mover accent="true"><mml:mi>F</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mtext>ST</mml:mtext></mml:mrow><mml:mtext>WG</mml:mtext></mml:msubsup></mml:math></alternatives></inline-formula> based on the Weir-Goudet kinship estimates for individuals, both of which do not have corrections that would make them consistent under the independent subpopulations model. Since the number of subpopulations <italic>K</italic> is large, <inline-formula id="pgen.1009241.e284"><alternatives><graphic id="pgen.1009241.e284g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e284" xlink:type="simple"/><mml:math display="inline" id="M284"><mml:msubsup><mml:mover accent="true"><mml:mi>F</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mtext>ST</mml:mtext></mml:mrow><mml:mtext>std</mml:mtext></mml:msubsup></mml:math></alternatives></inline-formula> has a small relative bias of about <inline-formula id="pgen.1009241.e285"><alternatives><graphic id="pgen.1009241.e285g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e285" xlink:type="simple"/><mml:math display="inline" id="M285"><mml:mrow><mml:msup><mml:mi>s</mml:mi><mml:mi>T</mml:mi></mml:msup><mml:mo>=</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:mi>K</mml:mi></mml:mfrac><mml:mo>=</mml:mo><mml:mn>10</mml:mn><mml:mo>%</mml:mo></mml:mrow></mml:math></alternatives></inline-formula> (<xref ref-type="fig" rid="pgen.1009241.g004">Fig 4A</xref>); greater bias is expected for smaller <italic>K</italic>. Our new <italic>F</italic><sub>ST</sub> estimator has a very small bias in this simulation resulting from estimating the minimum kinship from the smallest kinship between subpopulations (see <xref ref-type="disp-formula" rid="pgen.1009241.e243">Eq (37)</xref>) rather than their average as HudsonK does implicitly (<xref ref-type="fig" rid="pgen.1009241.g004">Fig 4A</xref>).</p>
<fig id="pgen.1009241.g004" position="float">
<object-id pub-id-type="doi">10.1371/journal.pgen.1009241.g004</object-id>
<label>Fig 4</label>
<caption>
<title>Evaluation of <italic>F</italic><sub>ST</sub> estimators.</title>
<p>The Weir-Cockerham, Weir-Hill, Weir-Goudet (for individuals), HudsonK (equal to Weir-Goudet for subpopulations, <xref ref-type="supplementary-material" rid="pgen.1009241.s001">S1 Text</xref>), BayeScan, <inline-formula id="pgen.1009241.e286"><alternatives><graphic id="pgen.1009241.e286g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e286" xlink:type="simple"/><mml:math display="inline" id="M286"><mml:msubsup><mml:mover accent="true"><mml:mi>F</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mtext>ST</mml:mtext></mml:mrow><mml:mtext>std</mml:mtext></mml:msubsup></mml:math></alternatives></inline-formula> in <xref ref-type="disp-formula" rid="pgen.1009241.e179">Eq (25)</xref> derived from the standard kinship estimator, and our new <italic>F</italic><sub>ST</sub> estimator in Eqs <xref ref-type="disp-formula" rid="pgen.1009241.e234">(34)</xref> and <xref ref-type="disp-formula" rid="pgen.1009241.e243">(37)</xref>, are evaluated on simulated genotypes from our two models (<xref ref-type="fig" rid="pgen.1009241.g002">Fig 2</xref>). The Weir-Cockerham <italic>F</italic><sub>IT</sub> estimator was also included to show that estimation of total inbreeding behaves similarly to <italic>F</italic><sub>ST</sub> estimators. (A) The independent subpopulations model required by the Weir-Hill, HudsonK, and BayeScan <italic>F</italic><sub>ST</sub> estimators. All but standard kinship (<inline-formula id="pgen.1009241.e287"><alternatives><graphic id="pgen.1009241.e287g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e287" xlink:type="simple"/><mml:math display="inline" id="M287"><mml:msubsup><mml:mover accent="true"><mml:mi>F</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mtext>ST</mml:mtext></mml:mrow><mml:mtext>std</mml:mtext></mml:msubsup></mml:math></alternatives></inline-formula>) and Weir-Goudet (for individuals) recover the target <italic>F</italic><sub>ST</sub> IBD probability in <xref ref-type="disp-formula" rid="pgen.1009241.e053">Eq (9)</xref> (red line) with small errors. (B) Our admixture scenario, which has no independent subpopulations, was constructed so <inline-formula id="pgen.1009241.e288"><alternatives><graphic id="pgen.1009241.e288g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e288" xlink:type="simple"/><mml:math display="inline" id="M288"><mml:mrow><mml:msubsup><mml:mover accent="true"><mml:mi>F</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mtext>ST</mml:mtext></mml:mrow><mml:mtext>std</mml:mtext></mml:msubsup><mml:mo>≈</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:mn>2</mml:mn></mml:mfrac><mml:msub><mml:mi>F</mml:mi><mml:mtext>ST</mml:mtext></mml:msub></mml:mrow></mml:math></alternatives></inline-formula>. Only our new estimates are accurate. The rest of these estimators give values smaller than the target <italic>F</italic><sub>ST</sub> IBD probability, which result from treating kinship as zero between every subpopulations imposed by geographic clustering (or between individuals for Standard Kinship and Weir-Goudet). The <inline-formula id="pgen.1009241.e289"><alternatives><graphic id="pgen.1009241.e289g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e289" xlink:type="simple"/><mml:math display="inline" id="M289"><mml:msubsup><mml:mover accent="true"><mml:mi>F</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mtext>ST</mml:mtext></mml:mrow><mml:mtext>indep</mml:mtext></mml:msubsup></mml:math></alternatives></inline-formula> estimator limit in <xref ref-type="disp-formula" rid="pgen.1009241.e103">Eq (14)</xref> (green dotted line) overlaps the true <italic>F</italic><sub>ST</sub> (red line) in (A) but not (B). Estimates (blue) include 95% prediction intervals (often too narrow to see) from 39 independently-simulated genotype matrices for each model (<xref ref-type="sec" rid="sec028">Methods</xref>, section <bold>Prediction intervals</bold>).</p>
</caption>
<graphic mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pgen.1009241.g004" xlink:type="simple"/>
</fig>
<p>Next we test these estimators in our admixture simulation. To apply the <italic>F</italic><sub>ST</sub> estimators that require subpopulations to the admixture model, individuals are clustered into subpopulations by their geographical position (<xref ref-type="fig" rid="pgen.1009241.g003">Fig 3D</xref>). We find that estimates of all existing methods are smaller than the true <italic>F</italic><sub>ST</sub> by nearly half, as predicted by the limit of <inline-formula id="pgen.1009241.e290"><alternatives><graphic id="pgen.1009241.e290g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e290" xlink:type="simple"/><mml:math display="inline" id="M290"><mml:msubsup><mml:mover accent="true"><mml:mi>F</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mtext>ST</mml:mtext></mml:mrow><mml:mtext>indep</mml:mtext></mml:msubsup></mml:math></alternatives></inline-formula> in <xref ref-type="disp-formula" rid="pgen.1009241.e103">Eq (14)</xref> (<xref ref-type="fig" rid="pgen.1009241.g004">Fig 4B</xref>). The WC <italic>F</italic><sub>IT</sub> estimator obtains slightly larger estimates than the WC <italic>F</italic><sub>ST</sub> estimator, but overall remains as biased as the other <italic>F</italic><sub>ST</sub> estimators, showing that the use of a total inbreeding estimator for independent subpopulations displays the same bias as the corresponding <italic>F</italic><sub>ST</sub> estimator. By construction, the kinship-based <inline-formula id="pgen.1009241.e291"><alternatives><graphic id="pgen.1009241.e291g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e291" xlink:type="simple"/><mml:math display="inline" id="M291"><mml:msubsup><mml:mover accent="true"><mml:mi>F</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mtext>ST</mml:mtext></mml:mrow><mml:mtext>std</mml:mtext></mml:msubsup></mml:math></alternatives></inline-formula> also has a large relative bias of about <italic>s</italic><sup><italic>T</italic></sup> = 50%; remarkably, all existing <italic>F</italic><sub>ST</sub> estimators for subpopulations suffer from comparable biases. Thus, the corrections for independent subpopulations present in the WC, Weir-Hill and HudsonK estimators, or the Bayesian likelihood modeling of BayeScan, are insufficient for accurate estimation of the target generalized <italic>F</italic><sub>ST</sub> (<xref ref-type="disp-formula" rid="pgen.1009241.e053">Eq (9)</xref>) in this admixture scenario. Only our new <italic>F</italic><sub>ST</sub> estimator achieves accurate estimates of the generalized <italic>F</italic><sub>ST</sub> in the admixture simulation (<xref ref-type="fig" rid="pgen.1009241.g004">Fig 4B</xref>).</p>
</sec>
<sec id="sec025">
<title>Evaluation of kinship estimators</title>
<p>Our admixture simulation illustrates the distortions of the standard kinship estimator <inline-formula id="pgen.1009241.e292"><alternatives><graphic id="pgen.1009241.e292g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e292" xlink:type="simple"/><mml:math display="inline" id="M292"><mml:msubsup><mml:mover accent="true"><mml:mi>φ</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mi>j</mml:mi><mml:mi>k</mml:mi></mml:mrow><mml:mrow><mml:mi>T</mml:mi><mml:mo>,</mml:mo><mml:mtext>std</mml:mtext></mml:mrow></mml:msubsup></mml:math></alternatives></inline-formula> in <xref ref-type="disp-formula" rid="pgen.1009241.e136">Eq (18)</xref>, the linearly-transformed kinship values given by the Weir-Goudet estimator, and demonstrates the improved accuracy of our new kinship estimator <inline-formula id="pgen.1009241.e293"><alternatives><graphic id="pgen.1009241.e293g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e293" xlink:type="simple"/><mml:math display="inline" id="M293"><mml:msubsup><mml:mover accent="true"><mml:mi>φ</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mi>j</mml:mi><mml:mi>k</mml:mi></mml:mrow><mml:mrow><mml:mi>T</mml:mi><mml:mo>,</mml:mo><mml:mtext>new</mml:mtext></mml:mrow></mml:msubsup></mml:math></alternatives></inline-formula> given by the combination of Eqs <xref ref-type="disp-formula" rid="pgen.1009241.e234">(34)</xref> and <xref ref-type="disp-formula" rid="pgen.1009241.e243">(37)</xref>. Kinship matrix estimates and their limits are visualized as heatmaps in <xref ref-type="fig" rid="pgen.1009241.g005">Fig 5</xref>, whereas estimator accuracy is shown directly in <xref ref-type="fig" rid="pgen.1009241.g006">Fig 6</xref>. The limit of the standard estimator <inline-formula id="pgen.1009241.e294"><alternatives><graphic id="pgen.1009241.e294g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e294" xlink:type="simple"/><mml:math display="inline" id="M294"><mml:msubsup><mml:mover accent="true"><mml:mi>φ</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mi>j</mml:mi><mml:mi>k</mml:mi></mml:mrow><mml:mrow><mml:mi>T</mml:mi><mml:mo>,</mml:mo><mml:mtext>std</mml:mtext></mml:mrow></mml:msubsup></mml:math></alternatives></inline-formula> in <xref ref-type="disp-formula" rid="pgen.1009241.e136">Eq (18)</xref> would have had a uniform bias if <inline-formula id="pgen.1009241.e295"><alternatives><graphic id="pgen.1009241.e295g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e295" xlink:type="simple"/><mml:math display="inline" id="M295"><mml:mrow><mml:msubsup><mml:mover accent="true"><mml:mi>φ</mml:mi><mml:mo>¯</mml:mo></mml:mover><mml:mi>j</mml:mi><mml:mi>T</mml:mi></mml:msubsup><mml:mo>=</mml:mo><mml:msup><mml:mover accent="true"><mml:mi>φ</mml:mi><mml:mo>¯</mml:mo></mml:mover><mml:mi>T</mml:mi></mml:msup></mml:mrow></mml:math></alternatives></inline-formula> held for all individuals <italic>j</italic>. For that reason, our admixture simulation has varying differentiation <inline-formula id="pgen.1009241.e296"><alternatives><graphic id="pgen.1009241.e296g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e296" xlink:type="simple"/><mml:math display="inline" id="M296"><mml:msubsup><mml:mi>f</mml:mi><mml:mrow><mml:msub><mml:mi>S</mml:mi><mml:mi>u</mml:mi></mml:msub></mml:mrow><mml:mi>T</mml:mi></mml:msubsup></mml:math></alternatives></inline-formula> per intermediate subpopulation <italic>S</italic><sub><italic>u</italic></sub> (<xref ref-type="fig" rid="pgen.1009241.g003">Fig 3A</xref>), which causes large differences in <inline-formula id="pgen.1009241.e297"><alternatives><graphic id="pgen.1009241.e297g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e297" xlink:type="simple"/><mml:math display="inline" id="M297"><mml:msubsup><mml:mover accent="true"><mml:mi>φ</mml:mi><mml:mo>¯</mml:mo></mml:mover><mml:mi>j</mml:mi><mml:mi>T</mml:mi></mml:msubsup></mml:math></alternatives></inline-formula> per individual <italic>j</italic> and therefore large distortions in <inline-formula id="pgen.1009241.e298"><alternatives><graphic id="pgen.1009241.e298g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e298" xlink:type="simple"/><mml:math display="inline" id="M298"><mml:msubsup><mml:mover accent="true"><mml:mi>φ</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mi>j</mml:mi><mml:mi>k</mml:mi></mml:mrow><mml:mrow><mml:mi>T</mml:mi><mml:mo>,</mml:mo><mml:mtext>std</mml:mtext></mml:mrow></mml:msubsup></mml:math></alternatives></inline-formula>. The Weir-Goudet approach estimates the linearly-transformed kinship values calculated in <xref ref-type="disp-formula" rid="pgen.1009241.e253">Eq (38)</xref>.</p>
<fig id="pgen.1009241.g005" position="float">
<object-id pub-id-type="doi">10.1371/journal.pgen.1009241.g005</object-id>
<label>Fig 5</label>
<caption>
<title>Evaluation of kinship estimators.</title>
<p>Observed accuracy for two existing kinship coefficient estimators is illustrated in our admixture simulation and contrasted to the nearly unbiased estimates of our new estimator. Plots show <italic>n</italic> = 1000 individuals along both axes, and color corresponds to <inline-formula id="pgen.1009241.e299"><alternatives><graphic id="pgen.1009241.e299g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e299" xlink:type="simple"/><mml:math display="inline" id="M299"><mml:msubsup><mml:mi>φ</mml:mi><mml:mrow><mml:mi>j</mml:mi><mml:mi>k</mml:mi></mml:mrow><mml:mi>T</mml:mi></mml:msubsup></mml:math></alternatives></inline-formula> between individuals <italic>j</italic> ≠ <italic>k</italic> and to <inline-formula id="pgen.1009241.e300"><alternatives><graphic id="pgen.1009241.e300g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e300" xlink:type="simple"/><mml:math display="inline" id="M300"><mml:msubsup><mml:mi>f</mml:mi><mml:mrow><mml:mi>j</mml:mi></mml:mrow><mml:mi>T</mml:mi></mml:msubsup></mml:math></alternatives></inline-formula> along the diagonal (<inline-formula id="pgen.1009241.e301"><alternatives><graphic id="pgen.1009241.e301g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e301" xlink:type="simple"/><mml:math display="inline" id="M301"><mml:msubsup><mml:mi>f</mml:mi><mml:mrow><mml:mi>j</mml:mi></mml:mrow><mml:mi>T</mml:mi></mml:msubsup></mml:math></alternatives></inline-formula> is in the same scale as <inline-formula id="pgen.1009241.e302"><alternatives><graphic id="pgen.1009241.e302g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e302" xlink:type="simple"/><mml:math display="inline" id="M302"><mml:msubsup><mml:mi>φ</mml:mi><mml:mrow><mml:mi>j</mml:mi><mml:mi>k</mml:mi></mml:mrow><mml:mi>T</mml:mi></mml:msubsup></mml:math></alternatives></inline-formula> for <italic>j</italic> ≠ <italic>k</italic>; plotting <inline-formula id="pgen.1009241.e303"><alternatives><graphic id="pgen.1009241.e303g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e303" xlink:type="simple"/><mml:math display="inline" id="M303"><mml:msubsup><mml:mi>φ</mml:mi><mml:mrow><mml:mi>j</mml:mi><mml:mi>j</mml:mi></mml:mrow><mml:mi>T</mml:mi></mml:msubsup></mml:math></alternatives></inline-formula>, which have a minimum value of <inline-formula id="pgen.1009241.e304"><alternatives><graphic id="pgen.1009241.e304g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e304" xlink:type="simple"/><mml:math display="inline" id="M304"><mml:mfrac><mml:mn>1</mml:mn><mml:mn>2</mml:mn></mml:mfrac></mml:math></alternatives></inline-formula>, would result in a discontinuity in this figure). (A) True kinship matrix. (B) Estimated kinship using our new estimator in Eqs <xref ref-type="disp-formula" rid="pgen.1009241.e234">(34)</xref> and <xref ref-type="disp-formula" rid="pgen.1009241.e243">(37)</xref> from simulated genotypes recovers the true kinship matrix with high accuracy. (C) Theoretical limit of <inline-formula id="pgen.1009241.e305"><alternatives><graphic id="pgen.1009241.e305g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e305" xlink:type="simple"/><mml:math display="inline" id="M305"><mml:msubsup><mml:mover accent="true"><mml:mi>φ</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mi>j</mml:mi><mml:mi>k</mml:mi></mml:mrow><mml:mrow><mml:mi>T</mml:mi><mml:mo>,</mml:mo><mml:mtext>std</mml:mtext></mml:mrow></mml:msubsup></mml:math></alternatives></inline-formula> in <xref ref-type="disp-formula" rid="pgen.1009241.e141">Eq (19)</xref> as the number of independent loci goes to infinity demonstrates the accuracy of our bias predictions under the kinship model. (D) Standard kinship estimates <inline-formula id="pgen.1009241.e306"><alternatives><graphic id="pgen.1009241.e306g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e306" xlink:type="simple"/><mml:math display="inline" id="M306"><mml:msubsup><mml:mover accent="true"><mml:mi>φ</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mi>j</mml:mi><mml:mi>k</mml:mi></mml:mrow><mml:mrow><mml:mi>T</mml:mi><mml:mo>,</mml:mo><mml:mtext>std</mml:mtext></mml:mrow></mml:msubsup></mml:math></alternatives></inline-formula> given by <xref ref-type="disp-formula" rid="pgen.1009241.e136">Eq (18)</xref> from simulated genotypes are downwardly biased on average and distorted by pair-specific amounts. (E) Theoretical limit of the Weir-Goudet kinship estimator given by <xref ref-type="disp-formula" rid="pgen.1009241.e253">Eq (38)</xref>. (F) Weir-Goudet kinship estimates from the same simulated genotypes agree with our calculated limit.</p>
</caption>
<graphic mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pgen.1009241.g005" xlink:type="simple"/>
</fig>
<fig id="pgen.1009241.g006" position="float">
<object-id pub-id-type="doi">10.1371/journal.pgen.1009241.g006</object-id>
<label>Fig 6</label>
<caption>
<title>Accuracy of kinship estimators.</title>
<p>Here the estimated kinship values are directly compared to their true values, in the same admixture simulation data (<italic>n</italic> = 1000 individuals) shown in the previous figure. (A) Kinship between different individuals (excluding inbreeding). The new estimator has practically no bias in this evaluation (falls on the 1-1 dashed gray line). The standard estimator has a complex, non-linear bias that covers a large area of errors. (B) Inbreeding comparison, shows the bias of the standard estimate follows a different pattern for inbreeding compared to kinship between individuals. To better visualize and compare data across panels, a random subset of <italic>n</italic> points (out of the original <italic>n</italic>(<italic>n</italic> − 1)/2 unique individual pairs) were plotted in (A), matching the number of individuals (number of points in (B)).</p>
</caption>
<graphic mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pgen.1009241.g006" xlink:type="simple"/>
</fig>
<p>Our new kinship estimator (<xref ref-type="fig" rid="pgen.1009241.g005">Fig 5B</xref>) recovers the true kinship matrix of this complex population structure (<xref ref-type="fig" rid="pgen.1009241.g005">Fig 5A</xref>), with an RMSE of 2.83% relative to the mean <inline-formula id="pgen.1009241.e307"><alternatives><graphic id="pgen.1009241.e307g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e307" xlink:type="simple"/><mml:math display="inline" id="M307"><mml:msubsup><mml:mi>φ</mml:mi><mml:mrow><mml:mi>j</mml:mi><mml:mi>k</mml:mi></mml:mrow><mml:mi>T</mml:mi></mml:msubsup></mml:math></alternatives></inline-formula> (<xref ref-type="fig" rid="pgen.1009241.g006">Fig 6</xref>). In contrast, estimates using the standard estimator have a large overall downward bias (<xref ref-type="fig" rid="pgen.1009241.g005">Fig 5C</xref>), resulting in an RMSE of 115.72% from the true <inline-formula id="pgen.1009241.e308"><alternatives><graphic id="pgen.1009241.e308g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e308" xlink:type="simple"/><mml:math display="inline" id="M308"><mml:msubsup><mml:mi>φ</mml:mi><mml:mrow><mml:mi>j</mml:mi><mml:mi>k</mml:mi></mml:mrow><mml:mi>T</mml:mi></mml:msubsup></mml:math></alternatives></inline-formula> relative to the mean <inline-formula id="pgen.1009241.e309"><alternatives><graphic id="pgen.1009241.e309g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e309" xlink:type="simple"/><mml:math display="inline" id="M309"><mml:msubsup><mml:mi>φ</mml:mi><mml:mrow><mml:mi>j</mml:mi><mml:mi>k</mml:mi></mml:mrow><mml:mi>T</mml:mi></mml:msubsup></mml:math></alternatives></inline-formula> (<xref ref-type="fig" rid="pgen.1009241.g006">Fig 6</xref>). Additionally, estimates from <inline-formula id="pgen.1009241.e310"><alternatives><graphic id="pgen.1009241.e310g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e310" xlink:type="simple"/><mml:math display="inline" id="M310"><mml:msubsup><mml:mover accent="true"><mml:mi>φ</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mi>j</mml:mi><mml:mi>k</mml:mi></mml:mrow><mml:mrow><mml:mi>T</mml:mi><mml:mo>,</mml:mo><mml:mtext>std</mml:mtext></mml:mrow></mml:msubsup></mml:math></alternatives></inline-formula> are very distorted, with an abundance of <inline-formula id="pgen.1009241.e311"><alternatives><graphic id="pgen.1009241.e311g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e311" xlink:type="simple"/><mml:math display="inline" id="M311"><mml:mrow><mml:msubsup><mml:mover accent="true"><mml:mi>φ</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mi>j</mml:mi><mml:mi>k</mml:mi></mml:mrow><mml:mrow><mml:mi>T</mml:mi><mml:mo>,</mml:mo><mml:mtext>std</mml:mtext></mml:mrow></mml:msubsup><mml:mo>&lt;</mml:mo><mml:msubsup><mml:mi>φ</mml:mi><mml:mrow><mml:mi>j</mml:mi><mml:mi>k</mml:mi></mml:mrow><mml:mi>T</mml:mi></mml:msubsup></mml:mrow></mml:math></alternatives></inline-formula> cases—some of which are negative estimates (blue in <xref ref-type="fig" rid="pgen.1009241.g005">Fig 5C</xref>)—but remarkably also cases with <inline-formula id="pgen.1009241.e312"><alternatives><graphic id="pgen.1009241.e312g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e312" xlink:type="simple"/><mml:math display="inline" id="M312"><mml:mrow><mml:msubsup><mml:mover accent="true"><mml:mi>φ</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mi>j</mml:mi><mml:mi>k</mml:mi></mml:mrow><mml:mrow><mml:mi>T</mml:mi><mml:mo>,</mml:mo><mml:mtext>std</mml:mtext></mml:mrow></mml:msubsup><mml:mo>&gt;</mml:mo><mml:msubsup><mml:mi>φ</mml:mi><mml:mrow><mml:mi>j</mml:mi><mml:mi>k</mml:mi></mml:mrow><mml:mi>T</mml:mi></mml:msubsup></mml:mrow></mml:math></alternatives></inline-formula> (top left corner of Figs <xref ref-type="fig" rid="pgen.1009241.g005">5C</xref> and <xref ref-type="fig" rid="pgen.1009241.g006">6</xref>).</p>
<p>Now we compare the convergence of the ratio-of-means and mean-of-ratios versions of the standard kinship estimator to their biased limit we calculated in <xref ref-type="disp-formula" rid="pgen.1009241.e141">Eq (19)</xref> (<xref ref-type="fig" rid="pgen.1009241.g005">Fig 5D</xref>). The ratio-of-means estimate <inline-formula id="pgen.1009241.e313"><alternatives><graphic id="pgen.1009241.e313g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e313" xlink:type="simple"/><mml:math display="inline" id="M313"><mml:msubsup><mml:mover accent="true"><mml:mi>φ</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mi>j</mml:mi><mml:mi>k</mml:mi></mml:mrow><mml:mrow><mml:mi>T</mml:mi><mml:mo>,</mml:mo><mml:mtext>std</mml:mtext></mml:mrow></mml:msubsup></mml:math></alternatives></inline-formula> (<xref ref-type="fig" rid="pgen.1009241.g005">Fig 5C</xref>) has an RMSE of 2.14% from its limit relative to the mean <inline-formula id="pgen.1009241.e314"><alternatives><graphic id="pgen.1009241.e314g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e314" xlink:type="simple"/><mml:math display="inline" id="M314"><mml:msubsup><mml:mi>φ</mml:mi><mml:mrow><mml:mi>j</mml:mi><mml:mi>k</mml:mi></mml:mrow><mml:mi>T</mml:mi></mml:msubsup></mml:math></alternatives></inline-formula>. In contrast, the mean-of-ratios estimates that are prevalent in the literature have a greater RMSE of 10.77% from the same limit in <xref ref-type="disp-formula" rid="pgen.1009241.e141">Eq (19)</xref>. Thus, as expected from our theoretical results in section <bold>Assessing the accuracy of genome-wide ratio estimators</bold>, the ratio-of-means estimate is much closer to the desired limit than the mean-of-ratio estimate. The distortions are similar for the estimator that uses IAFs in <xref ref-type="disp-formula" rid="pgen.1009241.e400">Eq (24)</xref>, with reduced RMSEs from its limit of 0.32% and 8.82% for the ratio-of-means and mean-of-ratios estimates, respectively.</p>
</sec>
<sec id="sec026">
<title>Evaluation of oracle-adjusted <italic>F</italic><sub>ST</sub> estimators</title>
<p>Here we verify additional calculations for the bias of the standard kinship-based estimator <inline-formula id="pgen.1009241.e315"><alternatives><graphic id="pgen.1009241.e315g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e315" xlink:type="simple"/><mml:math display="inline" id="M315"><mml:msubsup><mml:mover accent="true"><mml:mi>F</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mtext>ST</mml:mtext></mml:mrow><mml:mtext>std</mml:mtext></mml:msubsup></mml:math></alternatives></inline-formula> and the unbiased adjusted “oracle” <italic>F</italic><sub>ST</sub> estimators that require the true mean kinship <inline-formula id="pgen.1009241.e316"><alternatives><graphic id="pgen.1009241.e316g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e316" xlink:type="simple"/><mml:math display="inline" id="M316"><mml:msup><mml:mover accent="true"><mml:mi>φ</mml:mi><mml:mo>¯</mml:mo></mml:mover><mml:mi>T</mml:mi></mml:msup></mml:math></alternatives></inline-formula> or the bias coefficient <italic>s</italic><sup><italic>T</italic></sup> to be known. Note that <inline-formula id="pgen.1009241.e317"><alternatives><graphic id="pgen.1009241.e317g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e317" xlink:type="simple"/><mml:math display="inline" id="M317"><mml:msubsup><mml:mover accent="true"><mml:mi>F</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mtext>ST</mml:mtext></mml:mrow><mml:mtext>new</mml:mtext></mml:msubsup></mml:math></alternatives></inline-formula> in <xref ref-type="disp-formula" rid="pgen.1009241.e236">Eq (36)</xref> is related but not identical to these oracle estimators. We tested both IAF (<xref ref-type="fig" rid="pgen.1009241.g007">Fig 7A</xref>) and genotype (<xref ref-type="fig" rid="pgen.1009241.g007">Fig 7B</xref>) versions of these estimators. The unadjusted <inline-formula id="pgen.1009241.e318"><alternatives><graphic id="pgen.1009241.e318g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e318" xlink:type="simple"/><mml:math display="inline" id="M318"><mml:msubsup><mml:mover accent="true"><mml:mi>F</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mtext>ST</mml:mtext></mml:mrow><mml:mtext>std</mml:mtext></mml:msubsup></mml:math></alternatives></inline-formula> in <xref ref-type="disp-formula" rid="pgen.1009241.e180">Eq (26)</xref> is severely biased (blue in <xref ref-type="fig" rid="pgen.1009241.g007">Fig 7</xref>) by construction, and matches the calculated limit for IAFs and genotypes (green lines in <xref ref-type="fig" rid="pgen.1009241.g007">Fig 7</xref>, which are close because <inline-formula id="pgen.1009241.e319"><alternatives><graphic id="pgen.1009241.e319g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e319" xlink:type="simple"/><mml:math display="inline" id="M319"><mml:mrow><mml:msup><mml:mover accent="true"><mml:mi>φ</mml:mi><mml:mo>¯</mml:mo></mml:mover><mml:mi>T</mml:mi></mml:msup><mml:mo>≈</mml:mo><mml:msup><mml:mover accent="true"><mml:mi>θ</mml:mi><mml:mo>¯</mml:mo></mml:mover><mml:mi>T</mml:mi></mml:msup></mml:mrow></mml:math></alternatives></inline-formula>). In contrast, the two consistent adjusted estimators <inline-formula id="pgen.1009241.e320"><alternatives><graphic id="pgen.1009241.e320g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e320" xlink:type="simple"/><mml:math display="inline" id="M320"><mml:msubsup><mml:mover accent="true"><mml:mi>F</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mtext>ST</mml:mtext></mml:mrow><mml:mo>′</mml:mo></mml:msubsup></mml:math></alternatives></inline-formula> and <inline-formula id="pgen.1009241.e321"><alternatives><graphic id="pgen.1009241.e321g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e321" xlink:type="simple"/><mml:math display="inline" id="M321"><mml:msubsup><mml:mover accent="true"><mml:mi>F</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mtext>ST</mml:mtext></mml:mrow><mml:mrow><mml:mo>′</mml:mo><mml:mo>′</mml:mo></mml:mrow></mml:msubsup></mml:math></alternatives></inline-formula> in Eqs <xref ref-type="disp-formula" rid="pgen.1009241.e196">(27)</xref> and <xref ref-type="disp-formula" rid="pgen.1009241.e203">(31)</xref> estimate <italic>F</italic><sub>ST</sub> quite well (blue predictions overlap the true <italic>F</italic><sub>ST</sub> red line in <xref ref-type="fig" rid="pgen.1009241.g007">Fig 7</xref>). However, <inline-formula id="pgen.1009241.e322"><alternatives><graphic id="pgen.1009241.e322g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e322" xlink:type="simple"/><mml:math display="inline" id="M322"><mml:msubsup><mml:mover accent="true"><mml:mi>F</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mtext>ST</mml:mtext></mml:mrow><mml:mo>′</mml:mo></mml:msubsup></mml:math></alternatives></inline-formula> and <inline-formula id="pgen.1009241.e323"><alternatives><graphic id="pgen.1009241.e323g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e323" xlink:type="simple"/><mml:math display="inline" id="M323"><mml:msubsup><mml:mover accent="true"><mml:mi>F</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mtext>ST</mml:mtext></mml:mrow><mml:mrow><mml:mo>′</mml:mo><mml:mo>′</mml:mo></mml:mrow></mml:msubsup></mml:math></alternatives></inline-formula> are oracle methods, since they require parameters (<inline-formula id="pgen.1009241.e324"><alternatives><graphic id="pgen.1009241.e324g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e324" xlink:type="simple"/><mml:math display="inline" id="M324"><mml:msup><mml:mover accent="true"><mml:mi>φ</mml:mi><mml:mo>¯</mml:mo></mml:mover><mml:mi>T</mml:mi></mml:msup></mml:math></alternatives></inline-formula>, <inline-formula id="pgen.1009241.e325"><alternatives><graphic id="pgen.1009241.e325g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e325" xlink:type="simple"/><mml:math display="inline" id="M325"><mml:msup><mml:mover accent="true"><mml:mi>θ</mml:mi><mml:mo>¯</mml:mo></mml:mover><mml:mi>T</mml:mi></mml:msup></mml:math></alternatives></inline-formula>, <italic>s</italic><sup><italic>T</italic></sup>) that are not known in practice.</p>
<fig id="pgen.1009241.g007" position="float">
<object-id pub-id-type="doi">10.1371/journal.pgen.1009241.g007</object-id>
<label>Fig 7</label>
<caption>
<title>Evaluation of standard and adjusted <italic>F</italic><sub>ST</sub> estimators.</title>
<p>The convergence values we calculated for the standard kinship plug-in and adjusted <italic>F</italic><sub>ST</sub> estimators are validated using our admixture simulation. All adjusted estimators are unbiased but are “oracle” methods, since the mean kinship (<inline-formula id="pgen.1009241.e326"><alternatives><graphic id="pgen.1009241.e326g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e326" xlink:type="simple"/><mml:math display="inline" id="M326"><mml:msup><mml:mover accent="true"><mml:mi>φ</mml:mi><mml:mo>¯</mml:mo></mml:mover><mml:mi>T</mml:mi></mml:msup></mml:math></alternatives></inline-formula>), mean coancestry (<inline-formula id="pgen.1009241.e327"><alternatives><graphic id="pgen.1009241.e327g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e327" xlink:type="simple"/><mml:math display="inline" id="M327"><mml:msup><mml:mover accent="true"><mml:mi>θ</mml:mi><mml:mo>¯</mml:mo></mml:mover><mml:mi>T</mml:mi></mml:msup></mml:math></alternatives></inline-formula>), or bias coefficient (<inline-formula id="pgen.1009241.e328"><alternatives><graphic id="pgen.1009241.e328g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e328" xlink:type="simple"/><mml:math display="inline" id="M328"><mml:mrow><mml:msup><mml:mi>s</mml:mi><mml:mi>T</mml:mi></mml:msup><mml:mo>=</mml:mo><mml:mfrac><mml:msup><mml:mover accent="true"><mml:mi>θ</mml:mi><mml:mo>¯</mml:mo></mml:mover><mml:mi>T</mml:mi></mml:msup><mml:msub><mml:mi>F</mml:mi><mml:mtext>ST</mml:mtext></mml:msub></mml:mfrac></mml:mrow></mml:math></alternatives></inline-formula> for IAFs, replaced by <inline-formula id="pgen.1009241.e329"><alternatives><graphic id="pgen.1009241.e329g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e329" xlink:type="simple"/><mml:math display="inline" id="M329"><mml:mfrac><mml:msup><mml:mover accent="true"><mml:mi>φ</mml:mi><mml:mo>¯</mml:mo></mml:mover><mml:mi>T</mml:mi></mml:msup><mml:msub><mml:mi>F</mml:mi><mml:mtext>ST</mml:mtext></mml:msub></mml:mfrac></mml:math></alternatives></inline-formula> for genotypes) are usually unknown. (A) Estimation from individual-specific allele frequencies (IAFs): <inline-formula id="pgen.1009241.e330"><alternatives><graphic id="pgen.1009241.e330g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e330" xlink:type="simple"/><mml:math display="inline" id="M330"><mml:msubsup><mml:mover accent="true"><mml:mi>F</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mtext>ST</mml:mtext></mml:mrow><mml:mtext>std</mml:mtext></mml:msubsup></mml:math></alternatives></inline-formula> is the standard coancestry plug-in estimator in <xref ref-type="disp-formula" rid="pgen.1009241.e180">Eq (26)</xref>; <inline-formula id="pgen.1009241.e331"><alternatives><graphic id="pgen.1009241.e331g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e331" xlink:type="simple"/><mml:math display="inline" id="M331"><mml:msubsup><mml:mover accent="true"><mml:mi>F</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mtext>ST</mml:mtext></mml:mrow><mml:mo>′</mml:mo></mml:msubsup></mml:math></alternatives></inline-formula> “Adj. <inline-formula id="pgen.1009241.e332"><alternatives><graphic id="pgen.1009241.e332g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e332" xlink:type="simple"/><mml:math display="inline" id="M332"><mml:msup><mml:mover accent="true"><mml:mi>θ</mml:mi><mml:mo>¯</mml:mo></mml:mover><mml:mi>T</mml:mi></mml:msup></mml:math></alternatives></inline-formula>” is in <xref ref-type="disp-formula" rid="pgen.1009241.e196">Eq (27)</xref>; <inline-formula id="pgen.1009241.e333"><alternatives><graphic id="pgen.1009241.e333g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e333" xlink:type="simple"/><mml:math display="inline" id="M333"><mml:msubsup><mml:mover accent="true"><mml:mi>F</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mtext>ST</mml:mtext></mml:mrow><mml:mrow><mml:mo>′</mml:mo><mml:mo>′</mml:mo></mml:mrow></mml:msubsup></mml:math></alternatives></inline-formula> “Adj. <italic>s</italic>” is in <xref ref-type="disp-formula" rid="pgen.1009241.e203">Eq (31)</xref>. (B) For genotypes, <inline-formula id="pgen.1009241.e334"><alternatives><graphic id="pgen.1009241.e334g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e334" xlink:type="simple"/><mml:math display="inline" id="M334"><mml:msubsup><mml:mover accent="true"><mml:mi>F</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mtext>ST</mml:mtext></mml:mrow><mml:mtext>std</mml:mtext></mml:msubsup></mml:math></alternatives></inline-formula> is given in <xref ref-type="disp-formula" rid="pgen.1009241.e179">Eq (25)</xref>, and the adjusted estimators use <inline-formula id="pgen.1009241.e335"><alternatives><graphic id="pgen.1009241.e335g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e335" xlink:type="simple"/><mml:math display="inline" id="M335"><mml:msup><mml:mover accent="true"><mml:mi>φ</mml:mi><mml:mo>¯</mml:mo></mml:mover><mml:mi>T</mml:mi></mml:msup></mml:math></alternatives></inline-formula> rather than <inline-formula id="pgen.1009241.e336"><alternatives><graphic id="pgen.1009241.e336g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e336" xlink:type="simple"/><mml:math display="inline" id="M336"><mml:msup><mml:mover accent="true"><mml:mi>θ</mml:mi><mml:mo>¯</mml:mo></mml:mover><mml:mi>T</mml:mi></mml:msup></mml:math></alternatives></inline-formula>. Lines: true <italic>F</italic><sub>ST</sub> (red line), limits of biased estimators <inline-formula id="pgen.1009241.e337"><alternatives><graphic id="pgen.1009241.e337g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e337" xlink:type="simple"/><mml:math display="inline" id="M337"><mml:msubsup><mml:mover accent="true"><mml:mi>F</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mtext>ST</mml:mtext></mml:mrow><mml:mtext>std</mml:mtext></mml:msubsup></mml:math></alternatives></inline-formula> (green lines, which differ slightly per panel). Estimates (blue) include 95% prediction intervals (too narrow to see) from 39 independently-simulated genotype matrices for our admixture model (<xref ref-type="sec" rid="sec028">Methods</xref>, section <bold>Prediction intervals</bold>).</p>
</caption>
<graphic mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pgen.1009241.g007" xlink:type="simple"/>
</fig>
<p>Prediction intervals were computed from estimates over 39 independently-simulated IAF and genotype matrices (<xref ref-type="sec" rid="sec028">Methods</xref>, section <bold>Prediction intervals</bold>). Estimator limits are always contained in these intervals because the number of independent loci (<italic>m</italic> = 300, 000) is sufficiently large. Estimates that use genotypes have wider intervals than estimates from IAFs; however, IAFs are not known in practice, and use of estimated IAFs might increase noise. Genetic linkage, not present in our simulation, will also increase noise in real data.</p>
</sec>
</sec>
</sec>
<sec id="sec027" sec-type="conclusions">
<title>Discussion</title>
<p>We studied analytically the most commonly-used estimators of <italic>F</italic><sub>ST</sub> and kinship, which can be derived using the method of moments. We determined the estimation limits of convergence of these approaches under two models of arbitrary population structure (<xref ref-type="fig" rid="pgen.1009241.g001">Fig 1</xref>). We found that no existing approaches estimate the generalized <italic>F</italic><sub>ST</sub> (an IBD probability) accurately (but note that some of these approaches intended to estimate a linearly-transformed <italic>F</italic><sub>ST</sub> quantity and not the IBD probability). We also showed that the standard kinship estimator is biased on structured populations (particularly when the average kinship is comparable to the kinship coefficients of interest), and this bias varies for each pair of individuals. These results led us to a new kinship estimator, which is consistent if the minimum kinship is estimated consistently (<xref ref-type="fig" rid="pgen.1009241.g001">Fig 1</xref>). We presented an implementation of this approach, which is practically unbiased in our simulations. Our kinship and <italic>F</italic><sub>ST</sub> estimates in human data are consistent with the African Origins model while suggesting that human differentiation is considerably greater than previously estimated [<xref ref-type="bibr" rid="pgen.1009241.ref059">59</xref>].</p>
<p>Estimation of <italic>F</italic><sub>ST</sub> in the correct scale is crucial for its interpretation as an IBD probability, for obtaining comparable estimates in different datasets and across species, as well as for DNA forensics [<xref ref-type="bibr" rid="pgen.1009241.ref003">3</xref>, <xref ref-type="bibr" rid="pgen.1009241.ref007">7</xref>, <xref ref-type="bibr" rid="pgen.1009241.ref019">19</xref>, <xref ref-type="bibr" rid="pgen.1009241.ref020">20</xref>, <xref ref-type="bibr" rid="pgen.1009241.ref078">78</xref>–<xref ref-type="bibr" rid="pgen.1009241.ref080">80</xref>]. Our framework results in a new unbiased genome-wide <italic>F</italic><sub>ST</sub> estimator. However, our findings may not have direct implications for single-locus <italic>F</italic><sub>ST</sub> estimate approaches where only the relative ranking matters, such as for the identification of loci under selection [<xref ref-type="bibr" rid="pgen.1009241.ref008">8</xref>, <xref ref-type="bibr" rid="pgen.1009241.ref010">10</xref>, <xref ref-type="bibr" rid="pgen.1009241.ref081">81</xref>–<xref ref-type="bibr" rid="pgen.1009241.ref086">86</xref>], assuming that the bias of the genome-wide estimator carries over uniformly to all single-locus estimates. Our convergence calculations in section <bold>Assessing the accuracy of genome-wide ratio estimators</bold> require large numbers of loci, so they do not apply to single-locus estimates. Moreover, various methods for single-locus <italic>F</italic><sub>ST</sub> estimation for multiple alleles suffer from a strong dependence to the maximum allele frequency and heterozygosity [<xref ref-type="bibr" rid="pgen.1009241.ref083">83</xref>–<xref ref-type="bibr" rid="pgen.1009241.ref085">85</xref>, <xref ref-type="bibr" rid="pgen.1009241.ref087">87</xref>–<xref ref-type="bibr" rid="pgen.1009241.ref090">90</xref>] that suggests that a more complicated bias is present in these single-locus <italic>F</italic><sub>ST</sub> estimators.</p>
<p>We have shown that the misapplication of existing <italic>F</italic><sub>ST</sub> estimators for independent subpopulations may lead to downwardly-biased estimates that can approach zero even when the true generalized <italic>F</italic><sub>ST</sub> is large. Weir-Cockerham [<xref ref-type="bibr" rid="pgen.1009241.ref017">17</xref>], Weir-Hill [<xref ref-type="bibr" rid="pgen.1009241.ref004">4</xref>], HudsonK (which generalizes the Hudson pairwise <italic>F</italic><sub>ST</sub> estimator [<xref ref-type="bibr" rid="pgen.1009241.ref023">23</xref>] to <italic>K</italic> independent populations; also equals the Weir-Goudet approach for subpopulations [<xref ref-type="bibr" rid="pgen.1009241.ref021">21</xref>]; <xref ref-type="supplementary-material" rid="pgen.1009241.s001">S1 Text</xref>), and BayeScan [<xref ref-type="bibr" rid="pgen.1009241.ref010">10</xref>]<italic>F</italic><sub>ST</sub> estimates in our admixture simulation are all smaller than the <italic>F</italic><sub>ST</sub> target by nearly a factor of two (<xref ref-type="fig" rid="pgen.1009241.g004">Fig 4B</xref>), and differ from our new <italic>F</italic><sub>ST</sub> estimates in humans by nearly a factor of three [<xref ref-type="bibr" rid="pgen.1009241.ref059">59</xref>]. To be accurate, existing <italic>F</italic><sub>ST</sub> estimators require independent subpopulations, so the observed biases arise from their misapplication to subpopulations that are neither independent not homogeneous. Nevertheless, natural populations—particularly humans—often do not adhere to the independent subpopulations model [<xref ref-type="bibr" rid="pgen.1009241.ref059">59</xref>, <xref ref-type="bibr" rid="pgen.1009241.ref091">91</xref>–<xref ref-type="bibr" rid="pgen.1009241.ref095">95</xref>].</p>
<p>The standard kinship coefficient estimator we investigated is often used to control for population structure in GWAS and to estimate genome-wide heritability [<xref ref-type="bibr" rid="pgen.1009241.ref016">16</xref>, <xref ref-type="bibr" rid="pgen.1009241.ref027">27</xref>, <xref ref-type="bibr" rid="pgen.1009241.ref030">30</xref>–<xref ref-type="bibr" rid="pgen.1009241.ref035">35</xref>]. While this estimator was known to be biased [<xref ref-type="bibr" rid="pgen.1009241.ref016">16</xref>, <xref ref-type="bibr" rid="pgen.1009241.ref035">35</xref>], no closed-form limit had been calculated until very recently [<xref ref-type="bibr" rid="pgen.1009241.ref021">21</xref>, <xref ref-type="bibr" rid="pgen.1009241.ref062">62</xref>]. These kinship estimates are biased downwards on average, but bias also varies for each pair of individuals (Figs <xref ref-type="fig" rid="pgen.1009241.g001">1</xref> and <xref ref-type="fig" rid="pgen.1009241.g005">5</xref>). Thus, the use of these distorted kinship estimates may be problematic in GWAS or for estimating heritability, but the extent of the problem remains to be determined.</p>
<p>We developed a theoretical framework for assessing genome-wide ratio estimators of <italic>F</italic><sub>ST</sub> and kinship. We proved that common ratio-of-means estimators converge almost surely to the ratio of expectations for infinite independent loci (<xref ref-type="supplementary-material" rid="pgen.1009241.s001">S1 Text</xref>). Our result justifies approximating the expectation of a ratio-of-means estimator with the ratio of expectations [<xref ref-type="bibr" rid="pgen.1009241.ref004">4</xref>, <xref ref-type="bibr" rid="pgen.1009241.ref017">17</xref>, <xref ref-type="bibr" rid="pgen.1009241.ref023">23</xref>]. However, mean-of-ratios estimators may not converge to the ratio of expectations for infinite loci. Mean-of-ratios estimators are potentially asymptotically unbiased for infinite individuals, but it is unclear which estimators have this behavior. We found that the ratio-of-means kinship estimator had much smaller errors from the ratio of expectations than the more common mean-of-ratios estimator, whose convergence value is unknown. Therefore, we recommend ratio-of-means estimators, whose asymptotic behavior is well understood.</p>
<p>Our new framework enables accurate <italic>F</italic><sub>ST</sub> estimation in more complex datasets than before, but challenges remain. One challenge is the estimation of local inbreeding coefficients, which are required for estimating the generalized <italic>F</italic><sub>ST</sub> when not all individuals are locally outbred. To this end, we suggest employing existing approaches that infer inbreeding from large runs of homozygosity or related strategies [<xref ref-type="bibr" rid="pgen.1009241.ref066">66</xref>–<xref ref-type="bibr" rid="pgen.1009241.ref068">68</xref>], particularly when such self-IBD blocks are much larger than observed between individuals in the same subpopulation. A streamlined approach for jointly estimating total and local inbreeding is desirable, but will require an appropriate evaluation featuring realistic simulation of local inbreeding in a complex population structure. Another challenge is the estimation of the minimum kinship value without the use of subpopulation labels, so that accurate <italic>F</italic><sub>ST</sub> estimates can be obtained with even less user supervision. A more general unsupervised method could better ensure accuracy under extreme cases, such as when there are few unrelated individual pairs. These challenges can be overcome with the estimators we have presented, although supervision is needed to ensure that local inbreeding and the minimum kinship are estimated correctly.</p>
<p>We have demonstrated the need for new models and methods to study complex population structures, and have proposed a new approach for kinship and <italic>F</italic><sub>ST</sub> estimation that provides nearly unbiased estimates in this setting. Extending our implementation to deliver consistent accuracy in arbitrary population structures will require further innovation, and the results provided here may be useful in leading to more robust estimators in the future.</p>
</sec>
<sec id="sec028" sec-type="materials|methods">
<title>Methods</title>
<sec id="sec029">
<title>Previous <italic>F</italic><sub>ST</sub> estimators for the independent subpopulations model</title>
<p>Here we summarize the previous Weir-Cockerham, Weir-Hill, and Hudson <italic>F</italic><sub>ST</sub> estimators for independent subpopulations and derive the generalized HudsonK estimator for more than two subpopulations (which also equals the recent Weir-Goudet <italic>F</italic><sub>ST</sub> estimator for subpopulations under biallelic loci; <xref ref-type="supplementary-material" rid="pgen.1009241.s001">S1 Text</xref>). We show that each of these estimators reduces, under infinite subpopulation sizes, to <inline-formula id="pgen.1009241.e338"><alternatives><graphic id="pgen.1009241.e338g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e338" xlink:type="simple"/><mml:math display="inline" id="M338"><mml:msubsup><mml:mover accent="true"><mml:mi>F</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mtext>ST</mml:mtext></mml:mrow><mml:mtext>indep</mml:mtext></mml:msubsup></mml:math></alternatives></inline-formula> in Eqs <xref ref-type="disp-formula" rid="pgen.1009241.e078">(11)</xref> to <xref ref-type="disp-formula" rid="pgen.1009241.e080">(13)</xref> that was studied in the results. In this section, let <italic>i</italic> index the <italic>m</italic> loci, <italic>j</italic> index the <italic>n</italic> subpopulations, <italic>n</italic><sub><italic>j</italic></sub> be the number of individuals sampled from subpopulation <italic>j</italic>, and <inline-formula id="pgen.1009241.e339"><alternatives><graphic id="pgen.1009241.e339g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e339" xlink:type="simple"/><mml:math display="inline" id="M339"><mml:msub><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mi>i</mml:mi><mml:mi>j</mml:mi></mml:mrow></mml:msub></mml:math></alternatives></inline-formula> be the sample reference allele frequency at locus <italic>i</italic> in subpopulation <italic>j</italic>.</p>
<sec id="sec030">
<title>The Weir-Cockerham <italic>F</italic><sub>ST</sub> estimator</title>
<p>The Weir-Cockerham (WC) <italic>F</italic><sub>ST</sub> estimator [<xref ref-type="bibr" rid="pgen.1009241.ref017">17</xref>] estimates the coancestry parameter <italic>θ</italic><sup><italic>T</italic></sup> shared by each of the <italic>n</italic> independent subpopulation in consideration. Let <inline-formula id="pgen.1009241.e340"><alternatives><graphic id="pgen.1009241.e340g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e340" xlink:type="simple"/><mml:math display="inline" id="M340"><mml:msub><mml:mover accent="true"><mml:mi>h</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mi>i</mml:mi><mml:mi>j</mml:mi></mml:mrow></mml:msub></mml:math></alternatives></inline-formula> denote the fraction of heterozygotes in subpopulation <italic>j</italic> for locus <italic>i</italic>. The ratio-of-means WC <italic>F</italic><sub>ST</sub> estimator and its limit for independent subpopulations (<inline-formula id="pgen.1009241.e341"><alternatives><graphic id="pgen.1009241.e341g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e341" xlink:type="simple"/><mml:math display="inline" id="M341"><mml:mrow><mml:msubsup><mml:mi>θ</mml:mi><mml:mrow><mml:mi>j</mml:mi><mml:mi>k</mml:mi></mml:mrow><mml:mi>T</mml:mi></mml:msubsup><mml:mo>=</mml:mo><mml:mn>0</mml:mn></mml:mrow></mml:math></alternatives></inline-formula> for <italic>j</italic> ≠ <italic>k</italic>) with equal differentiation (<inline-formula id="pgen.1009241.e342"><alternatives><graphic id="pgen.1009241.e342g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e342" xlink:type="simple"/><mml:math display="inline" id="M342"><mml:mrow><mml:msubsup><mml:mi>θ</mml:mi><mml:mrow><mml:mi>j</mml:mi><mml:mi>j</mml:mi></mml:mrow><mml:mi>T</mml:mi></mml:msubsup><mml:mo>=</mml:mo><mml:msup><mml:mi>θ</mml:mi><mml:mi>T</mml:mi></mml:msup></mml:mrow></mml:math></alternatives></inline-formula>) is
<disp-formula id="pgen.1009241.e343"><alternatives><graphic id="pgen.1009241.e343g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e343" xlink:type="simple"/><mml:math display="block" id="M343"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="right"><mml:mover accent="true"><mml:mi>n</mml:mi><mml:mo>¯</mml:mo></mml:mover></mml:mtd><mml:mtd columnalign="left"><mml:mrow><mml:mo>=</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:mi>n</mml:mi></mml:mfrac><mml:mstyle displaystyle="true"><mml:munderover><mml:mo>∑</mml:mo><mml:mrow><mml:mi>j</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>n</mml:mi></mml:munderover></mml:mstyle><mml:msub><mml:mi>n</mml:mi><mml:mi>j</mml:mi></mml:msub><mml:mo>,</mml:mo><mml:mspace width="1em"/><mml:msup><mml:mi>C</mml:mi><mml:mn>2</mml:mn></mml:msup><mml:mo>=</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:mrow><mml:msup><mml:mover accent="true"><mml:mi>n</mml:mi><mml:mo>¯</mml:mo></mml:mover><mml:mn>2</mml:mn></mml:msup><mml:mrow><mml:mo>(</mml:mo><mml:mi>n</mml:mi><mml:mo>-</mml:mo><mml:mn>1</mml:mn><mml:mo>)</mml:mo></mml:mrow></mml:mrow></mml:mfrac><mml:mstyle displaystyle="true"><mml:munderover><mml:mo>∑</mml:mo><mml:mrow><mml:mi>j</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>n</mml:mi></mml:munderover></mml:mstyle><mml:msup><mml:mrow><mml:mo>(</mml:mo><mml:msub><mml:mi>n</mml:mi><mml:mi>j</mml:mi></mml:msub><mml:mo>-</mml:mo><mml:mover accent="true"><mml:mi>n</mml:mi><mml:mo>¯</mml:mo></mml:mover><mml:mo>)</mml:mo></mml:mrow><mml:mn>2</mml:mn></mml:msup><mml:mo>,</mml:mo></mml:mrow></mml:mtd></mml:mtr><mml:mtr><mml:mtd columnalign="right"><mml:msubsup><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup></mml:mtd><mml:mtd columnalign="left"><mml:mrow><mml:mo>=</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:mi>n</mml:mi></mml:mfrac><mml:mstyle displaystyle="true"><mml:munderover><mml:mo>∑</mml:mo><mml:mrow><mml:mi>j</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>n</mml:mi></mml:munderover></mml:mstyle><mml:mfrac><mml:msub><mml:mi>n</mml:mi><mml:mi>j</mml:mi></mml:msub><mml:mover accent="true"><mml:mi>n</mml:mi><mml:mo>¯</mml:mo></mml:mover></mml:mfrac><mml:msub><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mi>i</mml:mi><mml:mi>j</mml:mi></mml:mrow></mml:msub><mml:mo>,</mml:mo><mml:mspace width="1em"/><mml:msub><mml:mover accent="true"><mml:mi>h</mml:mi><mml:mo>¯</mml:mo></mml:mover><mml:mi>i</mml:mi></mml:msub><mml:mo>=</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:mi>n</mml:mi></mml:mfrac><mml:mstyle displaystyle="true"><mml:munderover><mml:mo>∑</mml:mo><mml:mrow><mml:mi>j</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>n</mml:mi></mml:munderover></mml:mstyle><mml:mfrac><mml:msub><mml:mi>n</mml:mi><mml:mi>j</mml:mi></mml:msub><mml:mover accent="true"><mml:mi>n</mml:mi><mml:mo>¯</mml:mo></mml:mover></mml:mfrac><mml:msub><mml:mover accent="true"><mml:mi>h</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mi>i</mml:mi><mml:mi>j</mml:mi></mml:mrow></mml:msub><mml:mo>,</mml:mo><mml:mspace width="1em"/><mml:msubsup><mml:mover accent="true"><mml:mi>σ</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>i</mml:mi><mml:mn>2</mml:mn></mml:msubsup><mml:mo>=</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:mrow><mml:mi>n</mml:mi><mml:mo>-</mml:mo><mml:mn>1</mml:mn></mml:mrow></mml:mfrac><mml:mstyle displaystyle="true"><mml:munderover><mml:mo>∑</mml:mo><mml:mrow><mml:mi>j</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>n</mml:mi></mml:munderover></mml:mstyle><mml:mfrac><mml:msub><mml:mi>n</mml:mi><mml:mi>j</mml:mi></mml:msub><mml:mover accent="true"><mml:mi>n</mml:mi><mml:mo>¯</mml:mo></mml:mover></mml:mfrac><mml:msup><mml:mrow><mml:mo>(</mml:mo><mml:msub><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mi>i</mml:mi><mml:mi>j</mml:mi></mml:mrow></mml:msub><mml:mo>-</mml:mo><mml:msubsup><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup><mml:mo>)</mml:mo></mml:mrow><mml:mn>2</mml:mn></mml:msup><mml:mo>,</mml:mo></mml:mrow></mml:mtd></mml:mtr><mml:mtr><mml:mtd columnalign="right"><mml:msubsup><mml:mover accent="true"><mml:mi>F</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mtext>ST</mml:mtext></mml:mrow><mml:mtext>WC</mml:mtext></mml:msubsup></mml:mtd><mml:mtd columnalign="left"><mml:mrow><mml:mo>=</mml:mo><mml:mfrac><mml:mrow><mml:mstyle displaystyle="true"><mml:munderover><mml:mo>∑</mml:mo><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>m</mml:mi></mml:munderover></mml:mstyle><mml:msubsup><mml:mover accent="true"><mml:mi>σ</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>i</mml:mi><mml:mn>2</mml:mn></mml:msubsup><mml:mo>-</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:mrow><mml:mover accent="true"><mml:mi>n</mml:mi><mml:mo>¯</mml:mo></mml:mover><mml:mo>-</mml:mo><mml:mn>1</mml:mn></mml:mrow></mml:mfrac><mml:mo>(</mml:mo><mml:msubsup><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup><mml:mo>(</mml:mo><mml:mn>1</mml:mn><mml:mo>-</mml:mo><mml:msubsup><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup><mml:mo>)</mml:mo><mml:mo>-</mml:mo><mml:mfrac><mml:mrow><mml:mi>n</mml:mi><mml:mo>-</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>n</mml:mi></mml:mfrac><mml:msubsup><mml:mover accent="true"><mml:mi>σ</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>i</mml:mi><mml:mn>2</mml:mn></mml:msubsup><mml:mo>-</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:mn>4</mml:mn></mml:mfrac><mml:msub><mml:mover accent="true"><mml:mi>h</mml:mi><mml:mo>¯</mml:mo></mml:mover><mml:mi>i</mml:mi></mml:msub><mml:mo>)</mml:mo></mml:mrow><mml:mrow><mml:mstyle displaystyle="true"><mml:munderover><mml:mo>∑</mml:mo><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>m</mml:mi></mml:munderover></mml:mstyle><mml:msubsup><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup><mml:mo>(</mml:mo><mml:mn>1</mml:mn><mml:mo>-</mml:mo><mml:msubsup><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup><mml:mo>)</mml:mo><mml:mo>(</mml:mo><mml:mn>1</mml:mn><mml:mo>-</mml:mo><mml:mfrac><mml:mrow><mml:mover accent="true"><mml:mi>n</mml:mi><mml:mo>¯</mml:mo></mml:mover><mml:msup><mml:mi>C</mml:mi><mml:mn>2</mml:mn></mml:msup></mml:mrow><mml:mrow><mml:mi>n</mml:mi><mml:mo>(</mml:mo><mml:mover accent="true"><mml:mi>n</mml:mi><mml:mo>¯</mml:mo></mml:mover><mml:mo>-</mml:mo><mml:mn>1</mml:mn><mml:mo>)</mml:mo></mml:mrow></mml:mfrac><mml:mo>)</mml:mo><mml:mo>+</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:mi>n</mml:mi></mml:mfrac><mml:msubsup><mml:mover accent="true"><mml:mi>σ</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>i</mml:mi><mml:mn>2</mml:mn></mml:msubsup><mml:mo>(</mml:mo><mml:mn>1</mml:mn><mml:mo>+</mml:mo><mml:mfrac><mml:mrow><mml:mrow><mml:mo>(</mml:mo><mml:mi>n</mml:mi><mml:mo>-</mml:mo><mml:mn>1</mml:mn><mml:mo>)</mml:mo></mml:mrow><mml:mover accent="true"><mml:mi>n</mml:mi><mml:mo>¯</mml:mo></mml:mover><mml:msup><mml:mi>C</mml:mi><mml:mn>2</mml:mn></mml:msup></mml:mrow><mml:mrow><mml:mi>n</mml:mi><mml:mo>(</mml:mo><mml:mover accent="true"><mml:mi>n</mml:mi><mml:mo>¯</mml:mo></mml:mover><mml:mo>-</mml:mo><mml:mn>1</mml:mn><mml:mo>)</mml:mo></mml:mrow></mml:mfrac><mml:mo>)</mml:mo><mml:mo>+</mml:mo><mml:mfrac><mml:mrow><mml:msub><mml:mover accent="true"><mml:mi>h</mml:mi><mml:mo>¯</mml:mo></mml:mover><mml:mi>i</mml:mi></mml:msub><mml:msup><mml:mi>C</mml:mi><mml:mn>2</mml:mn></mml:msup></mml:mrow><mml:mrow><mml:mn>4</mml:mn><mml:mi>n</mml:mi><mml:mo>(</mml:mo><mml:mover accent="true"><mml:mi>n</mml:mi><mml:mo>¯</mml:mo></mml:mover><mml:mo>-</mml:mo><mml:mn>1</mml:mn><mml:mo>)</mml:mo></mml:mrow></mml:mfrac></mml:mrow></mml:mfrac></mml:mrow></mml:mtd></mml:mtr><mml:mtr><mml:mtd/><mml:mtd><mml:mrow><mml:munderover><mml:mo>→</mml:mo><mml:mrow><mml:mi>m</mml:mi><mml:mo>→</mml:mo><mml:mi>∞</mml:mi></mml:mrow><mml:mtext>a.s.</mml:mtext></mml:munderover><mml:msub><mml:mi>F</mml:mi><mml:mtext>ST</mml:mtext></mml:msub><mml:mo>=</mml:mo><mml:msup><mml:mi>θ</mml:mi><mml:mi>T</mml:mi></mml:msup><mml:mo>.</mml:mo></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives></disp-formula>
Note that <inline-formula id="pgen.1009241.e344"><alternatives><graphic id="pgen.1009241.e344g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e344" xlink:type="simple"/><mml:math display="inline" id="M344"><mml:msubsup><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup></mml:math></alternatives></inline-formula> above weighs every individual equally by weighing subpopulation <italic>j</italic> proportional to its sample size <italic>n</italic><sub><italic>j</italic></sub>, so it equals the estimator in <xref ref-type="disp-formula" rid="pgen.1009241.e135">Eq (17)</xref> with uniform weights.</p>
<p>Now we simplify this estimator as the sample size of every subpopulation becomes infinite. First set the sample size of every subpopulation <italic>n</italic><sub><italic>j</italic></sub> equal to their mean <inline-formula id="pgen.1009241.e345"><alternatives><graphic id="pgen.1009241.e345g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e345" xlink:type="simple"/><mml:math display="inline" id="M345"><mml:mover accent="true"><mml:mi>n</mml:mi><mml:mo>¯</mml:mo></mml:mover></mml:math></alternatives></inline-formula>, which implies <italic>C</italic><sup>2</sup> = 0 and
<disp-formula id="pgen.1009241.e346"><alternatives><graphic id="pgen.1009241.e346g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e346" xlink:type="simple"/><mml:math display="block" id="M346"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="right"><mml:msubsup><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup></mml:mtd><mml:mtd><mml:mrow><mml:mo>=</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:mi>n</mml:mi></mml:mfrac><mml:mstyle displaystyle="true"><mml:munderover><mml:mo>∑</mml:mo><mml:mrow><mml:mi>j</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>n</mml:mi></mml:munderover></mml:mstyle><mml:msub><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mi>i</mml:mi><mml:mi>j</mml:mi></mml:mrow></mml:msub><mml:mo>,</mml:mo><mml:mspace width="1em"/><mml:msub><mml:mover accent="true"><mml:mi>h</mml:mi><mml:mo>¯</mml:mo></mml:mover><mml:mi>i</mml:mi></mml:msub><mml:mo>=</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:mi>n</mml:mi></mml:mfrac><mml:mstyle displaystyle="true"><mml:munderover><mml:mo>∑</mml:mo><mml:mrow><mml:mi>j</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>n</mml:mi></mml:munderover></mml:mstyle><mml:msub><mml:mover accent="true"><mml:mi>h</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mi>i</mml:mi><mml:mi>j</mml:mi></mml:mrow></mml:msub><mml:mo>,</mml:mo><mml:mspace width="1em"/><mml:msubsup><mml:mover accent="true"><mml:mi>σ</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>i</mml:mi><mml:mn>2</mml:mn></mml:msubsup><mml:mo>=</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:mrow><mml:mi>n</mml:mi><mml:mo>-</mml:mo><mml:mn>1</mml:mn></mml:mrow></mml:mfrac><mml:mstyle displaystyle="true"><mml:munderover><mml:mo>∑</mml:mo><mml:mrow><mml:mi>j</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>n</mml:mi></mml:munderover></mml:mstyle><mml:msup><mml:mrow><mml:mo>(</mml:mo><mml:msub><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mi>i</mml:mi><mml:mi>j</mml:mi></mml:mrow></mml:msub><mml:mo>-</mml:mo><mml:msubsup><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup><mml:mo>)</mml:mo></mml:mrow><mml:mn>2</mml:mn></mml:msup><mml:mo>,</mml:mo></mml:mrow></mml:mtd></mml:mtr><mml:mtr><mml:mtd columnalign="right"><mml:msubsup><mml:mover accent="true"><mml:mi>F</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mtext>ST</mml:mtext></mml:mrow><mml:mtext>WC</mml:mtext></mml:msubsup></mml:mtd><mml:mtd columnalign="left"><mml:mrow><mml:mo>=</mml:mo><mml:mfrac><mml:mrow><mml:mstyle displaystyle="true"><mml:munderover><mml:mo>∑</mml:mo><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>m</mml:mi></mml:munderover></mml:mstyle><mml:msubsup><mml:mover accent="true"><mml:mi>σ</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>i</mml:mi><mml:mn>2</mml:mn></mml:msubsup><mml:mo>-</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:mrow><mml:mover accent="true"><mml:mi>n</mml:mi><mml:mo>¯</mml:mo></mml:mover><mml:mo>-</mml:mo><mml:mn>1</mml:mn></mml:mrow></mml:mfrac><mml:mo>(</mml:mo><mml:msubsup><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup><mml:mo>(</mml:mo><mml:mn>1</mml:mn><mml:mo>-</mml:mo><mml:msubsup><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup><mml:mo>)</mml:mo><mml:mo>-</mml:mo><mml:mfrac><mml:mrow><mml:mi>n</mml:mi><mml:mo>-</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>n</mml:mi></mml:mfrac><mml:msubsup><mml:mover accent="true"><mml:mi>σ</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>i</mml:mi><mml:mn>2</mml:mn></mml:msubsup><mml:mo>-</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:mn>4</mml:mn></mml:mfrac><mml:msub><mml:mover accent="true"><mml:mi>h</mml:mi><mml:mo>¯</mml:mo></mml:mover><mml:mi>i</mml:mi></mml:msub><mml:mo>)</mml:mo></mml:mrow><mml:mrow><mml:mstyle displaystyle="true"><mml:munderover><mml:mo>∑</mml:mo><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>m</mml:mi></mml:munderover></mml:mstyle><mml:msubsup><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup><mml:mo>(</mml:mo><mml:mn>1</mml:mn><mml:mo>-</mml:mo><mml:msubsup><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup><mml:mo>)</mml:mo><mml:mo>+</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:mi>n</mml:mi></mml:mfrac><mml:msubsup><mml:mover accent="true"><mml:mi>σ</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>i</mml:mi><mml:mn>2</mml:mn></mml:msubsup></mml:mrow></mml:mfrac><mml:mo>.</mml:mo></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives></disp-formula>
Now we take the limit as the sample size <inline-formula id="pgen.1009241.e347"><alternatives><graphic id="pgen.1009241.e347g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e347" xlink:type="simple"/><mml:math display="inline" id="M347"><mml:mrow><mml:mover accent="true"><mml:mi>n</mml:mi><mml:mo>¯</mml:mo></mml:mover><mml:mo>→</mml:mo><mml:mi>∞</mml:mi></mml:mrow></mml:math></alternatives></inline-formula>, which results in sample allele frequencies converging to the true subpopulation allele frequencies <inline-formula id="pgen.1009241.e348"><alternatives><graphic id="pgen.1009241.e348g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e348" xlink:type="simple"/><mml:math display="inline" id="M348"><mml:mrow><mml:msub><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mi>i</mml:mi><mml:mi>j</mml:mi></mml:mrow></mml:msub><mml:mo>→</mml:mo><mml:msub><mml:mi>π</mml:mi><mml:mrow><mml:mi>i</mml:mi><mml:mi>j</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:math></alternatives></inline-formula> for every subpopulation <italic>j</italic> and locus <italic>i</italic>, and
<disp-formula id="pgen.1009241.e349"><alternatives><graphic id="pgen.1009241.e349g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e349" xlink:type="simple"/><mml:math display="block" id="M349"><mml:msubsup><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup><mml:mrow><mml:mo>=</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:mi>n</mml:mi></mml:mfrac><mml:mstyle displaystyle="true"><mml:munderover><mml:mo>∑</mml:mo><mml:mrow><mml:mi>j</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>n</mml:mi></mml:munderover></mml:mstyle><mml:msub><mml:mi>π</mml:mi><mml:mrow><mml:mi>i</mml:mi><mml:mi>j</mml:mi></mml:mrow></mml:msub><mml:mo>,</mml:mo><mml:mspace width="1em"/><mml:msubsup><mml:mover accent="true"><mml:mi>σ</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>i</mml:mi><mml:mn>2</mml:mn></mml:msubsup><mml:mo>=</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:mrow><mml:mi>n</mml:mi><mml:mo>-</mml:mo><mml:mn>1</mml:mn></mml:mrow></mml:mfrac><mml:mstyle displaystyle="true"><mml:munderover><mml:mo>∑</mml:mo><mml:mrow><mml:mi>j</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>n</mml:mi></mml:munderover></mml:mstyle><mml:msup><mml:mrow><mml:mo>(</mml:mo><mml:msub><mml:mi>π</mml:mi><mml:mrow><mml:mi>i</mml:mi><mml:mi>j</mml:mi></mml:mrow></mml:msub><mml:mo>-</mml:mo><mml:msubsup><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup><mml:mo>)</mml:mo></mml:mrow><mml:mn>2</mml:mn></mml:msup><mml:mo>,</mml:mo><mml:mspace width="1em"/><mml:msubsup><mml:mover accent="true"><mml:mi>F</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mtext>ST</mml:mtext></mml:mrow><mml:mtext>WC</mml:mtext></mml:msubsup><mml:mo>=</mml:mo><mml:mfrac><mml:mrow><mml:mstyle displaystyle="true"><mml:munderover><mml:mo>∑</mml:mo><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>m</mml:mi></mml:munderover></mml:mstyle><mml:msubsup><mml:mover accent="true"><mml:mi>σ</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>i</mml:mi><mml:mn>2</mml:mn></mml:msubsup></mml:mrow><mml:mrow><mml:mstyle displaystyle="true"><mml:munderover><mml:mo>∑</mml:mo><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>m</mml:mi></mml:munderover></mml:mstyle><mml:msubsup><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup><mml:mo>(</mml:mo><mml:mn>1</mml:mn><mml:mo>-</mml:mo><mml:msubsup><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup><mml:mo>)</mml:mo><mml:mo>+</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:mi>n</mml:mi></mml:mfrac><mml:msubsup><mml:mover accent="true"><mml:mi>σ</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>i</mml:mi><mml:mn>2</mml:mn></mml:msubsup></mml:mrow></mml:mfrac><mml:mo>,</mml:mo></mml:mrow></mml:math></alternatives></disp-formula>
which matches the <inline-formula id="pgen.1009241.e350"><alternatives><graphic id="pgen.1009241.e350g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e350" xlink:type="simple"/><mml:math display="inline" id="M350"><mml:msubsup><mml:mover accent="true"><mml:mi>F</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mtext>ST</mml:mtext></mml:mrow><mml:mtext>indep</mml:mtext></mml:msubsup></mml:math></alternatives></inline-formula> in Eqs <xref ref-type="disp-formula" rid="pgen.1009241.e078">(11)</xref> to <xref ref-type="disp-formula" rid="pgen.1009241.e080">(13)</xref> as desired. Note the number of subpopulations <italic>n</italic> remains finite, and the sample heterozygosity <inline-formula id="pgen.1009241.e351"><alternatives><graphic id="pgen.1009241.e351g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e351" xlink:type="simple"/><mml:math display="inline" id="M351"><mml:msub><mml:mover accent="true"><mml:mi>h</mml:mi><mml:mo>¯</mml:mo></mml:mover><mml:mi>i</mml:mi></mml:msub></mml:math></alternatives></inline-formula> is not needed in the limit.</p>
</sec>
<sec id="sec031">
<title>The Weir-Hill <italic>F</italic><sub>ST</sub> estimator</title>
<p>Weir and Hill developed new estimators for subpopulation-specific <italic>F</italic><sub>ST</sub> values and considered the effects of non-independent subpopulations [<xref ref-type="bibr" rid="pgen.1009241.ref004">4</xref>]. However, these estimators target linearly-transformed <italic>F</italic><sub>ST</sub> values, and recover the <italic>F</italic><sub>ST</sub> defined in <xref ref-type="disp-formula" rid="pgen.1009241.e053">Eq (9)</xref> only when subpopulations are independent [<xref ref-type="bibr" rid="pgen.1009241.ref004">4</xref>], so we group them here with other estimators that strictly assume independent subpopulations. For simplicity, here we only consider the global <italic>F</italic><sub>ST</sub> estimator; the estimators of the coancestry matrix of the subpopulations was found to have the same overall linear transformation [<xref ref-type="bibr" rid="pgen.1009241.ref004">4</xref>]. In the limit of infinite subpopulation sizes, this estimator also converges to the asymptotic <italic>F</italic><sub>ST</sub> estimator for independent subpopulations (<inline-formula id="pgen.1009241.e352"><alternatives><graphic id="pgen.1009241.e352g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e352" xlink:type="simple"/><mml:math display="inline" id="M352"><mml:msubsup><mml:mover accent="true"><mml:mi>F</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mtext>ST</mml:mtext></mml:mrow><mml:mtext>indep</mml:mtext></mml:msubsup></mml:math></alternatives></inline-formula>) discussed in the main text.</p>
<p>The Weir-Hill (WH) <italic>F</italic><sub>ST</sub> estimator, simplified here for biallelic loci but extended to average over loci, and its limit, are given by
<disp-formula id="pgen.1009241.e353"><alternatives><graphic id="pgen.1009241.e353g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e353" xlink:type="simple"/><mml:math display="block" id="M353"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="right"><mml:msubsup><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup></mml:mtd><mml:mtd columnalign="left"><mml:mrow><mml:mo>=</mml:mo><mml:mstyle displaystyle="true"><mml:munderover><mml:mo>∑</mml:mo><mml:mrow><mml:mi>j</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>n</mml:mi></mml:munderover></mml:mstyle><mml:msub><mml:mi>w</mml:mi><mml:mi>j</mml:mi></mml:msub><mml:msub><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mi>i</mml:mi><mml:mi>j</mml:mi></mml:mrow></mml:msub><mml:mo>,</mml:mo><mml:mspace width="1em"/><mml:mspace width="1em"/><mml:msub><mml:mi>w</mml:mi><mml:mi>j</mml:mi></mml:msub><mml:mo>=</mml:mo><mml:mfrac><mml:msub><mml:mi>n</mml:mi><mml:mi>j</mml:mi></mml:msub><mml:mrow><mml:mstyle displaystyle="true"><mml:munderover><mml:mo>∑</mml:mo><mml:mrow><mml:mi>j</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>n</mml:mi></mml:munderover></mml:mstyle><mml:msub><mml:mi>n</mml:mi><mml:mi>j</mml:mi></mml:msub></mml:mrow></mml:mfrac><mml:mo>,</mml:mo></mml:mrow></mml:mtd></mml:mtr><mml:mtr><mml:mtd columnalign="right"><mml:msubsup><mml:mover accent="true"><mml:mi>F</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mtext>ST</mml:mtext></mml:mrow><mml:mtext>WH</mml:mtext></mml:msubsup></mml:mtd><mml:mtd><mml:mrow><mml:mo>=</mml:mo><mml:mn>1</mml:mn><mml:mo>-</mml:mo><mml:mfrac><mml:mrow><mml:mo>(</mml:mo><mml:mstyle displaystyle="true"><mml:munderover><mml:mo>∑</mml:mo><mml:mrow><mml:mi>j</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>n</mml:mi></mml:munderover></mml:mstyle><mml:msub><mml:mi>n</mml:mi><mml:mi>j</mml:mi></mml:msub><mml:mrow><mml:mo>(</mml:mo><mml:mn>1</mml:mn><mml:mo>-</mml:mo><mml:msub><mml:mi>w</mml:mi><mml:mi>j</mml:mi></mml:msub><mml:mo>)</mml:mo></mml:mrow><mml:mo>)</mml:mo><mml:mo>(</mml:mo><mml:mstyle displaystyle="true"><mml:munderover><mml:mo>∑</mml:mo><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>m</mml:mi></mml:munderover></mml:mstyle><mml:mstyle displaystyle="true"><mml:munderover><mml:mo>∑</mml:mo><mml:mrow><mml:mi>j</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>n</mml:mi></mml:munderover></mml:mstyle><mml:msub><mml:mi>w</mml:mi><mml:mi>j</mml:mi></mml:msub><mml:mfrac><mml:mrow><mml:mn>2</mml:mn><mml:msub><mml:mi>n</mml:mi><mml:mi>j</mml:mi></mml:msub></mml:mrow><mml:mrow><mml:mn>2</mml:mn><mml:msub><mml:mi>n</mml:mi><mml:mi>j</mml:mi></mml:msub><mml:mo>-</mml:mo><mml:mn>1</mml:mn></mml:mrow></mml:mfrac><mml:msub><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mi>i</mml:mi><mml:mi>j</mml:mi></mml:mrow></mml:msub><mml:mo>(</mml:mo><mml:mn>1</mml:mn><mml:mo>-</mml:mo><mml:msub><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mi>i</mml:mi><mml:mi>j</mml:mi></mml:mrow></mml:msub><mml:mo>)</mml:mo><mml:mo>)</mml:mo></mml:mrow><mml:mrow><mml:mstyle displaystyle="true"><mml:munderover><mml:mo>∑</mml:mo><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>m</mml:mi></mml:munderover></mml:mstyle><mml:mstyle displaystyle="true"><mml:munderover><mml:mo>∑</mml:mo><mml:mrow><mml:mi>j</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>n</mml:mi></mml:munderover></mml:mstyle><mml:msub><mml:mi>n</mml:mi><mml:mi>j</mml:mi></mml:msub><mml:msup><mml:mrow><mml:mo>(</mml:mo><mml:msub><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mi>i</mml:mi><mml:mi>j</mml:mi></mml:mrow></mml:msub><mml:mo>-</mml:mo><mml:msubsup><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup><mml:mo>)</mml:mo></mml:mrow><mml:mn>2</mml:mn></mml:msup><mml:mo>+</mml:mo><mml:msub><mml:mi>n</mml:mi><mml:mi>j</mml:mi></mml:msub><mml:mrow><mml:mo>(</mml:mo><mml:mn>1</mml:mn><mml:mo>-</mml:mo><mml:msub><mml:mi>w</mml:mi><mml:mi>j</mml:mi></mml:msub><mml:mo>)</mml:mo></mml:mrow><mml:msub><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mi>i</mml:mi><mml:mi>j</mml:mi></mml:mrow></mml:msub><mml:mo>(</mml:mo><mml:mn>1</mml:mn><mml:mo>-</mml:mo><mml:msub><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mi>i</mml:mi><mml:mi>j</mml:mi></mml:mrow></mml:msub><mml:mo>)</mml:mo></mml:mrow></mml:mfrac><mml:munderover><mml:mo>→</mml:mo><mml:mrow><mml:mi>m</mml:mi><mml:mo>→</mml:mo><mml:mi>∞</mml:mi></mml:mrow><mml:mtext>a.s.</mml:mtext></mml:munderover><mml:mfrac><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mtext>ST</mml:mtext></mml:msub><mml:mo>-</mml:mo><mml:msup><mml:mover accent="true"><mml:mi>θ</mml:mi><mml:mo>˜</mml:mo></mml:mover><mml:mi>T</mml:mi></mml:msup></mml:mrow><mml:mrow><mml:mn>1</mml:mn><mml:mo>-</mml:mo><mml:msup><mml:mover accent="true"><mml:mi>θ</mml:mi><mml:mo>˜</mml:mo></mml:mover><mml:mi>T</mml:mi></mml:msup></mml:mrow></mml:mfrac><mml:mo>,</mml:mo></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives></disp-formula>
where the target <italic>F</italic><sub>ST</sub> and <inline-formula id="pgen.1009241.e354"><alternatives><graphic id="pgen.1009241.e354g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e354" xlink:type="simple"/><mml:math display="inline" id="M354"><mml:msup><mml:mover accent="true"><mml:mi>θ</mml:mi><mml:mo>˜</mml:mo></mml:mover><mml:mi>T</mml:mi></mml:msup></mml:math></alternatives></inline-formula> both weigh individuals (rather than subpopulations) equally [<xref ref-type="bibr" rid="pgen.1009241.ref004">4</xref>]:
<disp-formula id="pgen.1009241.e355"><alternatives><graphic id="pgen.1009241.e355g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e355" xlink:type="simple"/><mml:math display="block" id="M355"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="right"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mtext>ST</mml:mtext></mml:msub><mml:mo>=</mml:mo><mml:mstyle displaystyle="true"><mml:munderover><mml:mo>∑</mml:mo><mml:mrow><mml:mi>j</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>n</mml:mi></mml:munderover></mml:mstyle><mml:msub><mml:mi>w</mml:mi><mml:mi>j</mml:mi></mml:msub><mml:msubsup><mml:mi>θ</mml:mi><mml:mrow><mml:mi>j</mml:mi><mml:mi>j</mml:mi></mml:mrow><mml:mi>T</mml:mi></mml:msubsup><mml:mo>,</mml:mo><mml:mspace width="1em"/><mml:mspace width="1em"/><mml:msup><mml:mover accent="true"><mml:mi>θ</mml:mi><mml:mo>˜</mml:mo></mml:mover><mml:mi>T</mml:mi></mml:msup><mml:mo>=</mml:mo><mml:mfrac><mml:mn>2</mml:mn><mml:mrow><mml:mn>1</mml:mn><mml:mo>-</mml:mo><mml:msubsup><mml:mo>∑</mml:mo><mml:mrow><mml:mi>j</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>n</mml:mi></mml:msubsup><mml:msubsup><mml:mi>w</mml:mi><mml:mi>j</mml:mi><mml:mn>2</mml:mn></mml:msubsup></mml:mrow></mml:mfrac><mml:mstyle displaystyle="true"><mml:munderover><mml:mo>∑</mml:mo><mml:mrow><mml:mi>j</mml:mi><mml:mo>=</mml:mo><mml:mn>2</mml:mn></mml:mrow><mml:mi>n</mml:mi></mml:munderover></mml:mstyle><mml:mstyle displaystyle="true"><mml:munderover><mml:mo>∑</mml:mo><mml:mrow><mml:mi>k</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mrow><mml:mi>j</mml:mi><mml:mo>-</mml:mo><mml:mn>1</mml:mn></mml:mrow></mml:munderover></mml:mstyle><mml:msub><mml:mi>w</mml:mi><mml:mi>j</mml:mi></mml:msub><mml:msub><mml:mi>w</mml:mi><mml:mi>k</mml:mi></mml:msub><mml:msubsup><mml:mi>θ</mml:mi><mml:mrow><mml:mi>j</mml:mi><mml:mi>k</mml:mi></mml:mrow><mml:mi>T</mml:mi></mml:msubsup><mml:mo>.</mml:mo></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives></disp-formula>
For equal sample sizes <italic>n</italic><sub><italic>j</italic></sub> = <italic>n</italic><sub><italic>S</italic></sub>∀<italic>j</italic>, we have <inline-formula id="pgen.1009241.e356"><alternatives><graphic id="pgen.1009241.e356g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e356" xlink:type="simple"/><mml:math display="inline" id="M356"><mml:mrow><mml:msub><mml:mi>w</mml:mi><mml:mi>j</mml:mi></mml:msub><mml:mo>=</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:mi>n</mml:mi></mml:mfrac></mml:mrow></mml:math></alternatives></inline-formula>, <inline-formula id="pgen.1009241.e357"><alternatives><graphic id="pgen.1009241.e357g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e357" xlink:type="simple"/><mml:math display="inline" id="M357"><mml:mrow><mml:msub><mml:mi>n</mml:mi><mml:mrow><mml:mi>j</mml:mi><mml:mi>c</mml:mi></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:msub><mml:mi>n</mml:mi><mml:mi>S</mml:mi></mml:msub><mml:mo>(</mml:mo><mml:mn>1</mml:mn><mml:mo>-</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:mi>n</mml:mi></mml:mfrac><mml:mo>)</mml:mo></mml:mrow></mml:math></alternatives></inline-formula>, and the estimator becomes
<disp-formula id="pgen.1009241.e358"><alternatives><graphic id="pgen.1009241.e358g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e358" xlink:type="simple"/><mml:math display="block" id="M358"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="right"><mml:msubsup><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup></mml:mtd><mml:mtd><mml:mrow><mml:mo>=</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:mi>n</mml:mi></mml:mfrac><mml:mstyle displaystyle="true"><mml:munderover><mml:mo>∑</mml:mo><mml:mrow><mml:mi>j</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>n</mml:mi></mml:munderover></mml:mstyle><mml:msub><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mi>i</mml:mi><mml:mi>j</mml:mi></mml:mrow></mml:msub><mml:mo>,</mml:mo><mml:mspace width="1em"/><mml:msubsup><mml:mover accent="true"><mml:mi>σ</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>i</mml:mi><mml:mn>2</mml:mn></mml:msubsup><mml:mo>=</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:mrow><mml:mi>n</mml:mi><mml:mo>-</mml:mo><mml:mn>1</mml:mn></mml:mrow></mml:mfrac><mml:mstyle displaystyle="true"><mml:munderover><mml:mo>∑</mml:mo><mml:mrow><mml:mi>j</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>n</mml:mi></mml:munderover></mml:mstyle><mml:msup><mml:mrow><mml:mo>(</mml:mo><mml:msub><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mi>i</mml:mi><mml:mi>j</mml:mi></mml:mrow></mml:msub><mml:mo>-</mml:mo><mml:msubsup><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup><mml:mo>)</mml:mo></mml:mrow><mml:mn>2</mml:mn></mml:msup><mml:mo>,</mml:mo></mml:mrow></mml:mtd></mml:mtr><mml:mtr><mml:mtd columnalign="right"><mml:msubsup><mml:mover accent="true"><mml:mi>F</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mtext>ST</mml:mtext></mml:mrow><mml:mtext>WH</mml:mtext></mml:msubsup></mml:mtd><mml:mtd><mml:mrow><mml:mo>=</mml:mo><mml:mfrac><mml:mrow><mml:mstyle displaystyle="true"><mml:munderover><mml:mo>∑</mml:mo><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>m</mml:mi></mml:munderover></mml:mstyle><mml:msubsup><mml:mover accent="true"><mml:mi>σ</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>i</mml:mi><mml:mn>2</mml:mn></mml:msubsup><mml:mo>(</mml:mo><mml:mfrac><mml:mrow><mml:mn>2</mml:mn><mml:msub><mml:mi>n</mml:mi><mml:mi>S</mml:mi></mml:msub><mml:mo>-</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:mi>n</mml:mi></mml:mfrac></mml:mrow><mml:mrow><mml:mn>2</mml:mn><mml:msub><mml:mi>n</mml:mi><mml:mi>s</mml:mi></mml:msub><mml:mo>-</mml:mo><mml:mn>1</mml:mn></mml:mrow></mml:mfrac><mml:mo>)</mml:mo><mml:mo>-</mml:mo><mml:msubsup><mml:mi>p</mml:mi><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup><mml:mo>(</mml:mo><mml:mn>1</mml:mn><mml:mo>-</mml:mo><mml:msubsup><mml:mi>p</mml:mi><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup><mml:mo>)</mml:mo><mml:mrow><mml:mo>(</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:mrow><mml:mn>2</mml:mn><mml:msub><mml:mi>n</mml:mi><mml:mi>s</mml:mi></mml:msub><mml:mo>-</mml:mo><mml:mn>1</mml:mn></mml:mrow></mml:mfrac><mml:mo>)</mml:mo></mml:mrow></mml:mrow><mml:mrow><mml:mstyle displaystyle="true"><mml:munderover><mml:mo>∑</mml:mo><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>m</mml:mi></mml:munderover></mml:mstyle><mml:msubsup><mml:mi>p</mml:mi><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup><mml:mo>(</mml:mo><mml:mn>1</mml:mn><mml:mo>-</mml:mo><mml:msubsup><mml:mi>p</mml:mi><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup><mml:mo>)</mml:mo><mml:mo>+</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:mi>n</mml:mi></mml:mfrac><mml:msubsup><mml:mover accent="true"><mml:mi>σ</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>i</mml:mi><mml:mn>2</mml:mn></mml:msubsup></mml:mrow></mml:mfrac><mml:mo>.</mml:mo></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives></disp-formula>
Therefore, as sample sizes per subpopulation go to infinity (<italic>n</italic><sub><italic>S</italic></sub> → ∞, which results in <inline-formula id="pgen.1009241.e359"><alternatives><graphic id="pgen.1009241.e359g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e359" xlink:type="simple"/><mml:math display="inline" id="M359"><mml:mrow><mml:msub><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mi>i</mml:mi><mml:mi>j</mml:mi></mml:mrow></mml:msub><mml:mo>→</mml:mo><mml:msub><mml:mi>π</mml:mi><mml:mrow><mml:mi>i</mml:mi><mml:mi>j</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:math></alternatives></inline-formula> for every (<italic>i</italic>, <italic>j</italic>)), we again recover the desired limiting <italic>F</italic><sub>ST</sub> estimator for independent subpopulations (<inline-formula id="pgen.1009241.e360"><alternatives><graphic id="pgen.1009241.e360g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e360" xlink:type="simple"/><mml:math display="inline" id="M360"><mml:msubsup><mml:mover accent="true"><mml:mi>F</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mtext>ST</mml:mtext></mml:mrow><mml:mtext>indep</mml:mtext></mml:msubsup></mml:math></alternatives></inline-formula> in Eqs <xref ref-type="disp-formula" rid="pgen.1009241.e078">(11)</xref> to <xref ref-type="disp-formula" rid="pgen.1009241.e080">(13)</xref>).</p>
</sec>
<sec id="sec032">
<title>The Hudson <italic>F</italic><sub>ST</sub> estimator</title>
<p>The Hudson pairwise <italic>F</italic><sub>ST</sub> estimator [<xref ref-type="bibr" rid="pgen.1009241.ref023">23</xref>] measures the differentiation of two subpopulations (<italic>j</italic>, <italic>k</italic>). The estimator and its limit for two independent subpopulations (<inline-formula id="pgen.1009241.e361"><alternatives><graphic id="pgen.1009241.e361g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e361" xlink:type="simple"/><mml:math display="inline" id="M361"><mml:mrow><mml:msubsup><mml:mi>θ</mml:mi><mml:mrow><mml:mi>j</mml:mi><mml:mi>k</mml:mi></mml:mrow><mml:mi>T</mml:mi></mml:msubsup><mml:mo>=</mml:mo><mml:mn>0</mml:mn></mml:mrow></mml:math></alternatives></inline-formula>) is
<disp-formula id="pgen.1009241.e362"><alternatives><graphic id="pgen.1009241.e362g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e362" xlink:type="simple"/><mml:math display="block" id="M362"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="right"><mml:mrow><mml:msubsup><mml:mover accent="true"><mml:mi>F</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mtext>ST</mml:mtext></mml:mrow><mml:mtext>Hudson</mml:mtext></mml:msubsup><mml:mo>=</mml:mo><mml:mfrac><mml:mrow><mml:mstyle displaystyle="true"><mml:munderover><mml:mo>∑</mml:mo><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>m</mml:mi></mml:munderover></mml:mstyle><mml:msup><mml:mrow><mml:mo>(</mml:mo><mml:msub><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mi>i</mml:mi><mml:mi>j</mml:mi></mml:mrow></mml:msub><mml:mo>-</mml:mo><mml:msub><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mi>i</mml:mi><mml:mi>k</mml:mi></mml:mrow></mml:msub><mml:mo>)</mml:mo></mml:mrow><mml:mn>2</mml:mn></mml:msup><mml:mo>-</mml:mo><mml:mfrac><mml:mrow><mml:msub><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mi>i</mml:mi><mml:mi>j</mml:mi></mml:mrow></mml:msub><mml:mo>(</mml:mo><mml:mn>1</mml:mn><mml:mo>-</mml:mo><mml:msub><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mi>i</mml:mi><mml:mi>j</mml:mi></mml:mrow></mml:msub><mml:mo>)</mml:mo></mml:mrow><mml:mrow><mml:mn>2</mml:mn><mml:msub><mml:mi>n</mml:mi><mml:mi>j</mml:mi></mml:msub><mml:mo>-</mml:mo><mml:mn>1</mml:mn></mml:mrow></mml:mfrac><mml:mo>-</mml:mo><mml:mfrac><mml:mrow><mml:msub><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mi>i</mml:mi><mml:mi>k</mml:mi></mml:mrow></mml:msub><mml:mo>(</mml:mo><mml:mn>1</mml:mn><mml:mo>-</mml:mo><mml:msub><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mi>i</mml:mi><mml:mi>k</mml:mi></mml:mrow></mml:msub><mml:mo>)</mml:mo></mml:mrow><mml:mrow><mml:mn>2</mml:mn><mml:msub><mml:mi>n</mml:mi><mml:mi>k</mml:mi></mml:msub><mml:mo>-</mml:mo><mml:mn>1</mml:mn></mml:mrow></mml:mfrac></mml:mrow><mml:mrow><mml:mstyle displaystyle="true"><mml:munderover><mml:mo>∑</mml:mo><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>m</mml:mi></mml:munderover></mml:mstyle><mml:msub><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mi>i</mml:mi><mml:mi>j</mml:mi></mml:mrow></mml:msub><mml:mo>(</mml:mo><mml:mn>1</mml:mn><mml:mo>-</mml:mo><mml:msub><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mi>i</mml:mi><mml:mi>k</mml:mi></mml:mrow></mml:msub><mml:mo>)</mml:mo><mml:mo>+</mml:mo><mml:msub><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mi>i</mml:mi><mml:mi>k</mml:mi></mml:mrow></mml:msub><mml:mo>(</mml:mo><mml:mn>1</mml:mn><mml:mo>-</mml:mo><mml:msub><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mi>i</mml:mi><mml:mi>j</mml:mi></mml:mrow></mml:msub><mml:mo>)</mml:mo></mml:mrow></mml:mfrac><mml:munderover><mml:mo>→</mml:mo><mml:mrow><mml:mi>m</mml:mi><mml:mo>→</mml:mo><mml:mi>∞</mml:mi></mml:mrow><mml:mtext>a.s.</mml:mtext></mml:munderover><mml:msub><mml:mi>F</mml:mi><mml:mtext>ST</mml:mtext></mml:msub><mml:mo>=</mml:mo><mml:mfrac><mml:mrow><mml:msubsup><mml:mi>θ</mml:mi><mml:mrow><mml:mi>j</mml:mi><mml:mi>j</mml:mi></mml:mrow><mml:mi>T</mml:mi></mml:msubsup><mml:mo>+</mml:mo><mml:msubsup><mml:mi>θ</mml:mi><mml:mrow><mml:mi>k</mml:mi><mml:mi>k</mml:mi></mml:mrow><mml:mi>T</mml:mi></mml:msubsup></mml:mrow><mml:mn>2</mml:mn></mml:mfrac><mml:mo>.</mml:mo></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives> <label>(40)</label></disp-formula></p>
</sec>
<sec id="sec033">
<title>Generalized HudsonK <italic>F</italic><sub>ST</sub> estimator</title>
<p>Here we derive the “HudsonK” estimator (first made available in [<xref ref-type="bibr" rid="pgen.1009241.ref058">58</xref>]), which generalizes the Hudson pairwise <italic>F</italic><sub>ST</sub> estimator in <xref ref-type="disp-formula" rid="pgen.1009241.e362">Eq (40)</xref> to <italic>n</italic> independent subpopulations. This estimator also equals the recent Weir-Goudet <italic>F</italic><sub>ST</sub> estimator for subpopulations [<xref ref-type="bibr" rid="pgen.1009241.ref021">21</xref>] (for biallelic loci; <xref ref-type="supplementary-material" rid="pgen.1009241.s001">S1 Text</xref>). Note that for independent subpopulations, the <italic>F</italic><sub>ST</sub> of all the subpopulations equals the mean pairwise <italic>F</italic><sub>ST</sub> of every pair of subpopulations:
<disp-formula id="pgen.1009241.e363"><alternatives><graphic id="pgen.1009241.e363g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e363" xlink:type="simple"/><mml:math display="block" id="M363"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="right"><mml:mrow><mml:mfrac><mml:mn>1</mml:mn><mml:msup><mml:mi>n</mml:mi><mml:mn>2</mml:mn></mml:msup></mml:mfrac><mml:mstyle displaystyle="true"><mml:munderover><mml:mo>∑</mml:mo><mml:mrow><mml:mi>j</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>n</mml:mi></mml:munderover></mml:mstyle><mml:mstyle displaystyle="true"><mml:munderover><mml:mo>∑</mml:mo><mml:mrow><mml:mi>k</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>n</mml:mi></mml:munderover></mml:mstyle><mml:mo>(</mml:mo><mml:mfrac><mml:mrow><mml:msubsup><mml:mi>θ</mml:mi><mml:mrow><mml:mi>j</mml:mi><mml:mi>j</mml:mi></mml:mrow><mml:mi>T</mml:mi></mml:msubsup><mml:mo>+</mml:mo><mml:msubsup><mml:mi>θ</mml:mi><mml:mrow><mml:mi>k</mml:mi><mml:mi>k</mml:mi></mml:mrow><mml:mi>T</mml:mi></mml:msubsup></mml:mrow><mml:mn>2</mml:mn></mml:mfrac><mml:mo>)</mml:mo><mml:mo>=</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:mi>n</mml:mi></mml:mfrac><mml:mstyle displaystyle="true"><mml:munderover><mml:mo>∑</mml:mo><mml:mrow><mml:mi>j</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>n</mml:mi></mml:munderover></mml:mstyle><mml:msubsup><mml:mi>θ</mml:mi><mml:mrow><mml:mi>j</mml:mi><mml:mi>j</mml:mi></mml:mrow><mml:mi>T</mml:mi></mml:msubsup><mml:mo>=</mml:mo><mml:msub><mml:mi>F</mml:mi><mml:mtext>ST</mml:mtext></mml:msub><mml:mo>.</mml:mo></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives></disp-formula>
For that reason, averaging numerators and denominators of the pairwise estimator in <xref ref-type="disp-formula" rid="pgen.1009241.e362">Eq (40)</xref> before computing the ratio, we obtain the generalized estimator and a limit under independent subpopulations of
<disp-formula id="pgen.1009241.e364"><alternatives><graphic id="pgen.1009241.e364g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e364" xlink:type="simple"/><mml:math display="block" id="M364"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="right"><mml:msubsup><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup></mml:mtd><mml:mtd columnalign="left"><mml:mrow><mml:mo>=</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:mi>n</mml:mi></mml:mfrac><mml:mstyle displaystyle="true"><mml:munderover><mml:mo>∑</mml:mo><mml:mrow><mml:mi>j</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>n</mml:mi></mml:munderover></mml:mstyle><mml:msub><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mi>i</mml:mi><mml:mi>j</mml:mi></mml:mrow></mml:msub><mml:mo>,</mml:mo><mml:mspace width="1em"/><mml:msubsup><mml:mover accent="true"><mml:mi>σ</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>i</mml:mi><mml:mn>2</mml:mn></mml:msubsup><mml:mo>=</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:mrow><mml:mi>n</mml:mi><mml:mo>-</mml:mo><mml:mn>1</mml:mn></mml:mrow></mml:mfrac><mml:mstyle displaystyle="true"><mml:munderover><mml:mo>∑</mml:mo><mml:mrow><mml:mi>j</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>n</mml:mi></mml:munderover></mml:mstyle><mml:msup><mml:mrow><mml:mo>(</mml:mo><mml:msub><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mi>i</mml:mi><mml:mi>j</mml:mi></mml:mrow></mml:msub><mml:mo>-</mml:mo><mml:msubsup><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup><mml:mo>)</mml:mo></mml:mrow><mml:mn>2</mml:mn></mml:msup><mml:mo>,</mml:mo></mml:mrow></mml:mtd></mml:mtr><mml:mtr><mml:mtd columnalign="right"><mml:msubsup><mml:mover accent="true"><mml:mi>F</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mtext>ST</mml:mtext></mml:mrow><mml:mtext>HudsonK</mml:mtext></mml:msubsup></mml:mtd><mml:mtd><mml:mrow><mml:mo>=</mml:mo><mml:mfrac><mml:mrow><mml:mstyle displaystyle="true"><mml:munderover><mml:mo>∑</mml:mo><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>m</mml:mi></mml:munderover></mml:mstyle><mml:msubsup><mml:mover accent="true"><mml:mi>σ</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>i</mml:mi><mml:mn>2</mml:mn></mml:msubsup><mml:mo>-</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:mi>n</mml:mi></mml:mfrac><mml:mstyle displaystyle="true"><mml:munderover><mml:mo>∑</mml:mo><mml:mrow><mml:mi>j</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>n</mml:mi></mml:munderover></mml:mstyle><mml:mfrac><mml:mrow><mml:msub><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mi>i</mml:mi><mml:mi>j</mml:mi></mml:mrow></mml:msub><mml:mo>(</mml:mo><mml:mn>1</mml:mn><mml:mo>-</mml:mo><mml:msub><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mi>i</mml:mi><mml:mi>j</mml:mi></mml:mrow></mml:msub><mml:mo>)</mml:mo></mml:mrow><mml:mrow><mml:mn>2</mml:mn><mml:msub><mml:mi>n</mml:mi><mml:mi>j</mml:mi></mml:msub><mml:mo>-</mml:mo><mml:mn>1</mml:mn></mml:mrow></mml:mfrac></mml:mrow><mml:mrow><mml:mstyle displaystyle="true"><mml:munderover><mml:mo>∑</mml:mo><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>m</mml:mi></mml:munderover></mml:mstyle><mml:msubsup><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup><mml:mrow><mml:mo>(</mml:mo><mml:mn>1</mml:mn><mml:mo>-</mml:mo><mml:msubsup><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup><mml:mo>)</mml:mo></mml:mrow><mml:mo>+</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:mi>n</mml:mi></mml:mfrac><mml:msubsup><mml:mover accent="true"><mml:mi>σ</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>i</mml:mi><mml:mn>2</mml:mn></mml:msubsup></mml:mrow></mml:mfrac><mml:munderover><mml:mo>→</mml:mo><mml:mrow><mml:mi>m</mml:mi><mml:mo>→</mml:mo><mml:mi>∞</mml:mi></mml:mrow><mml:mtext>a.s.</mml:mtext></mml:munderover><mml:msub><mml:mi>F</mml:mi><mml:mtext>ST</mml:mtext></mml:msub><mml:mo>=</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:mi>n</mml:mi></mml:mfrac><mml:mstyle displaystyle="true"><mml:munderover><mml:mo>∑</mml:mo><mml:mrow><mml:mi>j</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>n</mml:mi></mml:munderover></mml:mstyle><mml:msubsup><mml:mi>θ</mml:mi><mml:mrow><mml:mi>j</mml:mi><mml:mi>j</mml:mi></mml:mrow><mml:mi>T</mml:mi></mml:msubsup><mml:mo>.</mml:mo></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives></disp-formula>
Note that unlike the WC and Weir-Hill estimators, <inline-formula id="pgen.1009241.e365"><alternatives><graphic id="pgen.1009241.e365g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e365" xlink:type="simple"/><mml:math display="inline" id="M365"><mml:msubsup><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup></mml:math></alternatives></inline-formula> above weighs every subpopulation equally, so every individual is weighed inversely proportional to the sample sizes <italic>n</italic><sub><italic>j</italic></sub> of their subpopulation <italic>j</italic>.</p>
<p>Like WC and Weir-Hill, <inline-formula id="pgen.1009241.e366"><alternatives><graphic id="pgen.1009241.e366g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e366" xlink:type="simple"/><mml:math display="inline" id="M366"><mml:msubsup><mml:mover accent="true"><mml:mi>F</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mtext>ST</mml:mtext></mml:mrow><mml:mtext>HudsonK</mml:mtext></mml:msubsup></mml:math></alternatives></inline-formula> simplifies to <inline-formula id="pgen.1009241.e367"><alternatives><graphic id="pgen.1009241.e367g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e367" xlink:type="simple"/><mml:math display="inline" id="M367"><mml:msubsup><mml:mover accent="true"><mml:mi>F</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mtext>ST</mml:mtext></mml:mrow><mml:mtext>indep</mml:mtext></mml:msubsup></mml:math></alternatives></inline-formula> in Eqs <xref ref-type="disp-formula" rid="pgen.1009241.e078">(11)</xref> to <xref ref-type="disp-formula" rid="pgen.1009241.e080">(13)</xref> in the limit of infinite sample sizes <italic>n</italic><sub><italic>j</italic></sub> → ∞, where <inline-formula id="pgen.1009241.e368"><alternatives><graphic id="pgen.1009241.e368g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e368" xlink:type="simple"/><mml:math display="inline" id="M368"><mml:mrow><mml:msub><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mi>i</mml:mi><mml:mi>j</mml:mi></mml:mrow></mml:msub><mml:mo>→</mml:mo><mml:msub><mml:mi>π</mml:mi><mml:mrow><mml:mi>i</mml:mi><mml:mi>j</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:math></alternatives></inline-formula> for every (<italic>i</italic>, <italic>j</italic>).</p>
</sec>
</sec>
<sec id="sec034">
<title>Simulations</title>
<sec id="sec035">
<title>Construction of subpopulation allele frequencies</title>
<p>We simulate <italic>K</italic> = 10 subpopulations <italic>S</italic><sub><italic>u</italic></sub> and <italic>m</italic> = 300, 000 independent loci. Every locus <italic>i</italic> draws <inline-formula id="pgen.1009241.e369"><alternatives><graphic id="pgen.1009241.e369g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e369" xlink:type="simple"/><mml:math display="inline" id="M369"><mml:msubsup><mml:mi>p</mml:mi><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup><mml:mo>~</mml:mo><mml:mtext>Uniform</mml:mtext><mml:mo stretchy="false">(</mml:mo><mml:mn>0.01</mml:mn><mml:mo>,</mml:mo><mml:mn>0.5</mml:mn><mml:mo stretchy="false">)</mml:mo><mml:mo>.</mml:mo></mml:math></alternatives></inline-formula> We set <inline-formula id="pgen.1009241.e370"><alternatives><graphic id="pgen.1009241.e370g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e370" xlink:type="simple"/><mml:math display="inline" id="M370"><mml:msubsup><mml:mi>f</mml:mi><mml:mrow><mml:msub><mml:mi>S</mml:mi><mml:mi>u</mml:mi></mml:msub></mml:mrow><mml:mi>T</mml:mi></mml:msubsup><mml:mo>=</mml:mo><mml:mfrac><mml:mi>u</mml:mi><mml:mi>K</mml:mi></mml:mfrac><mml:mi>τ</mml:mi><mml:mo>,</mml:mo></mml:math></alternatives></inline-formula> where <italic>τ</italic> ≤ 1 tunes <italic>F</italic><sub>ST</sub>. For the independent subpopulations model, <inline-formula id="pgen.1009241.e371"><alternatives><graphic id="pgen.1009241.e371g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e371" xlink:type="simple"/><mml:math display="inline" id="M371"><mml:msub><mml:mi>F</mml:mi><mml:mrow><mml:mtext>ST</mml:mtext></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:mi>K</mml:mi></mml:mfrac><mml:mstyle displaystyle="true"><mml:msubsup><mml:mo>∑</mml:mo><mml:mrow><mml:mi>u</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>K</mml:mi></mml:msubsup><mml:mrow><mml:msubsup><mml:mi>f</mml:mi><mml:mrow><mml:msub><mml:mi>S</mml:mi><mml:mi>u</mml:mi></mml:msub></mml:mrow><mml:mi>T</mml:mi></mml:msubsup></mml:mrow></mml:mstyle><mml:mo>=</mml:mo><mml:mfrac><mml:mrow><mml:mi>τ</mml:mi><mml:mo stretchy="false">(</mml:mo><mml:mi>K</mml:mi><mml:mo>+</mml:mo><mml:mn>1</mml:mn><mml:mo stretchy="false">)</mml:mo></mml:mrow><mml:mrow><mml:mn>2</mml:mn><mml:mi>K</mml:mi></mml:mrow></mml:mfrac><mml:mo>,</mml:mo></mml:math></alternatives></inline-formula> so <inline-formula id="pgen.1009241.e372"><alternatives><graphic id="pgen.1009241.e372g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e372" xlink:type="simple"/><mml:math display="inline" id="M372"><mml:mrow><mml:mi>τ</mml:mi><mml:mo>=</mml:mo><mml:mfrac><mml:mrow><mml:mn>2</mml:mn><mml:mi>K</mml:mi><mml:msub><mml:mi>F</mml:mi><mml:mtext>ST</mml:mtext></mml:msub></mml:mrow><mml:mrow><mml:mi>K</mml:mi><mml:mo>+</mml:mo><mml:mn>1</mml:mn></mml:mrow></mml:mfrac></mml:mrow></mml:math></alternatives></inline-formula> gives the desired <italic>F</italic><sub>ST</sub> (<italic>τ</italic> ≈ 0.18 for <italic>F</italic><sub>ST</sub> = 0.1). For the admixture model, <italic>τ</italic> is found numerically (<italic>τ</italic> ≈ 0.90 for <italic>F</italic><sub>ST</sub> = 0.1; see last subsection). Lastly, <inline-formula id="pgen.1009241.e373"><alternatives><graphic id="pgen.1009241.e373g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e373" xlink:type="simple"/><mml:math display="inline" id="M373"><mml:msubsup><mml:mi>p</mml:mi><mml:mi>i</mml:mi><mml:msub><mml:mi>S</mml:mi><mml:mi>u</mml:mi></mml:msub></mml:msubsup></mml:math></alternatives></inline-formula> values are drawn from the Balding-Nichols distribution,
<disp-formula id="pgen.1009241.e374"><alternatives><graphic id="pgen.1009241.e374g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e374" xlink:type="simple"/><mml:math display="block" id="M374"><mml:mrow><mml:msubsup><mml:mi>p</mml:mi><mml:mi>i</mml:mi><mml:msub><mml:mi>S</mml:mi><mml:mi>u</mml:mi></mml:msub></mml:msubsup><mml:mrow><mml:mo>|</mml:mo><mml:mi>T</mml:mi><mml:mo>∼</mml:mo><mml:mtext>Beta</mml:mtext></mml:mrow><mml:mo>(</mml:mo><mml:msubsup><mml:mi>p</mml:mi><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup><mml:mo>(</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:msubsup><mml:mi>f</mml:mi><mml:mrow><mml:msub><mml:mi>S</mml:mi><mml:mi>u</mml:mi></mml:msub></mml:mrow><mml:mi>T</mml:mi></mml:msubsup></mml:mfrac><mml:mo>-</mml:mo><mml:mn>1</mml:mn><mml:mo>)</mml:mo><mml:mo>,</mml:mo><mml:mrow><mml:mo>(</mml:mo><mml:mn>1</mml:mn><mml:mo>-</mml:mo><mml:msubsup><mml:mi>p</mml:mi><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup><mml:mo>)</mml:mo></mml:mrow><mml:mo>(</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:msubsup><mml:mi>f</mml:mi><mml:mrow><mml:msub><mml:mi>S</mml:mi><mml:mi>u</mml:mi></mml:msub></mml:mrow><mml:mi>T</mml:mi></mml:msubsup></mml:mfrac><mml:mo>-</mml:mo><mml:mn>1</mml:mn><mml:mo>)</mml:mo><mml:mo>)</mml:mo><mml:mo>,</mml:mo></mml:mrow></mml:math></alternatives></disp-formula>
which results in subpopulation allele frequencies that obey the coancestry model of <xref ref-type="disp-formula" rid="pgen.1009241.e048">Eq (6)</xref>, with <inline-formula id="pgen.1009241.e375"><alternatives><graphic id="pgen.1009241.e375g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e375" xlink:type="simple"/><mml:math display="inline" id="M375"><mml:mrow><mml:mo form="prefix">E</mml:mo><mml:mo>[</mml:mo><mml:msubsup><mml:mi>p</mml:mi><mml:mi>i</mml:mi><mml:msub><mml:mi>S</mml:mi><mml:mi>u</mml:mi></mml:msub></mml:msubsup><mml:mrow><mml:mo>|</mml:mo><mml:mi>T</mml:mi></mml:mrow><mml:mo>]</mml:mo><mml:mo>=</mml:mo><mml:msubsup><mml:mi>p</mml:mi><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup></mml:mrow></mml:math></alternatives></inline-formula> and <inline-formula id="pgen.1009241.e376"><alternatives><graphic id="pgen.1009241.e376g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e376" xlink:type="simple"/><mml:math display="inline" id="M376"><mml:mrow><mml:mo form="prefix">Var</mml:mo><mml:mo>(</mml:mo><mml:msubsup><mml:mi>p</mml:mi><mml:mi>i</mml:mi><mml:msub><mml:mi>S</mml:mi><mml:mi>u</mml:mi></mml:msub></mml:msubsup><mml:mrow><mml:mo>|</mml:mo><mml:mi>T</mml:mi></mml:mrow><mml:mo>)</mml:mo><mml:mo>=</mml:mo><mml:msubsup><mml:mi>f</mml:mi><mml:mrow><mml:msub><mml:mi>S</mml:mi><mml:mi>u</mml:mi></mml:msub></mml:mrow><mml:mi>T</mml:mi></mml:msubsup><mml:msubsup><mml:mi>p</mml:mi><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup><mml:mo>(</mml:mo><mml:mn>1</mml:mn><mml:mo>-</mml:mo><mml:msubsup><mml:mi>p</mml:mi><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup><mml:mo>)</mml:mo></mml:mrow></mml:math></alternatives></inline-formula> [<xref ref-type="bibr" rid="pgen.1009241.ref003">3</xref>], as desired.</p>
</sec>
<sec id="sec036">
<title>Random subpopulation sizes</title>
<p>We randomly generate sample sizes <bold>r</bold> = (<italic>r</italic><sub><italic>u</italic></sub>) for <italic>K</italic> subpopulations and <inline-formula id="pgen.1009241.e377"><alternatives><graphic id="pgen.1009241.e377g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e377" xlink:type="simple"/><mml:math display="inline" id="M377"><mml:mrow><mml:msubsup><mml:mo>∑</mml:mo><mml:mrow><mml:mi>u</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>K</mml:mi></mml:msubsup><mml:msub><mml:mi>r</mml:mi><mml:mi>u</mml:mi></mml:msub><mml:mo>=</mml:mo><mml:mi>n</mml:mi><mml:mo>=</mml:mo><mml:mn>1000</mml:mn></mml:mrow></mml:math></alternatives></inline-formula> individuals, as follows. First, draw <bold>x</bold> ∼ Dirichlet (1, …, 1) of length <italic>K</italic> and <bold>r</bold> = round(<italic>n</italic> <bold>x</bold>). While <inline-formula id="pgen.1009241.e378"><alternatives><graphic id="pgen.1009241.e378g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e378" xlink:type="simple"/><mml:math display="inline" id="M378"><mml:mrow><mml:msub><mml:mo form="prefix" movablelimits="true">min</mml:mo><mml:mi>u</mml:mi></mml:msub><mml:msub><mml:mi>r</mml:mi><mml:mi>u</mml:mi></mml:msub><mml:mo>&lt;</mml:mo><mml:mfrac><mml:mi>n</mml:mi><mml:mrow><mml:mn>3</mml:mn><mml:mi>K</mml:mi></mml:mrow></mml:mfrac></mml:mrow></mml:math></alternatives></inline-formula>, draw a new <bold>r</bold>, to prevent small subpopulations (they do not occur in real data). Due to rounding, <inline-formula id="pgen.1009241.e379"><alternatives><graphic id="pgen.1009241.e379g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e379" xlink:type="simple"/><mml:math display="inline" id="M379"><mml:mrow><mml:msubsup><mml:mo>∑</mml:mo><mml:mrow><mml:mi>u</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>K</mml:mi></mml:msubsup><mml:msub><mml:mi>r</mml:mi><mml:mi>u</mml:mi></mml:msub></mml:mrow></mml:math></alternatives></inline-formula> may not equal <italic>n</italic> as desired. Thus, while <inline-formula id="pgen.1009241.e380"><alternatives><graphic id="pgen.1009241.e380g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e380" xlink:type="simple"/><mml:math display="inline" id="M380"><mml:mrow><mml:mi>δ</mml:mi><mml:mo>=</mml:mo><mml:mi>n</mml:mi><mml:mo>-</mml:mo><mml:msubsup><mml:mo>∑</mml:mo><mml:mrow><mml:mi>u</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>K</mml:mi></mml:msubsup><mml:msub><mml:mi>r</mml:mi><mml:mi>u</mml:mi></mml:msub><mml:mo>≠</mml:mo><mml:mn>0</mml:mn></mml:mrow></mml:math></alternatives></inline-formula>, a random <italic>u</italic> is updated to <italic>r</italic><sub><italic>u</italic></sub> ← <italic>r</italic><sub><italic>u</italic></sub> + sgn(<italic>δ</italic>), which brings <italic>δ</italic> closer to zero at every iteration. Weights for individuals <italic>j</italic> in <italic>S</italic><sub><italic>u</italic></sub> are <inline-formula id="pgen.1009241.e381"><alternatives><graphic id="pgen.1009241.e381g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e381" xlink:type="simple"/><mml:math display="inline" id="M381"><mml:mrow><mml:msub><mml:mi>w</mml:mi><mml:mi>j</mml:mi></mml:msub><mml:mo>=</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:mrow><mml:mi>K</mml:mi><mml:msub><mml:mi>r</mml:mi><mml:mi>u</mml:mi></mml:msub></mml:mrow></mml:mfrac></mml:mrow></mml:math></alternatives></inline-formula> so the generalized <italic>F</italic><sub>ST</sub> matches <inline-formula id="pgen.1009241.e382"><alternatives><graphic id="pgen.1009241.e382g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e382" xlink:type="simple"/><mml:math display="inline" id="M382"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mtext>ST</mml:mtext></mml:msub><mml:mo>=</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:mi>K</mml:mi></mml:mfrac><mml:msubsup><mml:mo>∑</mml:mo><mml:mrow><mml:mi>u</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>K</mml:mi></mml:msubsup><mml:msubsup><mml:mi>f</mml:mi><mml:mrow><mml:msub><mml:mi>S</mml:mi><mml:mi>u</mml:mi></mml:msub></mml:mrow><mml:mi>T</mml:mi></mml:msubsup></mml:mrow></mml:math></alternatives></inline-formula> from the independent subpopulations model (see section <bold>The generalized <italic>F</italic><sub>ST</sub> for arbitrary population structures</bold>), which HudsonK estimates.</p>
</sec>
<sec id="sec037">
<title>Admixture proportions from 1D geography</title>
<p>We construct <italic>q</italic><sub><italic>ju</italic></sub> from random-walk migrations along a one-dimensional geography. Let <italic>x</italic><sub><italic>u</italic></sub> be the coordinate of intermediate subpopulation <italic>u</italic> and <italic>y</italic><sub><italic>j</italic></sub> the coordinate of a modern individual <italic>j</italic>. We assume <italic>q</italic><sub><italic>ju</italic></sub> is proportional to <italic>f</italic>(|<italic>x</italic><sub><italic>u</italic></sub> − <italic>y</italic><sub><italic>j</italic></sub>|), or
<disp-formula id="pgen.1009241.e383"><alternatives><graphic id="pgen.1009241.e383g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e383" xlink:type="simple"/><mml:math display="block" id="M383"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="right"><mml:mrow><mml:msub><mml:mi>q</mml:mi><mml:mrow><mml:mi>j</mml:mi><mml:mi>u</mml:mi></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:mfrac><mml:mrow><mml:mi>f</mml:mi><mml:mo>(</mml:mo><mml:mo>|</mml:mo><mml:msub><mml:mi>x</mml:mi><mml:mi>u</mml:mi></mml:msub><mml:mo>-</mml:mo><mml:msub><mml:mi>y</mml:mi><mml:mi>j</mml:mi></mml:msub><mml:mo>|</mml:mo><mml:mo>)</mml:mo></mml:mrow><mml:mrow><mml:mstyle displaystyle="true"><mml:munderover><mml:mo>∑</mml:mo><mml:mrow><mml:mi>v</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>K</mml:mi></mml:munderover></mml:mstyle><mml:mrow><mml:mi>f</mml:mi><mml:mo>(</mml:mo><mml:mo>|</mml:mo></mml:mrow><mml:msub><mml:mi>x</mml:mi><mml:mi>v</mml:mi></mml:msub><mml:mo>-</mml:mo><mml:msub><mml:mi>y</mml:mi><mml:mi>j</mml:mi></mml:msub><mml:mrow><mml:mo>|</mml:mo><mml:mo>)</mml:mo></mml:mrow></mml:mrow></mml:mfrac><mml:mo>.</mml:mo></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives></disp-formula>
where <italic>f</italic> is the Normal density function with <italic>μ</italic> = 0 and tunable <italic>σ</italic>. The Normal density models random walks, where <italic>σ</italic> sets the spread of the populations (<xref ref-type="fig" rid="pgen.1009241.g005">Fig 5</xref>). Our simulation uses <italic>x</italic><sub><italic>u</italic></sub> = <italic>u</italic> and <inline-formula id="pgen.1009241.e384"><alternatives><graphic id="pgen.1009241.e384g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e384" xlink:type="simple"/><mml:math display="inline" id="M384"><mml:mrow><mml:msub><mml:mi>y</mml:mi><mml:mi>j</mml:mi></mml:msub><mml:mo>=</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:mn>2</mml:mn></mml:mfrac><mml:mo>+</mml:mo><mml:mfrac><mml:mrow><mml:mi>j</mml:mi><mml:mo>-</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mrow><mml:mi>n</mml:mi><mml:mo>-</mml:mo><mml:mn>1</mml:mn></mml:mrow></mml:mfrac><mml:mi>K</mml:mi></mml:mrow></mml:math></alternatives></inline-formula>, so the intermediate subpopulations span between 1 and <italic>K</italic> and individuals span between <inline-formula id="pgen.1009241.e385"><alternatives><graphic id="pgen.1009241.e385g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e385" xlink:type="simple"/><mml:math display="inline" id="M385"><mml:mfrac><mml:mn>1</mml:mn><mml:mn>2</mml:mn></mml:mfrac></mml:math></alternatives></inline-formula> and <inline-formula id="pgen.1009241.e386"><alternatives><graphic id="pgen.1009241.e386g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e386" xlink:type="simple"/><mml:math display="inline" id="M386"><mml:mrow><mml:mi>K</mml:mi><mml:mo>+</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:mn>2</mml:mn></mml:mfrac></mml:mrow></mml:math></alternatives></inline-formula>. For the <italic>F</italic><sub>ST</sub> estimators that require subpopulations, individual <italic>j</italic> is assigned to the nearest subpopulation <italic>S</italic><sub><italic>u</italic></sub> (the <italic>u</italic> that minimizes |<italic>x</italic><sub><italic>u</italic></sub> − <italic>y</italic><sub><italic>j</italic></sub>|; <xref ref-type="fig" rid="pgen.1009241.g003">Fig 3D</xref>); these subpopulations have equal sample size, so <inline-formula id="pgen.1009241.e387"><alternatives><graphic id="pgen.1009241.e387g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e387" xlink:type="simple"/><mml:math display="inline" id="M387"><mml:mrow><mml:msub><mml:mi>w</mml:mi><mml:mi>j</mml:mi></mml:msub><mml:mo>=</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:mi>n</mml:mi></mml:mfrac></mml:mrow></mml:math></alternatives></inline-formula> is appropriate.</p>
</sec>
<sec id="sec038">
<title>Choosing <italic>σ</italic> and <italic>τ</italic></title>
<p>Here we find values for <italic>σ</italic> (controls <italic>q</italic><sub><italic>jk</italic></sub>) and <italic>τ</italic> (scales <inline-formula id="pgen.1009241.e388"><alternatives><graphic id="pgen.1009241.e388g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e388" xlink:type="simple"/><mml:math display="inline" id="M388"><mml:msubsup><mml:mi>f</mml:mi><mml:mrow><mml:msub><mml:mi>S</mml:mi><mml:mi>u</mml:mi></mml:msub></mml:mrow><mml:mi>T</mml:mi></mml:msubsup></mml:math></alternatives></inline-formula>) that give <inline-formula id="pgen.1009241.e389"><alternatives><graphic id="pgen.1009241.e389g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e389" xlink:type="simple"/><mml:math display="inline" id="M389"><mml:mrow><mml:msup><mml:mi>s</mml:mi><mml:mi>T</mml:mi></mml:msup><mml:mo>=</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:mn>2</mml:mn></mml:mfrac></mml:mrow></mml:math></alternatives></inline-formula> and <italic>F</italic><sub>ST</sub> = 0.1 in the admixture model. In our simulation, <inline-formula id="pgen.1009241.e390"><alternatives><graphic id="pgen.1009241.e390g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e390" xlink:type="simple"/><mml:math display="inline" id="M390"><mml:mrow><mml:msub><mml:mi>w</mml:mi><mml:mi>j</mml:mi></mml:msub><mml:mo>=</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:mi>n</mml:mi></mml:mfrac></mml:mrow></mml:math></alternatives></inline-formula> and <inline-formula id="pgen.1009241.e391"><alternatives><graphic id="pgen.1009241.e391g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e391" xlink:type="simple"/><mml:math display="inline" id="M391"><mml:mrow><mml:msubsup><mml:mi>f</mml:mi><mml:mrow><mml:msub><mml:mi>S</mml:mi><mml:mi>u</mml:mi></mml:msub></mml:mrow><mml:mi>T</mml:mi></mml:msubsup><mml:mo>=</mml:mo><mml:mfrac><mml:mi>u</mml:mi><mml:mi>K</mml:mi></mml:mfrac><mml:mi>τ</mml:mi></mml:mrow></mml:math></alternatives></inline-formula>, so applying those parameters to <xref ref-type="disp-formula" rid="pgen.1009241.e278">Eq (39)</xref> gives <inline-formula id="pgen.1009241.e392"><alternatives><graphic id="pgen.1009241.e392g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e392" xlink:type="simple"/><mml:math display="inline" id="M392"><mml:mrow><mml:msubsup><mml:mi>θ</mml:mi><mml:mrow><mml:mi>j</mml:mi><mml:mi>k</mml:mi></mml:mrow><mml:mi>T</mml:mi></mml:msubsup><mml:mo>=</mml:mo><mml:mfrac><mml:mi>τ</mml:mi><mml:mi>K</mml:mi></mml:mfrac><mml:msubsup><mml:mo>∑</mml:mo><mml:mrow><mml:mi>u</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>K</mml:mi></mml:msubsup><mml:mi>u</mml:mi><mml:msub><mml:mi>q</mml:mi><mml:mrow><mml:mi>j</mml:mi><mml:mi>u</mml:mi></mml:mrow></mml:msub><mml:msub><mml:mi>q</mml:mi><mml:mrow><mml:mi>k</mml:mi><mml:mi>u</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:math></alternatives></inline-formula> and <inline-formula id="pgen.1009241.e393"><alternatives><graphic id="pgen.1009241.e393g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e393" xlink:type="simple"/><mml:math display="inline" id="M393"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mtext>ST</mml:mtext></mml:msub><mml:mo>=</mml:mo><mml:mfrac><mml:mi>τ</mml:mi><mml:mrow><mml:mi>n</mml:mi><mml:mi>K</mml:mi></mml:mrow></mml:mfrac><mml:msubsup><mml:mo>∑</mml:mo><mml:mrow><mml:mi>j</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>n</mml:mi></mml:msubsup><mml:msubsup><mml:mo>∑</mml:mo><mml:mrow><mml:mi>u</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>K</mml:mi></mml:msubsup><mml:mi>u</mml:mi><mml:msubsup><mml:mi>q</mml:mi><mml:mrow><mml:mi>j</mml:mi><mml:mi>u</mml:mi></mml:mrow><mml:mn>2</mml:mn></mml:msubsup></mml:mrow></mml:math></alternatives></inline-formula>. Therefore,
<disp-formula id="pgen.1009241.e394"><alternatives><graphic id="pgen.1009241.e394g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e394" xlink:type="simple"/><mml:math display="block" id="M394"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="right"><mml:mrow><mml:msup><mml:mi>s</mml:mi><mml:mi>T</mml:mi></mml:msup><mml:mo>=</mml:mo><mml:mfrac><mml:msup><mml:mover accent="true"><mml:mi>θ</mml:mi><mml:mo>¯</mml:mo></mml:mover><mml:mi>T</mml:mi></mml:msup><mml:msub><mml:mi>F</mml:mi><mml:mtext>ST</mml:mtext></mml:msub></mml:mfrac><mml:mo>=</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:mi>n</mml:mi></mml:mfrac><mml:mfrac><mml:mrow><mml:mstyle displaystyle="true"><mml:munderover><mml:mo>∑</mml:mo><mml:mrow><mml:mi>u</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>K</mml:mi></mml:munderover></mml:mstyle><mml:mi>u</mml:mi><mml:msup><mml:mrow><mml:mo>(</mml:mo><mml:mstyle displaystyle="true"><mml:munderover><mml:mo>∑</mml:mo><mml:mrow><mml:mi>j</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>n</mml:mi></mml:munderover></mml:mstyle><mml:msub><mml:mi>q</mml:mi><mml:mrow><mml:mi>j</mml:mi><mml:mi>u</mml:mi></mml:mrow></mml:msub><mml:mrow><mml:mo>(</mml:mo><mml:mi>σ</mml:mi><mml:mo>)</mml:mo></mml:mrow><mml:mo>)</mml:mo></mml:mrow><mml:mn>2</mml:mn></mml:msup></mml:mrow><mml:mrow><mml:mstyle displaystyle="true"><mml:munderover><mml:mo>∑</mml:mo><mml:mrow><mml:mi>u</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>K</mml:mi></mml:munderover></mml:mstyle><mml:mi>u</mml:mi><mml:mo>(</mml:mo><mml:mstyle displaystyle="true"><mml:munderover><mml:mo>∑</mml:mo><mml:mrow><mml:mi>j</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>n</mml:mi></mml:munderover></mml:mstyle><mml:msubsup><mml:mi>q</mml:mi><mml:mrow><mml:mi>j</mml:mi><mml:mi>u</mml:mi></mml:mrow><mml:mn>2</mml:mn></mml:msubsup><mml:mrow><mml:mo>(</mml:mo><mml:mi>σ</mml:mi><mml:mo>)</mml:mo></mml:mrow><mml:mo>)</mml:mo></mml:mrow></mml:mfrac></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives></disp-formula>
depends only on <italic>σ</italic>. A numerical root finder finds that <italic>σ</italic> ≈ 1.78 gives <inline-formula id="pgen.1009241.e395"><alternatives><graphic id="pgen.1009241.e395g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e395" xlink:type="simple"/><mml:math display="inline" id="M395"><mml:mrow><mml:msup><mml:mi>s</mml:mi><mml:mi>T</mml:mi></mml:msup><mml:mo>=</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:mn>2</mml:mn></mml:mfrac></mml:mrow></mml:math></alternatives></inline-formula>. For fixed <italic>q</italic><sub><italic>ju</italic></sub>,
<disp-formula id="pgen.1009241.e396"><alternatives><graphic id="pgen.1009241.e396g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e396" xlink:type="simple"/><mml:math display="block" id="M396"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="right"><mml:mrow><mml:mi>τ</mml:mi><mml:mo>=</mml:mo><mml:mfrac><mml:msub><mml:mi>F</mml:mi><mml:mtext>ST</mml:mtext></mml:msub><mml:mrow><mml:mfrac><mml:mn>1</mml:mn><mml:mi>K</mml:mi></mml:mfrac><mml:mstyle displaystyle="true"><mml:munderover><mml:mo>∑</mml:mo><mml:mrow><mml:mi>u</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>K</mml:mi></mml:munderover></mml:mstyle><mml:mi>u</mml:mi><mml:mo>(</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:mi>n</mml:mi></mml:mfrac><mml:mstyle displaystyle="true"><mml:munderover><mml:mo>∑</mml:mo><mml:mrow><mml:mi>j</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>n</mml:mi></mml:munderover></mml:mstyle><mml:msubsup><mml:mi>q</mml:mi><mml:mrow><mml:mi>j</mml:mi><mml:mi>u</mml:mi></mml:mrow><mml:mn>2</mml:mn></mml:msubsup><mml:mo>)</mml:mo></mml:mrow></mml:mfrac><mml:mo>.</mml:mo></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives></disp-formula> <italic>F</italic><sub>ST</sub> = 0.1 is achieved with <italic>τ</italic> ≈ 0.901.</p>
</sec>
</sec>
<sec id="sec039">
<title>Prediction intervals</title>
<p>Prediction intervals with <italic>α</italic> = 95% correspond to the range of <italic>n</italic> = 39 independent <italic>F</italic><sub>ST</sub> estimates. In the general case, <italic>n</italic> independent statistics are given in order <italic>X</italic><sub>(1)</sub> &lt; … &lt; <italic>X</italic><sub>(<italic>n</italic>)</sub>. Then <italic>I</italic> = [<italic>X</italic><sub>(<italic>j</italic>)</sub>, <italic>X</italic><sub>(<italic>n</italic>+1−<italic>j</italic>)</sub>] is a prediction interval with confidence <inline-formula id="pgen.1009241.e397"><alternatives><graphic id="pgen.1009241.e397g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e397" xlink:type="simple"/><mml:math display="inline" id="M397"><mml:mrow><mml:mi>α</mml:mi><mml:mo>=</mml:mo><mml:mfrac><mml:mrow><mml:mi>n</mml:mi><mml:mo>+</mml:mo><mml:mn>1</mml:mn><mml:mo>-</mml:mo><mml:mn>2</mml:mn><mml:mi>j</mml:mi></mml:mrow><mml:mrow><mml:mi>n</mml:mi><mml:mo>+</mml:mo><mml:mn>1</mml:mn></mml:mrow></mml:mfrac></mml:mrow></mml:math></alternatives></inline-formula> [<xref ref-type="bibr" rid="pgen.1009241.ref096">96</xref>]. In our case, <italic>j</italic> = 1 and <italic>n</italic> = 39 gives <italic>α</italic> = 0.95, as desired. Each estimate was constructed from simulated data with the same dimensions and structure as before (fixed <inline-formula id="pgen.1009241.e398"><alternatives><graphic id="pgen.1009241.e398g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e398" xlink:type="simple"/><mml:math display="inline" id="M398"><mml:msubsup><mml:mi>f</mml:mi><mml:mrow><mml:msub><mml:mi>S</mml:mi><mml:mi>u</mml:mi></mml:msub></mml:mrow><mml:mi>T</mml:mi></mml:msubsup></mml:math></alternatives></inline-formula> and <italic>q</italic><sub><italic>ju</italic></sub>; fixed sample sizes for the independent subpopulations model), but with <inline-formula id="pgen.1009241.e399"><alternatives><graphic id="pgen.1009241.e399g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pgen.1009241.e399" xlink:type="simple"/><mml:math display="inline" id="M399"><mml:mrow><mml:msubsup><mml:mi>p</mml:mi><mml:mi>i</mml:mi><mml:mi>T</mml:mi></mml:msubsup><mml:mo>,</mml:mo><mml:msubsup><mml:mi>p</mml:mi><mml:mi>i</mml:mi><mml:msub><mml:mi>S</mml:mi><mml:mi>u</mml:mi></mml:msub></mml:msubsup><mml:mo>,</mml:mo><mml:msub><mml:mi>π</mml:mi><mml:mrow><mml:mi>i</mml:mi><mml:mi>j</mml:mi></mml:mrow></mml:msub><mml:mo>,</mml:mo><mml:msub><mml:mi>x</mml:mi><mml:mrow><mml:mi>i</mml:mi><mml:mi>j</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:math></alternatives></inline-formula> drawn separately for each estimate.</p>
</sec>
<sec id="sec040">
<title>BayeScan and Weir-Goudet implementations</title>
<p>Weir-Goudet (WG) kinship estimates [<xref ref-type="bibr" rid="pgen.1009241.ref020">20</xref>–<xref ref-type="bibr" rid="pgen.1009241.ref022">22</xref>] were calculated using the function <monospace>snpgdsIndivBeta</monospace> in the R package <monospace>SNPRelate</monospace> 1.20.1 available on Bioconductor and GitHub. We found identical estimates using the function <monospace>beta.dosage</monospace> in the R package <monospace>hierfstat</monospace> 0.4.30 available on GitHub. WG (individuals) <italic>F</italic><sub>ST</sub> estimates were computed from the kinship estimates as described in section <bold>Comparison to the Weir-Goudet kinship estimator for individuals</bold>.</p>
<p>BayeScan 2.1 was downloaded from <ext-link ext-link-type="uri" xlink:href="http://cmpg.unibe.ch/software/BayeScan/" xlink:type="simple">http://cmpg.unibe.ch/software/BayeScan/</ext-link>. To estimate <italic>F</italic><sub>ST</sub>, first the per-subpopulation <italic>F</italic><sub>ST</sub> values were estimated across loci assuming no selection, then the global <italic>F</italic><sub>ST</sub> was given by the mean <italic>F</italic><sub>ST</sub> across subpopulations.</p>
</sec>
<sec id="sec041">
<title>Software</title>
<p>An R package called <monospace>popkin</monospace>, which implements the kinship and <italic>F</italic><sub>ST</sub> estimation methods proposed here, is available on the Comprehensive R Archive Network (CRAN) at <ext-link ext-link-type="uri" xlink:href="https://cran.r-project.org/package=popkin" xlink:type="simple">https://cran.r-project.org/package=popkin</ext-link> and on GitHub at <ext-link ext-link-type="uri" xlink:href="https://github.com/StoreyLab/popkin" xlink:type="simple">https://github.com/StoreyLab/popkin</ext-link>.</p>
<p>An R package called <monospace>bnpsd</monospace>, which implements the BN-PSD admixture simulation, is available on CRAN at <ext-link ext-link-type="uri" xlink:href="https://cran.r-project.org/package=bnpsd" xlink:type="simple">https://cran.r-project.org/package=bnpsd</ext-link> and on GitHub at <ext-link ext-link-type="uri" xlink:href="https://github.com/StoreyLab/bnpsd" xlink:type="simple">https://github.com/StoreyLab/bnpsd</ext-link>.</p>
<p>An R package called <monospace>popkinsuppl</monospace>, which implements memory-efficient algorithms for the Weir-Cockerham, Weir-Hill, and HudsonK <italic>F</italic><sub>ST</sub> estimators, and the standard kinship estimator, is available on GitHub at <ext-link ext-link-type="uri" xlink:href="https://github.com/OchoaLab/popkinsuppl" xlink:type="simple">https://github.com/OchoaLab/popkinsuppl</ext-link>.</p>
<p>Public code reproducing these analyses are available at <ext-link ext-link-type="uri" xlink:href="https://github.com/StoreyLab/human-differentiation-manuscript" xlink:type="simple">https://github.com/StoreyLab/human-differentiation-manuscript</ext-link>.</p>
</sec>
</sec>
<sec id="sec042" sec-type="supplementary-material">
<title>Supporting information</title>
<supplementary-material id="pgen.1009241.s001" mimetype="application/pdf" position="float" xlink:href="info:doi/10.1371/journal.pgen.1009241.s001" xlink:type="simple">
<label>S1 Text</label>
<caption>
<title>Supplementary information.</title>
<p>Includes mathematical proofs and other calculations, including proof of convergence of ratio-of-means estimators, proof that the Weir-Goudet <italic>F</italic><sub>ST</sub> estimator for subpopulations equals HudsonK, derivation of existing method-of-moment estimators, proof that <italic>F</italic><sub>ST</sub> and kinship estimator limits are constants with respect to the ancestral population <italic>T</italic>, mean coancestry bounds, moments of estimator building blocks, the derivation of our new kinship estimator, and proof that our estimator from our original 2016 manuscript is algebraically equivalent to the one presented here.</p>
<p>(PDF)</p>
</caption>
</supplementary-material>
</sec>
</body>
<back>
<ref-list>
<title>References</title>
<ref id="pgen.1009241.ref001"><label>1</label><mixed-citation publication-type="book" xlink:type="simple"><name name-style="western"><surname>Malécot</surname> <given-names>G</given-names></name>. <source>Mathématiques de l’hérédité</source>. <publisher-name>Masson et Cie</publisher-name>; <year>1948</year>.</mixed-citation></ref>
<ref id="pgen.1009241.ref002"><label>2</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Wright</surname> <given-names>S</given-names></name>. <article-title>The genetical structure of populations</article-title>. <source>Ann Eugen</source>. <year>1951</year>;<volume>15</volume>(<issue>4</issue>):<fpage>323</fpage>–<lpage>354</lpage>.</mixed-citation></ref>
<ref id="pgen.1009241.ref003"><label>3</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Balding</surname> <given-names>DJ</given-names></name>, <name name-style="western"><surname>Nichols</surname> <given-names>RA</given-names></name>. <article-title>A method for quantifying differentiation between populations at multi-allelic loci and its implications for investigating identity and paternity</article-title>. <source>Genetica</source>. <year>1995</year>;<volume>96</volume>(<issue>1-2</issue>):<fpage>3</fpage>–<lpage>12</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1007/BF01441146" xlink:type="simple">10.1007/BF01441146</ext-link></comment></mixed-citation></ref>
<ref id="pgen.1009241.ref004"><label>4</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Weir</surname> <given-names>BS</given-names></name>, <name name-style="western"><surname>Hill</surname> <given-names>WG</given-names></name>. <article-title>Estimating F-Statistics</article-title>. <source>Annual Review of Genetics</source>. <year>2002</year>;<volume>36</volume>(<issue>1</issue>):<fpage>721</fpage>–<lpage>750</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1146/annurev.genet.36.050802.093940" xlink:type="simple">10.1146/annurev.genet.36.050802.093940</ext-link></comment></mixed-citation></ref>
<ref id="pgen.1009241.ref005"><label>5</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Nicholson</surname> <given-names>G</given-names></name>, <name name-style="western"><surname>Smith</surname> <given-names>AV</given-names></name>, <name name-style="western"><surname>Jónsson</surname> <given-names>F</given-names></name>, <name name-style="western"><surname>Gústafsson</surname> <given-names>O</given-names></name>, <name name-style="western"><surname>Stefánsson</surname> <given-names>K</given-names></name>, <name name-style="western"><surname>Donnelly</surname> <given-names>P</given-names></name>. <article-title>Assessing population differentiation and isolation from single-nucleotide polymorphism data</article-title>. <source>Journal of the Royal Statistical Society: Series B (Statistical Methodology)</source>. <year>2002</year>;<volume>64</volume>(<issue>4</issue>):<fpage>695</fpage>–<lpage>715</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1111/1467-9868.00357" xlink:type="simple">10.1111/1467-9868.00357</ext-link></comment></mixed-citation></ref>
<ref id="pgen.1009241.ref006"><label>6</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Falush</surname> <given-names>D</given-names></name>, <name name-style="western"><surname>Stephens</surname> <given-names>M</given-names></name>, <name name-style="western"><surname>Pritchard</surname> <given-names>JK</given-names></name>. <article-title>Inference of population structure using multilocus genotype data: linked loci and correlated allele frequencies</article-title>. <source>Genetics</source>. <year>2003</year>;<volume>164</volume>(<issue>4</issue>):<fpage>1567</fpage>–<lpage>1587</lpage>.</mixed-citation></ref>
<ref id="pgen.1009241.ref007"><label>7</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Balding</surname> <given-names>DJ</given-names></name>. <article-title>Likelihood-based inference for genetic correlation coefficients</article-title>. <source>Theoretical Population Biology</source>. <year>2003</year>;<volume>63</volume>(<issue>3</issue>):<fpage>221</fpage>–<lpage>230</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1016/S0040-5809(03)00007-8" xlink:type="simple">10.1016/S0040-5809(03)00007-8</ext-link></comment></mixed-citation></ref>
<ref id="pgen.1009241.ref008"><label>8</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Beaumont</surname> <given-names>MA</given-names></name>, <name name-style="western"><surname>Balding</surname> <given-names>DJ</given-names></name>. <article-title>Identifying adaptive genetic divergence among populations from genome scans</article-title>. <source>Molecular Ecology</source>. <year>2004</year>;<volume>13</volume>(<issue>4</issue>):<fpage>969</fpage>–<lpage>980</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1111/j.1365-294X.2004.02125.x" xlink:type="simple">10.1111/j.1365-294X.2004.02125.x</ext-link></comment></mixed-citation></ref>
<ref id="pgen.1009241.ref009"><label>9</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Foll</surname> <given-names>M</given-names></name>, <name name-style="western"><surname>Gaggiotti</surname> <given-names>O</given-names></name>. <article-title>Identifying the Environmental Factors That Determine the Genetic Structure of Populations</article-title>. <source>Genetics</source>. <year>2006</year>;<volume>174</volume>(<issue>2</issue>):<fpage>875</fpage>–<lpage>891</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1534/genetics.106.059451" xlink:type="simple">10.1534/genetics.106.059451</ext-link></comment></mixed-citation></ref>
<ref id="pgen.1009241.ref010"><label>10</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Foll</surname> <given-names>M</given-names></name>, <name name-style="western"><surname>Gaggiotti</surname> <given-names>O</given-names></name>. <article-title>A genome-scan method to identify selected loci appropriate for both dominant and codominant markers: a Bayesian perspective</article-title>. <source>Genetics</source>. <year>2008</year>;<volume>180</volume>(<issue>2</issue>):<fpage>977</fpage>–<lpage>993</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1534/genetics.108.092221" xlink:type="simple">10.1534/genetics.108.092221</ext-link></comment></mixed-citation></ref>
<ref id="pgen.1009241.ref011"><label>11</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Coop</surname> <given-names>G</given-names></name>, <name name-style="western"><surname>Witonsky</surname> <given-names>D</given-names></name>, <name name-style="western"><surname>Rienzo</surname> <given-names>AD</given-names></name>, <name name-style="western"><surname>Pritchard</surname> <given-names>JK</given-names></name>. <article-title>Using Environmental Correlations to Identify Loci Underlying Local Adaptation</article-title>. <source>Genetics</source>. <year>2010</year>;<volume>185</volume>(<issue>4</issue>):<fpage>1411</fpage>–<lpage>1423</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1534/genetics.110.114819" xlink:type="simple">10.1534/genetics.110.114819</ext-link></comment></mixed-citation></ref>
<ref id="pgen.1009241.ref012"><label>12</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Thompson</surname> <given-names>EA</given-names></name>. <article-title>The estimation of pairwise relationships</article-title>. <source>Ann Hum Genet</source>. <year>1975</year>;<volume>39</volume>(<issue>2</issue>):<fpage>173</fpage>–<lpage>188</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1111/j.1469-1809.1975.tb00120.x" xlink:type="simple">10.1111/j.1469-1809.1975.tb00120.x</ext-link></comment></mixed-citation></ref>
<ref id="pgen.1009241.ref013"><label>13</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Milligan</surname> <given-names>BG</given-names></name>. <article-title>Maximum-likelihood estimation of relatedness</article-title>. <source>Genetics</source>. <year>2003</year>;<volume>163</volume>(<issue>3</issue>):<fpage>1153</fpage>–<lpage>1167</lpage>.</mixed-citation></ref>
<ref id="pgen.1009241.ref014"><label>14</label><mixed-citation publication-type="book" xlink:type="simple"><name name-style="western"><surname>Jacquard</surname> <given-names>A</given-names></name>. <source>Structures génétiques des populations</source>. <publisher-loc>Paris</publisher-loc>: <publisher-name>Masson et Cie</publisher-name>; <year>1970</year>.</mixed-citation></ref>
<ref id="pgen.1009241.ref015"><label>15</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Csűrös</surname> <given-names>M</given-names></name>. <article-title>Non-identifiability of identity coefficients at biallelic loci</article-title>. <source>Theor Popul Biol</source>. <year>2014</year>;<volume>92</volume>:<fpage>22</fpage>–<lpage>29</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1016/j.tpb.2013.11.001" xlink:type="simple">10.1016/j.tpb.2013.11.001</ext-link></comment></mixed-citation></ref>
<ref id="pgen.1009241.ref016"><label>16</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Astle</surname> <given-names>W</given-names></name>, <name name-style="western"><surname>Balding</surname> <given-names>DJ</given-names></name>. <article-title>Population Structure and Cryptic Relatedness in Genetic Association Studies</article-title>. <source>Statist Sci</source>. <year>2009</year>;<volume>24</volume>(<issue>4</issue>):<fpage>451</fpage>–<lpage>471</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1214/09-STS307" xlink:type="simple">10.1214/09-STS307</ext-link></comment></mixed-citation></ref>
<ref id="pgen.1009241.ref017"><label>17</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Weir</surname> <given-names>BS</given-names></name>, <name name-style="western"><surname>Cockerham</surname> <given-names>CC</given-names></name>. <article-title>Estimating F-Statistics for the Analysis of Population Structure</article-title>. <source>Evolution</source>. <year>1984</year>;<volume>38</volume>(<issue>6</issue>):<fpage>1358</fpage>–<lpage>1370</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1111/j.1558-5646.1984.tb05657.x" xlink:type="simple">10.1111/j.1558-5646.1984.tb05657.x</ext-link></comment></mixed-citation></ref>
<ref id="pgen.1009241.ref018"><label>18</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Weir</surname> <given-names>BS</given-names></name>, <name name-style="western"><surname>Cardon</surname> <given-names>LR</given-names></name>, <name name-style="western"><surname>Anderson</surname> <given-names>AD</given-names></name>, <name name-style="western"><surname>Nielsen</surname> <given-names>DM</given-names></name>, <name name-style="western"><surname>Hill</surname> <given-names>WG</given-names></name>. <article-title>Measures of human population structure show heterogeneity among genomic regions</article-title>. <source>Genome Res</source>. <year>2005</year>;<volume>15</volume>(<issue>11</issue>):<fpage>1468</fpage>–<lpage>1476</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1101/gr.4398405" xlink:type="simple">10.1101/gr.4398405</ext-link></comment></mixed-citation></ref>
<ref id="pgen.1009241.ref019"><label>19</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Buckleton</surname> <given-names>J</given-names></name>, <name name-style="western"><surname>Curran</surname> <given-names>J</given-names></name>, <name name-style="western"><surname>Goudet</surname> <given-names>J</given-names></name>, <name name-style="western"><surname>Taylor</surname> <given-names>D</given-names></name>, <name name-style="western"><surname>Thiery</surname> <given-names>A</given-names></name>, <name name-style="western"><surname>Weir</surname> <given-names>BS</given-names></name>. <article-title>Population-specific FST values for forensic STR markers: A worldwide survey</article-title>. <source>Forensic Science International: Genetics</source>. <year>2016</year>;<volume>23</volume>:<fpage>91</fpage>–<lpage>100</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1016/j.fsigen.2016.03.004" xlink:type="simple">10.1016/j.fsigen.2016.03.004</ext-link></comment></mixed-citation></ref>
<ref id="pgen.1009241.ref020"><label>20</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Weir</surname> <given-names>B</given-names></name>, <name name-style="western"><surname>Zheng</surname> <given-names>X</given-names></name>. <article-title>SNPs and SNVs in forensic science</article-title>. <source>Forensic Science International: Genetics Supplement Series</source>. <year>2015</year>;<volume>5</volume>(<issue>Dec</issue>):<fpage>e267</fpage>–<lpage>e268</lpage>.</mixed-citation></ref>
<ref id="pgen.1009241.ref021"><label>21</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Weir</surname> <given-names>BS</given-names></name>, <name name-style="western"><surname>Goudet</surname> <given-names>J</given-names></name>. <article-title>A Unified Characterization of Population Structure and Relatedness</article-title>. <source>Genetics</source>. <year>2017</year>;<volume>206</volume>(<issue>4</issue>):<fpage>2085</fpage>–<lpage>2103</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1534/genetics.116.198424" xlink:type="simple">10.1534/genetics.116.198424</ext-link></comment></mixed-citation></ref>
<ref id="pgen.1009241.ref022"><label>22</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Goudet</surname> <given-names>J</given-names></name>, <name name-style="western"><surname>Kay</surname> <given-names>T</given-names></name>, <name name-style="western"><surname>Weir</surname> <given-names>BS</given-names></name>. <article-title>How to estimate kinship</article-title>. <source>Mol Ecol</source>. <year>2018</year>;<volume>27</volume>(<issue>20</issue>):<fpage>4121</fpage>–<lpage>4135</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1111/mec.14833" xlink:type="simple">10.1111/mec.14833</ext-link></comment></mixed-citation></ref>
<ref id="pgen.1009241.ref023"><label>23</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Bhatia</surname> <given-names>G</given-names></name>, <name name-style="western"><surname>Patterson</surname> <given-names>N</given-names></name>, <name name-style="western"><surname>Sankararaman</surname> <given-names>S</given-names></name>, <name name-style="western"><surname>Price</surname> <given-names>AL</given-names></name>. <article-title>Estimating and interpreting FST: the impact of rare variants</article-title>. <source>Genome Res</source>. <year>2013</year>;<volume>23</volume>(<issue>9</issue>):<fpage>1514</fpage>–<lpage>1521</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1101/gr.154831.113" xlink:type="simple">10.1101/gr.154831.113</ext-link></comment></mixed-citation></ref>
<ref id="pgen.1009241.ref024"><label>24</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Xie</surname> <given-names>C</given-names></name>, <name name-style="western"><surname>Gessler</surname> <given-names>DD</given-names></name>, <name name-style="western"><surname>Xu</surname> <given-names>S</given-names></name>. <article-title>Combining different line crosses for mapping quantitative trait loci using the identical by descent-based variance component method</article-title>. <source>Genetics</source>. <year>1998</year>;<volume>149</volume>(<issue>2</issue>):<fpage>1139</fpage>–<lpage>1146</lpage>.</mixed-citation></ref>
<ref id="pgen.1009241.ref025"><label>25</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Yu</surname> <given-names>J</given-names></name>, <name name-style="western"><surname>Pressoir</surname> <given-names>G</given-names></name>, <name name-style="western"><surname>Briggs</surname> <given-names>WH</given-names></name>, <name name-style="western"><surname>Vroh Bi</surname> <given-names>I</given-names></name>, <name name-style="western"><surname>Yamasaki</surname> <given-names>M</given-names></name>, <name name-style="western"><surname>Doebley</surname> <given-names>JF</given-names></name>, <etal>et al</etal>. <article-title>A unified mixed-model method for association mapping that accounts for multiple levels of relatedness</article-title>. <source>Nat Genet</source>. <year>2006</year>;<volume>38</volume>(<issue>2</issue>):<fpage>203</fpage>–<lpage>208</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1038/ng1702" xlink:type="simple">10.1038/ng1702</ext-link></comment> <object-id pub-id-type="pmid">16380716</object-id></mixed-citation></ref>
<ref id="pgen.1009241.ref026"><label>26</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Aulchenko</surname> <given-names>YS</given-names></name>, <name name-style="western"><surname>de Koning</surname> <given-names>DJ</given-names></name>, <name name-style="western"><surname>Haley</surname> <given-names>C</given-names></name>. <article-title>Genomewide rapid association using mixed model and regression: a fast and simple method for genomewide pedigree-based quantitative trait loci association analysis</article-title>. <source>Genetics</source>. <year>2007</year>;<volume>177</volume>(<issue>1</issue>):<fpage>577</fpage>–<lpage>585</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1534/genetics.107.075614" xlink:type="simple">10.1534/genetics.107.075614</ext-link></comment></mixed-citation></ref>
<ref id="pgen.1009241.ref027"><label>27</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Price</surname> <given-names>AL</given-names></name>, <name name-style="western"><surname>Patterson</surname> <given-names>NJ</given-names></name>, <name name-style="western"><surname>Plenge</surname> <given-names>RM</given-names></name>, <name name-style="western"><surname>Weinblatt</surname> <given-names>ME</given-names></name>, <name name-style="western"><surname>Shadick</surname> <given-names>NA</given-names></name>, <name name-style="western"><surname>Reich</surname> <given-names>D</given-names></name>. <article-title>Principal components analysis corrects for stratification in genome-wide association studies</article-title>. <source>Nat Genet</source>. <year>2006</year>;<volume>38</volume>(<issue>8</issue>):<fpage>904</fpage>–<lpage>909</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1038/ng1847" xlink:type="simple">10.1038/ng1847</ext-link></comment></mixed-citation></ref>
<ref id="pgen.1009241.ref028"><label>28</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Kang</surname> <given-names>HM</given-names></name>, <name name-style="western"><surname>Zaitlen</surname> <given-names>NA</given-names></name>, <name name-style="western"><surname>Wade</surname> <given-names>CM</given-names></name>, <name name-style="western"><surname>Kirby</surname> <given-names>A</given-names></name>, <name name-style="western"><surname>Heckerman</surname> <given-names>D</given-names></name>, <name name-style="western"><surname>Daly</surname> <given-names>MJ</given-names></name>, <etal>et al</etal>. <article-title>Efficient control of population structure in model organism association mapping</article-title>. <source>Genetics</source>. <year>2008</year>;<volume>178</volume>(<issue>3</issue>):<fpage>1709</fpage>–<lpage>1723</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1534/genetics.107.080101" xlink:type="simple">10.1534/genetics.107.080101</ext-link></comment> <object-id pub-id-type="pmid">18385116</object-id></mixed-citation></ref>
<ref id="pgen.1009241.ref029"><label>29</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Kang</surname> <given-names>HM</given-names></name>, <name name-style="western"><surname>Sul</surname> <given-names>JH</given-names></name>, <name name-style="western"><surname>Service</surname> <given-names>SK</given-names></name>, <name name-style="western"><surname>Zaitlen</surname> <given-names>NA</given-names></name>, <name name-style="western"><surname>Kong</surname> <given-names>SY</given-names></name>, <name name-style="western"><surname>Freimer</surname> <given-names>NB</given-names></name>, <etal>et al</etal>. <article-title>Variance component model to account for sample structure in genome-wide association studies</article-title>. <source>Nat Genet</source>. <year>2010</year>;<volume>42</volume>(<issue>4</issue>):<fpage>348</fpage>–<lpage>354</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1038/ng.548" xlink:type="simple">10.1038/ng.548</ext-link></comment> <object-id pub-id-type="pmid">20208533</object-id></mixed-citation></ref>
<ref id="pgen.1009241.ref030"><label>30</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Zhou</surname> <given-names>X</given-names></name>, <name name-style="western"><surname>Stephens</surname> <given-names>M</given-names></name>. <article-title>Genome-wide efficient mixed-model analysis for association studies</article-title>. <source>Nat Genet</source>. <year>2012</year>;<volume>44</volume>(<issue>7</issue>):<fpage>821</fpage>–<lpage>824</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1038/ng.2310" xlink:type="simple">10.1038/ng.2310</ext-link></comment></mixed-citation></ref>
<ref id="pgen.1009241.ref031"><label>31</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Yang</surname> <given-names>J</given-names></name>, <name name-style="western"><surname>Benyamin</surname> <given-names>B</given-names></name>, <name name-style="western"><surname>McEvoy</surname> <given-names>BP</given-names></name>, <name name-style="western"><surname>Gordon</surname> <given-names>S</given-names></name>, <name name-style="western"><surname>Henders</surname> <given-names>AK</given-names></name>, <name name-style="western"><surname>Nyholt</surname> <given-names>DR</given-names></name>, <etal>et al</etal>. <article-title>Common SNPs explain a large proportion of the heritability for human height</article-title>. <source>Nat Genet</source>. <year>2010</year>;<volume>42</volume>(<issue>7</issue>):<fpage>565</fpage>–<lpage>569</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1038/ng.608" xlink:type="simple">10.1038/ng.608</ext-link></comment> <object-id pub-id-type="pmid">20562875</object-id></mixed-citation></ref>
<ref id="pgen.1009241.ref032"><label>32</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Yang</surname> <given-names>J</given-names></name>, <name name-style="western"><surname>Lee</surname> <given-names>SH</given-names></name>, <name name-style="western"><surname>Goddard</surname> <given-names>ME</given-names></name>, <name name-style="western"><surname>Visscher</surname> <given-names>PM</given-names></name>. <article-title>GCTA: a tool for genome-wide complex trait analysis</article-title>. <source>Am J Hum Genet</source>. <year>2011</year>;<volume>88</volume>(<issue>1</issue>):<fpage>76</fpage>–<lpage>82</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1016/j.ajhg.2010.11.011" xlink:type="simple">10.1016/j.ajhg.2010.11.011</ext-link></comment></mixed-citation></ref>
<ref id="pgen.1009241.ref033"><label>33</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Rakovski</surname> <given-names>CS</given-names></name>, <name name-style="western"><surname>Stram</surname> <given-names>DO</given-names></name>. <article-title>A kinship-based modification of the armitage trend test to address hidden population structure and small differential genotyping errors</article-title>. <source>PLoS ONE</source>. <year>2009</year>;<volume>4</volume>(<issue>6</issue>):<fpage>e5825</fpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1371/journal.pone.0005825" xlink:type="simple">10.1371/journal.pone.0005825</ext-link></comment></mixed-citation></ref>
<ref id="pgen.1009241.ref034"><label>34</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Thornton</surname> <given-names>T</given-names></name>, <name name-style="western"><surname>McPeek</surname> <given-names>MS</given-names></name>. <article-title>ROADTRIPS: case-control association testing with partially or completely unknown population and pedigree structure</article-title>. <source>Am J Hum Genet</source>. <year>2010</year>;<volume>86</volume>(<issue>2</issue>):<fpage>172</fpage>–<lpage>184</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1016/j.ajhg.2010.01.001" xlink:type="simple">10.1016/j.ajhg.2010.01.001</ext-link></comment></mixed-citation></ref>
<ref id="pgen.1009241.ref035"><label>35</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Speed</surname> <given-names>D</given-names></name>, <name name-style="western"><surname>Balding</surname> <given-names>DJ</given-names></name>. <article-title>Relatedness in the post-genomic era: is it still useful?</article-title> <source>Nat Rev Genet</source>. <year>2015</year>;<volume>16</volume>(<issue>1</issue>):<fpage>33</fpage>–<lpage>44</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1038/nrg3821" xlink:type="simple">10.1038/nrg3821</ext-link></comment></mixed-citation></ref>
<ref id="pgen.1009241.ref036"><label>36</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Wang</surname> <given-names>B</given-names></name>, <name name-style="western"><surname>Sverdlov</surname> <given-names>S</given-names></name>, <name name-style="western"><surname>Thompson</surname> <given-names>E</given-names></name>. <article-title>Efficient Estimation of Realized Kinship from SNP Genotypes</article-title>. <source>Genetics</source>. <year>2017</year>; p. genetics.116.197004. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1534/genetics.116.197004" xlink:type="simple">10.1534/genetics.116.197004</ext-link></comment></mixed-citation></ref>
<ref id="pgen.1009241.ref037"><label>37</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Wright</surname> <given-names>S</given-names></name>. <article-title>Systems of Mating. V. General Considerations</article-title>. <source>Genetics</source>. <year>1921</year>;<volume>6</volume>(<issue>2</issue>):<fpage>167</fpage>–<lpage>178</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1093/genetics/6.2.167" xlink:type="simple">10.1093/genetics/6.2.167</ext-link></comment></mixed-citation></ref>
<ref id="pgen.1009241.ref038"><label>38</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Lush</surname> <given-names>JL</given-names></name>. <article-title>Heritability of Quantitative Characters in Farm Animals</article-title>. <source>Hereditas</source>. <year>1949</year>;<volume>35</volume>(<issue>S1</issue>):<fpage>356</fpage>–<lpage>375</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1111/j.1601-5223.1949.tb03347.x" xlink:type="simple">10.1111/j.1601-5223.1949.tb03347.x</ext-link></comment></mixed-citation></ref>
<ref id="pgen.1009241.ref039"><label>39</label><mixed-citation publication-type="book" xlink:type="simple"><name name-style="western"><surname>Falconer</surname> <given-names>DS</given-names></name>, <name name-style="western"><surname>Mackay</surname> <given-names>TFC</given-names></name>. <source>Introduction to Quantitative Genetics</source>. <edition designator="4">4th ed</edition>. <publisher-loc>Harlow</publisher-loc>: <publisher-name>Pearson</publisher-name>; <year>1996</year>.</mixed-citation></ref>
<ref id="pgen.1009241.ref040"><label>40</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Thompson</surname> <given-names>EA</given-names></name>. <article-title>Identity by descent: variation in meiosis, across genomes, and in populations</article-title>. <source>Genetics</source>. <year>2013</year>;<volume>194</volume>(<issue>2</issue>):<fpage>301</fpage>–<lpage>326</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1534/genetics.112.148825" xlink:type="simple">10.1534/genetics.112.148825</ext-link></comment></mixed-citation></ref>
<ref id="pgen.1009241.ref041"><label>41</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Slatkin</surname> <given-names>M</given-names></name>. <article-title>Inbreeding coefficients and coalescence times</article-title>. <source>Genetics Research</source>. <year>1991</year>;<volume>58</volume>(<issue>2</issue>):<fpage>167</fpage>–<lpage>175</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1017/S0016672300029827" xlink:type="simple">10.1017/S0016672300029827</ext-link></comment></mixed-citation></ref>
<ref id="pgen.1009241.ref042"><label>42</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Emik</surname> <given-names>LO</given-names></name>, <name name-style="western"><surname>Terrill</surname> <given-names>CE</given-names></name>. <article-title>Systematic procedures for calculating inbreeding coefficients</article-title>. <source>J Hered</source>. <year>1949</year>;<volume>40</volume>(<issue>2</issue>):<fpage>51</fpage>–<lpage>55</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1093/oxfordjournals.jhered.a105986" xlink:type="simple">10.1093/oxfordjournals.jhered.a105986</ext-link></comment></mixed-citation></ref>
<ref id="pgen.1009241.ref043"><label>43</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>García-Cortés</surname> <given-names>LA</given-names></name>. <article-title>A novel recursive algorithm for the calculation of the detailed identity coefficients</article-title>. <source>Genetics Selection Evolution</source>. <year>2015</year>;<volume>47</volume>(<issue>1</issue>):<fpage>33</fpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1186/s12711-015-0108-6" xlink:type="simple">10.1186/s12711-015-0108-6</ext-link></comment></mixed-citation></ref>
<ref id="pgen.1009241.ref044"><label>44</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Rosenberg</surname> <given-names>NA</given-names></name>, <name name-style="western"><surname>Pritchard</surname> <given-names>JK</given-names></name>, <name name-style="western"><surname>Weber</surname> <given-names>JL</given-names></name>, <name name-style="western"><surname>Cann</surname> <given-names>HM</given-names></name>, <name name-style="western"><surname>Kidd</surname> <given-names>KK</given-names></name>, <name name-style="western"><surname>Zhivotovsky</surname> <given-names>LA</given-names></name>, <etal>et al</etal>. <article-title>Genetic Structure of Human Populations</article-title>. <source>Science</source>. <year>2002</year>;<volume>298</volume>(<issue>5602</issue>):<fpage>2381</fpage>–<lpage>2385</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1126/science.1078311" xlink:type="simple">10.1126/science.1078311</ext-link></comment> <object-id pub-id-type="pmid">12493913</object-id></mixed-citation></ref>
<ref id="pgen.1009241.ref045"><label>45</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Ramachandran</surname> <given-names>S</given-names></name>, <name name-style="western"><surname>Deshpande</surname> <given-names>O</given-names></name>, <name name-style="western"><surname>Roseman</surname> <given-names>CC</given-names></name>, <name name-style="western"><surname>Rosenberg</surname> <given-names>NA</given-names></name>, <name name-style="western"><surname>Feldman</surname> <given-names>MW</given-names></name>, <name name-style="western"><surname>Cavalli-Sforza</surname> <given-names>LL</given-names></name>. <article-title>Support from the relationship of genetic and geographic distance in human populations for a serial founder effect originating in Africa</article-title>. <source>Proc Natl Acad Sci U S A</source>. <year>2005</year>;<volume>102</volume>(<issue>44</issue>):<fpage>15942</fpage>–<lpage>15947</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1073/pnas.0507611102" xlink:type="simple">10.1073/pnas.0507611102</ext-link></comment></mixed-citation></ref>
<ref id="pgen.1009241.ref046"><label>46</label><mixed-citation publication-type="journal" xlink:type="simple"><collab>Consortium TGP</collab>. <article-title>A map of human genome variation from population-scale sequencing</article-title>. <source>Nature</source>. <year>2010</year>;<volume>467</volume>(<issue>7319</issue>):<fpage>1061</fpage>–<lpage>1073</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1038/nature09534" xlink:type="simple">10.1038/nature09534</ext-link></comment></mixed-citation></ref>
<ref id="pgen.1009241.ref047"><label>47</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Lazaridis</surname> <given-names>I</given-names></name>, <name name-style="western"><surname>Patterson</surname> <given-names>N</given-names></name>, <name name-style="western"><surname>Mittnik</surname> <given-names>A</given-names></name>, <name name-style="western"><surname>Renaud</surname> <given-names>G</given-names></name>, <name name-style="western"><surname>Mallick</surname> <given-names>S</given-names></name>, <name name-style="western"><surname>Kirsanow</surname> <given-names>K</given-names></name>, <etal>et al</etal>. <article-title>Ancient human genomes suggest three ancestral populations for present-day Europeans</article-title>. <source>Nature</source>. <year>2014</year>;<volume>513</volume>(<issue>7518</issue>):<fpage>409</fpage>–<lpage>413</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1038/nature13673" xlink:type="simple">10.1038/nature13673</ext-link></comment> <object-id pub-id-type="pmid">25230663</object-id></mixed-citation></ref>
<ref id="pgen.1009241.ref048"><label>48</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Lazaridis</surname> <given-names>I</given-names></name>, <name name-style="western"><surname>Nadel</surname> <given-names>D</given-names></name>, <name name-style="western"><surname>Rollefson</surname> <given-names>G</given-names></name>, <name name-style="western"><surname>Merrett</surname> <given-names>DC</given-names></name>, <name name-style="western"><surname>Rohland</surname> <given-names>N</given-names></name>, <name name-style="western"><surname>Mallick</surname> <given-names>S</given-names></name>, <etal>et al</etal>. <article-title>Genomic insights into the origin of farming in the ancient Near East</article-title>. <source>Nature</source>. <year>2016</year>;<volume>536</volume>(<issue>7617</issue>):<fpage>419</fpage>–<lpage>424</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1038/nature19310" xlink:type="simple">10.1038/nature19310</ext-link></comment> <object-id pub-id-type="pmid">27459054</object-id></mixed-citation></ref>
<ref id="pgen.1009241.ref049"><label>49</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Skoglund</surname> <given-names>P</given-names></name>, <name name-style="western"><surname>Posth</surname> <given-names>C</given-names></name>, <name name-style="western"><surname>Sirak</surname> <given-names>K</given-names></name>, <name name-style="western"><surname>Spriggs</surname> <given-names>M</given-names></name>, <name name-style="western"><surname>Valentin</surname> <given-names>F</given-names></name>, <name name-style="western"><surname>Bedford</surname> <given-names>S</given-names></name>, <etal>et al</etal>. <article-title>Genomic insights into the peopling of the Southwest Pacific</article-title>. <source>Nature</source>. <year>2016</year>;<volume>538</volume>(<issue>7626</issue>):<fpage>510</fpage>–<lpage>513</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1038/nature19844" xlink:type="simple">10.1038/nature19844</ext-link></comment> <object-id pub-id-type="pmid">27698418</object-id></mixed-citation></ref>
<ref id="pgen.1009241.ref050"><label>50</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Tishkoff</surname> <given-names>SA</given-names></name>, <name name-style="western"><surname>Reed</surname> <given-names>FA</given-names></name>, <name name-style="western"><surname>Friedlaender</surname> <given-names>FR</given-names></name>, <name name-style="western"><surname>Ehret</surname> <given-names>C</given-names></name>, <name name-style="western"><surname>Ranciaro</surname> <given-names>A</given-names></name>, <name name-style="western"><surname>Froment</surname> <given-names>A</given-names></name>, <etal>et al</etal>. <article-title>The Genetic Structure and History of Africans and African Americans</article-title>. <source>Science</source>. <year>2009</year>;<volume>324</volume>(<issue>5930</issue>):<fpage>1035</fpage>–<lpage>1044</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1126/science.1172257" xlink:type="simple">10.1126/science.1172257</ext-link></comment> <object-id pub-id-type="pmid">19407144</object-id></mixed-citation></ref>
<ref id="pgen.1009241.ref051"><label>51</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Moreno-Estrada</surname> <given-names>A</given-names></name>, <name name-style="western"><surname>Gravel</surname> <given-names>S</given-names></name>, <name name-style="western"><surname>Zakharia</surname> <given-names>F</given-names></name>, <name name-style="western"><surname>McCauley</surname> <given-names>JL</given-names></name>, <name name-style="western"><surname>Byrnes</surname> <given-names>JK</given-names></name>, <name name-style="western"><surname>Gignoux</surname> <given-names>CR</given-names></name>, <etal>et al</etal>. <article-title>Reconstructing the Population Genetic History of the Caribbean</article-title>. <source>PLOS Genetics</source>. <year>2013</year>;<volume>9</volume>(<issue>11</issue>):<fpage>e1003925</fpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1371/journal.pgen.1003925" xlink:type="simple">10.1371/journal.pgen.1003925</ext-link></comment> <object-id pub-id-type="pmid">24244192</object-id></mixed-citation></ref>
<ref id="pgen.1009241.ref052"><label>52</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Moreno-Estrada</surname> <given-names>A</given-names></name>, <name name-style="western"><surname>Gignoux</surname> <given-names>CR</given-names></name>, <name name-style="western"><surname>Fernández-López</surname> <given-names>JC</given-names></name>, <name name-style="western"><surname>Zakharia</surname> <given-names>F</given-names></name>, <name name-style="western"><surname>Sikora</surname> <given-names>M</given-names></name>, <name name-style="western"><surname>Contreras</surname> <given-names>AV</given-names></name>, <etal>et al</etal>. <article-title>The genetics of Mexico recapitulates Native American substructure and affects biomedical traits</article-title>. <source>Science</source>. <year>2014</year>;<volume>344</volume>(<issue>6189</issue>):<fpage>1280</fpage>–<lpage>1285</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1126/science.1251688" xlink:type="simple">10.1126/science.1251688</ext-link></comment> <object-id pub-id-type="pmid">24926019</object-id></mixed-citation></ref>
<ref id="pgen.1009241.ref053"><label>53</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Leslie</surname> <given-names>S</given-names></name>, <name name-style="western"><surname>Winney</surname> <given-names>B</given-names></name>, <name name-style="western"><surname>Hellenthal</surname> <given-names>G</given-names></name>, <name name-style="western"><surname>Davison</surname> <given-names>D</given-names></name>, <name name-style="western"><surname>Boumertit</surname> <given-names>A</given-names></name>, <name name-style="western"><surname>Day</surname> <given-names>T</given-names></name>, <etal>et al</etal>. <article-title>The fine-scale genetic structure of the British population</article-title>. <source>Nature</source>. <year>2015</year>;<volume>519</volume>(<issue>7543</issue>):<fpage>309</fpage>–<lpage>314</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1038/nature14230" xlink:type="simple">10.1038/nature14230</ext-link></comment> <object-id pub-id-type="pmid">25788095</object-id></mixed-citation></ref>
<ref id="pgen.1009241.ref054"><label>54</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Baharian</surname> <given-names>S</given-names></name>, <name name-style="western"><surname>Barakatt</surname> <given-names>M</given-names></name>, <name name-style="western"><surname>Gignoux</surname> <given-names>CR</given-names></name>, <name name-style="western"><surname>Shringarpure</surname> <given-names>S</given-names></name>, <name name-style="western"><surname>Errington</surname> <given-names>J</given-names></name>, <name name-style="western"><surname>Blot</surname> <given-names>WJ</given-names></name>, <etal>et al</etal>. <article-title>The Great Migration and African-American Genomic Diversity</article-title>. <source>PLoS Genet</source>. <year>2016</year>;<volume>12</volume>(<issue>5</issue>):<fpage>e1006059</fpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1371/journal.pgen.1006059" xlink:type="simple">10.1371/journal.pgen.1006059</ext-link></comment> <object-id pub-id-type="pmid">27232753</object-id></mixed-citation></ref>
<ref id="pgen.1009241.ref055"><label>55</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Haak</surname> <given-names>W</given-names></name>, <name name-style="western"><surname>Lazaridis</surname> <given-names>I</given-names></name>, <name name-style="western"><surname>Patterson</surname> <given-names>N</given-names></name>, <name name-style="western"><surname>Rohland</surname> <given-names>N</given-names></name>, <name name-style="western"><surname>Mallick</surname> <given-names>S</given-names></name>, <name name-style="western"><surname>Llamas</surname> <given-names>B</given-names></name>, <etal>et al</etal>. <article-title>Massive migration from the steppe was a source for Indo-European languages in Europe</article-title>. <source>Nature</source>. <year>2015</year>;<volume>522</volume>(<issue>7555</issue>):<fpage>207</fpage>–<lpage>211</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1038/nature14317" xlink:type="simple">10.1038/nature14317</ext-link></comment> <object-id pub-id-type="pmid">25731166</object-id></mixed-citation></ref>
<ref id="pgen.1009241.ref056"><label>56</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Allentoft</surname> <given-names>ME</given-names></name>, <name name-style="western"><surname>Sikora</surname> <given-names>M</given-names></name>, <name name-style="western"><surname>Sjögren</surname> <given-names>KG</given-names></name>, <name name-style="western"><surname>Rasmussen</surname> <given-names>S</given-names></name>, <name name-style="western"><surname>Rasmussen</surname> <given-names>M</given-names></name>, <name name-style="western"><surname>Stenderup</surname> <given-names>J</given-names></name>, <etal>et al</etal>. <article-title>Population genomics of Bronze Age Eurasia</article-title>. <source>Nature</source>. <year>2015</year>;<volume>522</volume>(<issue>7555</issue>):<fpage>167</fpage>–<lpage>172</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1038/nature14507" xlink:type="simple">10.1038/nature14507</ext-link></comment> <object-id pub-id-type="pmid">26062507</object-id></mixed-citation></ref>
<ref id="pgen.1009241.ref057"><label>57</label><mixed-citation publication-type="other" xlink:type="simple">Ochoa A, Storey JD. <italic>F</italic><sub>ST</sub> and kinship for arbitrary population structures I: Generalized definitions. bioRxiv. 2016; <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1101/083915" xlink:type="simple">10.1101/083915</ext-link></comment></mixed-citation></ref>
<ref id="pgen.1009241.ref058"><label>58</label><mixed-citation publication-type="other" xlink:type="simple">Ochoa A, Storey JD. <italic>F</italic><sub>ST</sub> and kinship for arbitrary population structures II: Method of moments estimators. bioRxiv. 2016; <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1101/083923" xlink:type="simple">10.1101/083923</ext-link></comment></mixed-citation></ref>
<ref id="pgen.1009241.ref059"><label>59</label><mixed-citation publication-type="other" xlink:type="simple">Ochoa A, Storey JD. New kinship and <italic>F</italic><sub>ST</sub> estimates reveal higher levels of differentiation in the global human population. bioRxiv. 2019; <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1101/653279" xlink:type="simple">10.1101/653279</ext-link></comment></mixed-citation></ref>
<ref id="pgen.1009241.ref060"><label>60</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Thornton</surname> <given-names>T</given-names></name>, <name name-style="western"><surname>Tang</surname> <given-names>H</given-names></name>, <name name-style="western"><surname>Hoffmann</surname> <given-names>TJ</given-names></name>, <name name-style="western"><surname>Ochs-Balcom</surname> <given-names>HM</given-names></name>, <name name-style="western"><surname>Caan</surname> <given-names>BJ</given-names></name>, <name name-style="western"><surname>Risch</surname> <given-names>N</given-names></name>. <article-title>Estimating kinship in admixed populations</article-title>. <source>Am J Hum Genet</source>. <year>2012</year>;<volume>91</volume>(<issue>1</issue>):<fpage>122</fpage>–<lpage>138</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1016/j.ajhg.2012.05.024" xlink:type="simple">10.1016/j.ajhg.2012.05.024</ext-link></comment></mixed-citation></ref>
<ref id="pgen.1009241.ref061"><label>61</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Hao</surname> <given-names>W</given-names></name>, <name name-style="western"><surname>Song</surname> <given-names>M</given-names></name>, <name name-style="western"><surname>Storey</surname> <given-names>JD</given-names></name>. <article-title>Probabilistic models of genetic variation in structured populations applied to global human studies</article-title>. <source>Bioinformatics</source>. <year>2016</year>;<volume>32</volume>(<issue>5</issue>):<fpage>713</fpage>–<lpage>721</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1093/bioinformatics/btv641" xlink:type="simple">10.1093/bioinformatics/btv641</ext-link></comment></mixed-citation></ref>
<ref id="pgen.1009241.ref062"><label>62</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Zheng</surname> <given-names>X</given-names></name>, <name name-style="western"><surname>Weir</surname> <given-names>BS</given-names></name>. <article-title>Eigenanalysis of SNP data with an identity by descent interpretation</article-title>. <source>Theoretical Population Biology</source>. <year>2016</year>;<volume>107</volume>:<fpage>65</fpage>–<lpage>76</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1016/j.tpb.2015.09.004" xlink:type="simple">10.1016/j.tpb.2015.09.004</ext-link></comment></mixed-citation></ref>
<ref id="pgen.1009241.ref063"><label>63</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Pritchard</surname> <given-names>JK</given-names></name>, <name name-style="western"><surname>Stephens</surname> <given-names>M</given-names></name>, <name name-style="western"><surname>Donnelly</surname> <given-names>P</given-names></name>. <article-title>Inference of population structure using multilocus genotype data</article-title>. <source>Genetics</source>. <year>2000</year>;<volume>155</volume>(<issue>2</issue>):<fpage>945</fpage>–<lpage>959</lpage>.</mixed-citation></ref>
<ref id="pgen.1009241.ref064"><label>64</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Tang</surname> <given-names>H</given-names></name>, <name name-style="western"><surname>Peng</surname> <given-names>J</given-names></name>, <name name-style="western"><surname>Wang</surname> <given-names>P</given-names></name>, <name name-style="western"><surname>Risch</surname> <given-names>NJ</given-names></name>. <article-title>Estimation of individual admixture: analytical and study design considerations</article-title>. <source>Genet Epidemiol</source>. <year>2005</year>;<volume>28</volume>(<issue>4</issue>):<fpage>289</fpage>–<lpage>301</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1002/gepi.20064" xlink:type="simple">10.1002/gepi.20064</ext-link></comment></mixed-citation></ref>
<ref id="pgen.1009241.ref065"><label>65</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Alexander</surname> <given-names>DH</given-names></name>, <name name-style="western"><surname>Novembre</surname> <given-names>J</given-names></name>, <name name-style="western"><surname>Lange</surname> <given-names>K</given-names></name>. <article-title>Fast model-based estimation of ancestry in unrelated individuals</article-title>. <source>Genome Res</source>. <year>2009</year>;<volume>19</volume>(<issue>9</issue>):<fpage>1655</fpage>–<lpage>1664</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1101/gr.094052.109" xlink:type="simple">10.1101/gr.094052.109</ext-link></comment></mixed-citation></ref>
<ref id="pgen.1009241.ref066"><label>66</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Browning</surname> <given-names>BL</given-names></name>, <name name-style="western"><surname>Browning</surname> <given-names>SR</given-names></name>. <article-title>A Fast, Powerful Method for Detecting Identity by Descent</article-title>. <source>The American Journal of Human Genetics</source>. <year>2011</year>;<volume>88</volume>(<issue>2</issue>):<fpage>173</fpage>–<lpage>182</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1016/j.ajhg.2011.01.010" xlink:type="simple">10.1016/j.ajhg.2011.01.010</ext-link></comment></mixed-citation></ref>
<ref id="pgen.1009241.ref067"><label>67</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Gazal</surname> <given-names>S</given-names></name>, <name name-style="western"><surname>Sahbatou</surname> <given-names>M</given-names></name>, <name name-style="western"><surname>Perdry</surname> <given-names>H</given-names></name>, <name name-style="western"><surname>Letort</surname> <given-names>S</given-names></name>, <name name-style="western"><surname>Génin</surname> <given-names>E</given-names></name>, <name name-style="western"><surname>Leutenegger</surname> <given-names>AL</given-names></name>. <article-title>Inbreeding Coefficient Estimation with Dense SNP Data: Comparison of Strategies and Application to HapMap III</article-title>. <source>HHE</source>. <year>2014</year>;<volume>77</volume>(<issue>1-4</issue>):<fpage>49</fpage>–<lpage>62</lpage>.</mixed-citation></ref>
<ref id="pgen.1009241.ref068"><label>68</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Joshi</surname> <given-names>PK</given-names></name>, <name name-style="western"><surname>Esko</surname> <given-names>T</given-names></name>, <name name-style="western"><surname>Mattsson</surname> <given-names>H</given-names></name>, <name name-style="western"><surname>Eklund</surname> <given-names>N</given-names></name>, <name name-style="western"><surname>Gandin</surname> <given-names>I</given-names></name>, <name name-style="western"><surname>Nutile</surname> <given-names>T</given-names></name>, <etal>et al</etal>. <article-title>Directional dominance on stature and cognition in diverse human populations</article-title>. <source>Nature</source>. <year>2015</year>;<volume>523</volume>(<issue>7561</issue>):<fpage>459</fpage>–<lpage>462</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1038/nature14618" xlink:type="simple">10.1038/nature14618</ext-link></comment> <object-id pub-id-type="pmid">26131930</object-id></mixed-citation></ref>
<ref id="pgen.1009241.ref069"><label>69</label><mixed-citation publication-type="book" xlink:type="simple"><name name-style="western"><surname>Cochran</surname> <given-names>WG</given-names></name>. <source>Sampling techniques</source>. <edition designator="3">3rd ed</edition>. <publisher-name>Wiley</publisher-name>; <year>1977</year>.</mixed-citation></ref>
<ref id="pgen.1009241.ref070"><label>70</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Reynolds</surname> <given-names>J</given-names></name>, <name name-style="western"><surname>Weir</surname> <given-names>BS</given-names></name>, <name name-style="western"><surname>Cockerham</surname> <given-names>CC</given-names></name>. <article-title>Estimation of the Coancestry Coefficient: Basis for a Short-Term Genetic Distance</article-title>. <source>Genetics</source>. <year>1983</year>;<volume>105</volume>(<issue>3</issue>):<fpage>767</fpage>–<lpage>779</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1093/genetics/105.3.767" xlink:type="simple">10.1093/genetics/105.3.767</ext-link></comment></mixed-citation></ref>
<ref id="pgen.1009241.ref071"><label>71</label><mixed-citation publication-type="book" xlink:type="simple"><name name-style="western"><surname>Weir</surname> <given-names>BS</given-names></name>. <chapter-title>Genetic data analysis II</chapter-title>. <source>Methods for discrete population genetic data</source>. <publisher-loc>Sunderland, USA</publisher-loc>: <publisher-name>Sinauer Associates</publisher-name>; <year>1996</year>.</mixed-citation></ref>
<ref id="pgen.1009241.ref072"><label>72</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Bourgain</surname> <given-names>C</given-names></name>, <name name-style="western"><surname>Hoffjan</surname> <given-names>S</given-names></name>, <name name-style="western"><surname>Nicolae</surname> <given-names>R</given-names></name>, <name name-style="western"><surname>Newman</surname> <given-names>D</given-names></name>, <name name-style="western"><surname>Steiner</surname> <given-names>L</given-names></name>, <name name-style="western"><surname>Walker</surname> <given-names>K</given-names></name>, <etal>et al</etal>. <article-title>Novel case-control test in a founder population identifies P-selectin as an atopy-susceptibility locus</article-title>. <source>Am J Hum Genet</source>. <year>2003</year>;<volume>73</volume>(<issue>3</issue>):<fpage>612</fpage>–<lpage>626</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1086/378208" xlink:type="simple">10.1086/378208</ext-link></comment> <object-id pub-id-type="pmid">12929084</object-id></mixed-citation></ref>
<ref id="pgen.1009241.ref073"><label>73</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Choi</surname> <given-names>Y</given-names></name>, <name name-style="western"><surname>Wijsman</surname> <given-names>EM</given-names></name>, <name name-style="western"><surname>Weir</surname> <given-names>BS</given-names></name>. <article-title>Case-Control Association Testing in the Presence of Unknown Relationships</article-title>. <source>Genet Epidemiol</source>. <year>2009</year>;<volume>33</volume>(<issue>8</issue>):<fpage>668</fpage>–<lpage>678</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1002/gepi.20418" xlink:type="simple">10.1002/gepi.20418</ext-link></comment></mixed-citation></ref>
<ref id="pgen.1009241.ref074"><label>74</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Pickrell</surname> <given-names>JK</given-names></name>, <name name-style="western"><surname>Pritchard</surname> <given-names>JK</given-names></name>. <article-title>Inference of population splits and mixtures from genome-wide allele frequency data</article-title>. <source>PLoS Genet</source>. <year>2012</year>;<volume>8</volume>(<issue>11</issue>):<fpage>e1002967</fpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1371/journal.pgen.1002967" xlink:type="simple">10.1371/journal.pgen.1002967</ext-link></comment></mixed-citation></ref>
<ref id="pgen.1009241.ref075"><label>75</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Nei</surname> <given-names>M</given-names></name>. <article-title>Analysis of Gene Diversity in Subdivided Populations</article-title>. <source>PNAS</source>. <year>1973</year>;<volume>70</volume>(<issue>12</issue>):<fpage>3321</fpage>–<lpage>3323</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1073/pnas.70.12.3321" xlink:type="simple">10.1073/pnas.70.12.3321</ext-link></comment></mixed-citation></ref>
<ref id="pgen.1009241.ref076"><label>76</label><mixed-citation publication-type="other" xlink:type="simple">Weir BS, Goudet J. A unified characterization of population structure and relatedness. bioRxiv. 2016; p. 088260.</mixed-citation></ref>
<ref id="pgen.1009241.ref077"><label>77</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Raj</surname> <given-names>A</given-names></name>, <name name-style="western"><surname>Stephens</surname> <given-names>M</given-names></name>, <name name-style="western"><surname>Pritchard</surname> <given-names>JK</given-names></name>. <article-title>fastSTRUCTURE: variational inference of population structure in large SNP data sets</article-title>. <source>Genetics</source>. <year>2014</year>;<volume>197</volume>(<issue>2</issue>):<fpage>573</fpage>–<lpage>589</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1534/genetics.114.164350" xlink:type="simple">10.1534/genetics.114.164350</ext-link></comment></mixed-citation></ref>
<ref id="pgen.1009241.ref078"><label>78</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Nelis</surname> <given-names>M</given-names></name>, <name name-style="western"><surname>Esko</surname> <given-names>T</given-names></name>, <name name-style="western"><surname>Mägi</surname> <given-names>R</given-names></name>, <name name-style="western"><surname>Zimprich</surname> <given-names>F</given-names></name>, <name name-style="western"><surname>Zimprich</surname> <given-names>A</given-names></name>, <name name-style="western"><surname>Toncheva</surname> <given-names>D</given-names></name>, <etal>et al</etal>. <article-title>Genetic Structure of Europeans: A View from the North–East</article-title>. <source>PLOS ONE</source>. <year>2009</year>;<volume>4</volume>(<issue>5</issue>):<fpage>e5472</fpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1371/journal.pone.0005472" xlink:type="simple">10.1371/journal.pone.0005472</ext-link></comment> <object-id pub-id-type="pmid">19424496</object-id></mixed-citation></ref>
<ref id="pgen.1009241.ref079"><label>78</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Silva</surname> <given-names>NM</given-names></name>, <name name-style="western"><surname>Pereira</surname> <given-names>L</given-names></name>, <name name-style="western"><surname>Poloni</surname> <given-names>ES</given-names></name>, <name name-style="western"><surname>Currat</surname> <given-names>M</given-names></name>. <article-title>Human Neutral Genetic Variation and Forensic STR Data</article-title>. <source>PLOS ONE</source>. <year>2012</year>;<volume>7</volume>(<issue>11</issue>):<fpage>e49666</fpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1371/journal.pone.0049666" xlink:type="simple">10.1371/journal.pone.0049666</ext-link></comment></mixed-citation></ref>
<ref id="pgen.1009241.ref080"><label>80</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Steele</surname> <given-names>CD</given-names></name>, <name name-style="western"><surname>Court</surname> <given-names>DS</given-names></name>, <name name-style="western"><surname>Balding</surname> <given-names>DJ</given-names></name>. <article-title>Worldwide FST Estimates Relative to Five Continental-Scale Populations</article-title>. <source>Annals of Human Genetics</source>. <year>2014</year>;<volume>78</volume>(<issue>6</issue>):<fpage>468</fpage>–<lpage>477</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1111/ahg.12081" xlink:type="simple">10.1111/ahg.12081</ext-link></comment></mixed-citation></ref>
<ref id="pgen.1009241.ref081"><label>81</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Cavalli-Sforza</surname> <given-names>LL</given-names></name>. <article-title>Population Structure and Human Evolution</article-title>. <source>Proceedings of the Royal Society of London Series B, Biological Sciences</source>. <year>1966</year>;<volume>164</volume>(<issue>995</issue>):<fpage>362</fpage>–<lpage>379</lpage>.</mixed-citation></ref>
<ref id="pgen.1009241.ref082"><label>82</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Lewontin</surname> <given-names>RC</given-names></name>, <name name-style="western"><surname>Krakauer</surname> <given-names>J</given-names></name>. <article-title>Distribution of Gene Frequency as a Test of the Theory of the Selective Neutrality of Polymorphisms</article-title>. <source>Genetics</source>. <year>1973</year>;<volume>74</volume>(<issue>1</issue>):<fpage>175</fpage>–<lpage>195</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1093/genetics/74.1.175" xlink:type="simple">10.1093/genetics/74.1.175</ext-link></comment></mixed-citation></ref>
<ref id="pgen.1009241.ref083"><label>83</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Beaumont</surname> <given-names>MA</given-names></name>, <name name-style="western"><surname>Nichols</surname> <given-names>RA</given-names></name>. <article-title>Evaluating Loci for Use in the Genetic Analysis of Population Structure</article-title>. <source>Proceedings of the Royal Society of London B: Biological Sciences</source>. <year>1996</year>;<volume>263</volume>(<issue>1377</issue>):<fpage>1619</fpage>–<lpage>1626</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1098/rspb.1996.0237" xlink:type="simple">10.1098/rspb.1996.0237</ext-link></comment></mixed-citation></ref>
<ref id="pgen.1009241.ref084"><label>84</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Vitalis</surname> <given-names>R</given-names></name>, <name name-style="western"><surname>Dawson</surname> <given-names>K</given-names></name>, <name name-style="western"><surname>Boursot</surname> <given-names>P</given-names></name>. <article-title>Interpretation of Variation Across Marker Loci as Evidence of Selection</article-title>. <source>Genetics</source>. <year>2001</year>;<volume>158</volume>(<issue>4</issue>):<fpage>1811</fpage>–<lpage>1823</lpage>.</mixed-citation></ref>
<ref id="pgen.1009241.ref085"><label>85</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Akey</surname> <given-names>JM</given-names></name>, <name name-style="western"><surname>Zhang</surname> <given-names>G</given-names></name>, <name name-style="western"><surname>Zhang</surname> <given-names>K</given-names></name>, <name name-style="western"><surname>Jin</surname> <given-names>L</given-names></name>, <name name-style="western"><surname>Shriver</surname> <given-names>MD</given-names></name>. <article-title>Interrogating a high-density SNP map for signatures of natural selection</article-title>. <source>Genome Res</source>. <year>2002</year>;<volume>12</volume>(<issue>12</issue>):<fpage>1805</fpage>–<lpage>1814</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1101/gr.631202" xlink:type="simple">10.1101/gr.631202</ext-link></comment></mixed-citation></ref>
<ref id="pgen.1009241.ref086"><label>86</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Porter</surname> <given-names>AH</given-names></name>. <article-title>A test for deviation from island-model population structure</article-title>. <source>Molecular Ecology</source>. <year>2003</year>;<volume>12</volume>(<issue>4</issue>):<fpage>903</fpage>–<lpage>915</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1046/j.1365-294X.2003.01783.x" xlink:type="simple">10.1046/j.1365-294X.2003.01783.x</ext-link></comment></mixed-citation></ref>
<ref id="pgen.1009241.ref087"><label>87</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Bowcock</surname> <given-names>AM</given-names></name>, <name name-style="western"><surname>Kidd</surname> <given-names>JR</given-names></name>, <name name-style="western"><surname>Mountain</surname> <given-names>JL</given-names></name>, <name name-style="western"><surname>Hebert</surname> <given-names>JM</given-names></name>, <name name-style="western"><surname>Carotenuto</surname> <given-names>L</given-names></name>, <name name-style="western"><surname>Kidd</surname> <given-names>KK</given-names></name>, <etal>et al</etal>. <article-title>Drift, admixture, and selection in human evolution: a study with DNA polymorphisms</article-title>. <source>PNAS</source>. <year>1991</year>;<volume>88</volume>(<issue>3</issue>):<fpage>839</fpage>–<lpage>843</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1073/pnas.88.3.839" xlink:type="simple">10.1073/pnas.88.3.839</ext-link></comment> <object-id pub-id-type="pmid">1992475</object-id></mixed-citation></ref>
<ref id="pgen.1009241.ref088"><label>88</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Hedrick</surname> <given-names>PW</given-names></name>. <article-title>A Standardized Genetic Differentiation Measure</article-title>. <source>Evolution</source>. <year>2005</year>;<volume>59</volume>(<issue>8</issue>):<fpage>1633</fpage>–<lpage>1638</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1111/j.0014-3820.2005.tb01814.x" xlink:type="simple">10.1111/j.0014-3820.2005.tb01814.x</ext-link></comment></mixed-citation></ref>
<ref id="pgen.1009241.ref089"><label>89</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Jakobsson</surname> <given-names>M</given-names></name>, <name name-style="western"><surname>Edge</surname> <given-names>MD</given-names></name>, <name name-style="western"><surname>Rosenberg</surname> <given-names>NA</given-names></name>. <article-title>The Relationship Between FST and the Frequency of the Most Frequent Allele</article-title>. <source>Genetics</source>. <year>2013</year>;<volume>193</volume>(<issue>2</issue>):<fpage>515</fpage>–<lpage>528</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1534/genetics.112.144758" xlink:type="simple">10.1534/genetics.112.144758</ext-link></comment></mixed-citation></ref>
<ref id="pgen.1009241.ref090"><label>90</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Edge</surname> <given-names>MD</given-names></name>, <name name-style="western"><surname>Rosenberg</surname> <given-names>NA</given-names></name>. <article-title>Upper bounds on FST in terms of the frequency of the most frequent allele and total homozygosity: the case of a specified number of alleles</article-title>. <source>Theor Popul Biol</source>. <year>2014</year>;<volume>97</volume>:<fpage>20</fpage>–<lpage>34</lpage>.</mixed-citation></ref>
<ref id="pgen.1009241.ref091"><label>91</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Lewontin</surname> <given-names>RC</given-names></name>. <article-title>The Apportionment of Human Diversity</article-title>. <source>Evolutionary Biology</source>. <year>1972</year>;<volume>6</volume>:<fpage>381</fpage>–<lpage>398</lpage>.</mixed-citation></ref>
<ref id="pgen.1009241.ref092"><label>92</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Barbujani</surname> <given-names>G</given-names></name>, <name name-style="western"><surname>Magagni</surname> <given-names>A</given-names></name>, <name name-style="western"><surname>Minch</surname> <given-names>E</given-names></name>, <name name-style="western"><surname>Cavalli-Sforza</surname> <given-names>LL</given-names></name>. <article-title>An apportionment of human DNA diversity</article-title>. <source>PNAS</source>. <year>1997</year>;<volume>94</volume>(<issue>9</issue>):<fpage>4516</fpage>–<lpage>4519</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1073/pnas.94.9.4516" xlink:type="simple">10.1073/pnas.94.9.4516</ext-link></comment></mixed-citation></ref>
<ref id="pgen.1009241.ref093"><label>93</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Novembre</surname> <given-names>J</given-names></name>, <name name-style="western"><surname>Johnson</surname> <given-names>T</given-names></name>, <name name-style="western"><surname>Bryc</surname> <given-names>K</given-names></name>, <name name-style="western"><surname>Kutalik</surname> <given-names>Z</given-names></name>, <name name-style="western"><surname>Boyko</surname> <given-names>AR</given-names></name>, <name name-style="western"><surname>Auton</surname> <given-names>A</given-names></name>, <etal>et al</etal>. <article-title>Genes mirror geography within Europe</article-title>. <source>Nature</source>. <year>2008</year>;<volume>456</volume>(<issue>7218</issue>):<fpage>98</fpage>–<lpage>101</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1038/nature07331" xlink:type="simple">10.1038/nature07331</ext-link></comment> <object-id pub-id-type="pmid">18758442</object-id></mixed-citation></ref>
<ref id="pgen.1009241.ref094"><label>94</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Coop</surname> <given-names>G</given-names></name>, <name name-style="western"><surname>Pickrell</surname> <given-names>JK</given-names></name>, <name name-style="western"><surname>Novembre</surname> <given-names>J</given-names></name>, <name name-style="western"><surname>Kudaravalli</surname> <given-names>S</given-names></name>, <name name-style="western"><surname>Li</surname> <given-names>J</given-names></name>, <name name-style="western"><surname>Absher</surname> <given-names>D</given-names></name>, <etal>et al</etal>. <article-title>The Role of Geography in Human Adaptation</article-title>. <source>PLoS Genet</source>. <year>2009</year>;<volume>5</volume>(<issue>6</issue>):<fpage>e1000500</fpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1371/journal.pgen.1000500" xlink:type="simple">10.1371/journal.pgen.1000500</ext-link></comment> <object-id pub-id-type="pmid">19503611</object-id></mixed-citation></ref>
<ref id="pgen.1009241.ref095"><label>95</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Patterson</surname> <given-names>N</given-names></name>, <name name-style="western"><surname>Moorjani</surname> <given-names>P</given-names></name>, <name name-style="western"><surname>Luo</surname> <given-names>Y</given-names></name>, <name name-style="western"><surname>Mallick</surname> <given-names>S</given-names></name>, <name name-style="western"><surname>Rohland</surname> <given-names>N</given-names></name>, <name name-style="western"><surname>Zhan</surname> <given-names>Y</given-names></name>, <etal>et al</etal>. <article-title>Ancient admixture in human history</article-title>. <source>Genetics</source>. <year>2012</year>;<volume>192</volume>(<issue>3</issue>):<fpage>1065</fpage>–<lpage>1093</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1534/genetics.112.145037" xlink:type="simple">10.1534/genetics.112.145037</ext-link></comment> <object-id pub-id-type="pmid">22960212</object-id></mixed-citation></ref>
<ref id="pgen.1009241.ref096"><label>96</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Beran</surname> <given-names>R</given-names></name>, <name name-style="western"><surname>Hall</surname> <given-names>P</given-names></name>. <article-title>Interpolated Nonparametric Prediction Intervals and Confidence Intervals</article-title>. <source>Journal of the Royal Statistical Society Series B (Methodological)</source>. <year>1993</year>;<volume>55</volume>(<issue>3</issue>):<fpage>643</fpage>–<lpage>652</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1111/j.2517-6161.1993.tb01929.x" xlink:type="simple">10.1111/j.2517-6161.1993.tb01929.x</ext-link></comment></mixed-citation></ref>
</ref-list>
</back>
</article>