<?xml version="1.0" encoding="utf-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD v1.1d3 20150301//EN" "http://jats.nlm.nih.gov/publishing/1.1d3/JATS-journalpublishing1.dtd">
<article article-type="research-article" dtd-version="1.1d3" xml:lang="en" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink">
<front>
<journal-meta>
<journal-id journal-id-type="nlm-ta">PLoS Comput Biol</journal-id>
<journal-id journal-id-type="publisher-id">plos</journal-id>
<journal-id journal-id-type="pmc">ploscomp</journal-id>
<journal-title-group>
<journal-title>PLOS Computational Biology</journal-title>
</journal-title-group>
<issn pub-type="ppub">1553-734X</issn>
<issn pub-type="epub">1553-7358</issn>
<publisher>
<publisher-name>Public Library of Science</publisher-name>
<publisher-loc>San Francisco, CA USA</publisher-loc>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="publisher-id">PCOMPBIOL-D-18-02024</article-id>
<article-id pub-id-type="doi">10.1371/journal.pcbi.1007177</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Research Article</subject>
</subj-group>
<subj-group subj-group-type="Discipline-v3"><subject>Biology and life sciences</subject><subj-group><subject>Population biology</subject><subj-group><subject>Population metrics</subject><subj-group><subject>Population size</subject></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3"><subject>Biology and life sciences</subject><subj-group><subject>Genetics</subject><subj-group><subject>Phenotypes</subject></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3"><subject>Biology and life sciences</subject><subj-group><subject>Biochemistry</subject><subj-group><subject>Proteins</subject><subj-group><subject>DNA-binding proteins</subject><subj-group><subject>Transcription factors</subject></subj-group></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3"><subject>Biology and life sciences</subject><subj-group><subject>Genetics</subject><subj-group><subject>Gene expression</subject><subj-group><subject>Gene regulation</subject><subj-group><subject>Transcription factors</subject></subj-group></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3"><subject>Biology and life sciences</subject><subj-group><subject>Biochemistry</subject><subj-group><subject>Proteins</subject><subj-group><subject>Regulatory proteins</subject><subj-group><subject>Transcription factors</subject></subj-group></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3"><subject>Biology and life sciences</subject><subj-group><subject>Biochemistry</subject><subj-group><subject>Proteins</subject><subj-group><subject>DNA-binding proteins</subject></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3"><subject>Biology and life sciences</subject><subj-group><subject>Genetics</subject><subj-group><subject>Gene expression</subject><subj-group><subject>DNA transcription</subject></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3"><subject>Biology and life sciences</subject><subj-group><subject>Developmental biology</subject><subj-group><subject>Molecular development</subject><subj-group><subject>Morphogens</subject></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3"><subject>Physical sciences</subject><subj-group><subject>Physics</subject><subj-group><subject>Thermodynamics</subject><subj-group><subject>Entropy</subject></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3"><subject>Biology and life sciences</subject><subj-group><subject>Evolutionary biology</subject><subj-group><subject>Evolutionary processes</subject><subj-group><subject>Speciation</subject></subj-group></subj-group></subj-group></subj-group></article-categories>
<title-group>
<article-title>Biophysics and population size constrains speciation in an evolutionary model of developmental system drift</article-title>
<alt-title alt-title-type="running-head">Biophysics and population size constrains speciation</alt-title>
</title-group>
<contrib-group>
<contrib contrib-type="author" corresp="yes" xlink:type="simple">
<contrib-id authenticated="true" contrib-id-type="orcid">http://orcid.org/0000-0002-0312-336X</contrib-id>
<name name-style="western">
<surname>Khatri</surname> <given-names>Bhavin S.</given-names></name>
<role content-type="http://credit.casrai.org/">Conceptualization</role>
<role content-type="http://credit.casrai.org/">Formal analysis</role>
<role content-type="http://credit.casrai.org/">Investigation</role>
<role content-type="http://credit.casrai.org/">Methodology</role>
<role content-type="http://credit.casrai.org/">Software</role>
<role content-type="http://credit.casrai.org/">Validation</role>
<role content-type="http://credit.casrai.org/">Visualization</role>
<role content-type="http://credit.casrai.org/">Writing – original draft</role>
<role content-type="http://credit.casrai.org/">Writing – review &amp; editing</role>
<xref ref-type="aff" rid="aff001"><sup>1</sup></xref>
<xref ref-type="fn" rid="currentaff001"><sup>¤</sup></xref>
<xref ref-type="corresp" rid="cor001">*</xref>
</contrib>
<contrib contrib-type="author" xlink:type="simple">
<name name-style="western">
<surname>Goldstein</surname> <given-names>Richard A.</given-names></name>
<role content-type="http://credit.casrai.org/">Conceptualization</role>
<role content-type="http://credit.casrai.org/">Funding acquisition</role>
<role content-type="http://credit.casrai.org/">Methodology</role>
<role content-type="http://credit.casrai.org/">Supervision</role>
<role content-type="http://credit.casrai.org/">Writing – review &amp; editing</role>
<xref ref-type="aff" rid="aff002"><sup>2</sup></xref>
</contrib>
</contrib-group>
<aff id="aff001">
<label>1</label>
<addr-line>The Francis Crick Institute, London, United Kingdom</addr-line>
</aff>
<aff id="aff002">
<label>2</label>
<addr-line>Division of Infection &amp; Immunity, University College London, London, United Kingdom</addr-line>
</aff>
<contrib-group>
<contrib contrib-type="editor" xlink:type="simple">
<name name-style="western">
<surname>Mustonen</surname> <given-names>Ville</given-names></name>
<role>Editor</role>
<xref ref-type="aff" rid="edit1"/>
</contrib>
</contrib-group>
<aff id="edit1">
<addr-line>University of Helsinki, FINLAND</addr-line>
</aff>
<author-notes>
<fn fn-type="conflict" id="coi001">
<p>The authors have declared that no competing interests exist.</p>
</fn>
<fn fn-type="current-aff" id="currentaff001">
<label>¤</label>
<p>Current address: Department of Life Sciences, Imperial College London, Silwood Park, Ascot, United Kingdom</p>
</fn>
<corresp id="cor001">* E-mail: <email xlink:type="simple">bhavin.khatri@physics.org</email></corresp>
</author-notes>
<pub-date pub-type="collection">
<month>7</month>
<year>2019</year>
</pub-date>
<pub-date pub-type="epub">
<day>23</day>
<month>7</month>
<year>2019</year>
</pub-date>
<volume>15</volume>
<issue>7</issue>
<elocation-id>e1007177</elocation-id>
<history>
<date date-type="received">
<day>30</day>
<month>11</month>
<year>2018</year>
</date>
<date date-type="accepted">
<day>13</day>
<month>6</month>
<year>2019</year>
</date>
</history>
<permissions>
<copyright-year>2019</copyright-year>
<copyright-holder>Khatri, Goldstein</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/" xlink:type="simple">
<license-p>This is an open access article distributed under the terms of the <ext-link ext-link-type="uri" xlink:href="http://creativecommons.org/licenses/by/4.0/" xlink:type="simple">Creative Commons Attribution License</ext-link>, which permits unrestricted use, distribution, and reproduction in any medium, provided the original author and source are credited.</license-p>
</license>
</permissions>
<self-uri content-type="pdf" xlink:href="info:doi/10.1371/journal.pcbi.1007177"/>
<abstract>
<p>Developmental system drift is a likely mechanism for the origin of hybrid incompatibilities between closely related species. We examine here the detailed mechanistic basis of hybrid incompatibilities between two allopatric lineages, for a genotype-phenotype map of developmental system drift under stabilising selection, where an organismal phenotype is conserved, but the underlying molecular phenotypes and genotype can drift. This leads to number of emergent phenomenon not obtainable by modelling genotype or phenotype alone. Our results show that: 1) speciation is more rapid at smaller population sizes with a characteristic, Orr-like, power law, but at large population sizes slow, characterised by a sub-diffusive growth law; 2) the molecular phenotypes under weakest selection contribute to the earliest incompatibilities; and 3) pair-wise incompatibilities dominate over higher order, contrary to previous predictions that the latter should dominate. The population size effect we find is consistent with previous results on allopatric divergence of transcription factor-DNA binding, where smaller populations have common ancestors with a larger drift load because genetic drift favours phenotypes which have a larger number of genotypes (higher sequence entropy) over more fit phenotypes which have far fewer genotypes; this means less substitutions are required in either lineage before incompatibilities arise. Overall, our results indicate that biophysics and population size provide a much stronger constraint to speciation than suggested by previous models, and point to a general mechanistic principle of how incompatibilities arise the under stabilising selection for an organismal phenotype.</p>
</abstract>
<abstract abstract-type="summary">
<title>Author summary</title>
<p>The process of speciation is of fundamental importance to the field of evolution as it is intimately connected to understanding the immense bio-diversity of life. There is still relatively little understanding of the underlying genetic mechanisms that give rise to hybrid incompatibilities with results suggesting that divergence in transcription factor DNA binding and gene expression play an important role. A key finding from the field of evo-devo is that organismal phenotypes show developmental system drift, where species maintain the same phenotype, but diverge in developmental pathways; this is an important potential source of hybrid incompatibilities. Here, we explore a theoretical framework to understand how incompatibilities arise due to developmental system drift, using a tractable biophysically inspired genotype-phenotype for spatial gene expression. Modelling the evolution of phenotypes in this way has the key advantage that it mirrors how selection works in nature, i.e. that selection acts on phenotypes, but variation (mutation) arise at the level of genotypes. This results, as we demonstrate, in a number of non-trivial and testable predictions concerning speciation due to developmental system drift, which would not be obtainable by modelling evolution of genotypes or phenotypes alone.</p>
</abstract>
<funding-group>
<award-group id="award001">
<funding-source>
<institution>Medical Research Council</institution>
</funding-source>
<award-id>U117573805</award-id>
<principal-award-recipient>
<name name-style="western">
<surname>Goldstein</surname> <given-names>Richard A.</given-names></name>
</principal-award-recipient>
</award-group>
<funding-statement>RAG was supported by the Medical Research Council under grant U117573805 and BSK by The Francis Crick Institute which receives its core funding from Cancer Research UK, the UK Medical Research Council and the Wellcome Trust. The funders had no role in study design, data collection and analysis, decision to publish, or preparation of the manuscript.</funding-statement>
</funding-group>
<counts>
<fig-count count="6"/>
<table-count count="2"/>
<page-count count="24"/>
</counts>
<custom-meta-group>
<custom-meta>
<meta-name>PLOS Publication Stage</meta-name>
<meta-value>vor-update-to-uncorrected-proof</meta-value>
</custom-meta>
<custom-meta>
<meta-name>Publication Update</meta-name>
<meta-value>2019-08-02</meta-value>
</custom-meta>
<custom-meta id="data-availability">
<meta-name>Data Availability</meta-name>
<meta-value>All relevant data are within the manuscript and its Supporting Information files.</meta-value>
</custom-meta>
</custom-meta-group>
</article-meta>
</front>
<body>
<sec id="sec001" sec-type="intro">
<title>Introduction</title>
<p>The detailed genetic mechanisms by which non-interbreeding species diverge is still poorly understood. Darwin, inspired by John Herschel, called it that “mystery of mysteries” [<xref ref-type="bibr" rid="pcbi.1007177.ref001">1</xref>]; he struggled to understand how natural selection could give rise to hybrid inviability or infertility between populations without producing such incompatibilities within the populations. A solution to this problem was conceived independently by Dobzhansky, Muller and Bateson in which cross-mating would combine alleles at different loci that are incompatible due to epistatic interactions (Dobzhansky Muller incompatibilities, DMI) [<xref ref-type="bibr" rid="pcbi.1007177.ref002">2</xref>–<xref ref-type="bibr" rid="pcbi.1007177.ref004">4</xref>]. Consider a common ancestor with alleles <italic>ab</italic> across two loci, which after a period of allopatric divergence give rise to two lineages which have fixed genotypes <italic>Ab</italic> and <italic>aB</italic>, respectively. Interbreeding between these two populations would result in the heterozygotic hybrid genotype <italic>Aa</italic>|<italic>Bb</italic>, combining the potentially incompatible <italic>A</italic> and <italic>B</italic>, a combination that could not arise in either population mating separately.</p>
<p>Assuming that any combination of alleles that have not been “tested” by the process of evolution represents a potential incompatibility, Orr predicted that the number of incompatibilities between pairs of alleles in a sufficiently large genome would increase with the number of substitutions separating the two lineages (<italic>K</italic>) as <italic>K</italic> (<italic>K</italic>−1) ∼ <italic>K</italic><sup>2</sup> [<xref ref-type="bibr" rid="pcbi.1007177.ref005">5</xref>]. Similarly, the number of untested combinations involving <italic>n</italic> loci would increase as ∼ <italic>K</italic><sup><italic>n</italic></sup>, suggesting that, with evolutionary time, potential incompatibilities would become increasingly dominated by more complex epistatic interactions [<xref ref-type="bibr" rid="pcbi.1007177.ref005">5</xref>]. This would occur, firstly, because there are a larger number of combinations, and secondly, because there are more ways for separate lineages to evolve around incompatible genotypes when there is a larger number of loci. It is unclear, however, how the simplistic assumptions of this model fare with increased biological realism. Not all possible untested hybrids are equally likely to result in real incompatibilities. Selection acting on each separate lineage affects the substitutions that occur and their likely contributions to reproductive isolation. In particular, evolutionary constraints have a strong effect on the development of more complex DMIs, making it uncertain whether their role is as important as suggested by Orr’s combinatorial argument. This highlights the need for considering more realistic models that better capture the salient aspects of the underlying biology, whilst remaining sufficiently simple for tractable evolutionary modelling and simulation.</p>
<p>In recent years a form of epistasis has been described in a number of organisms whereby closely related species have similar organismal phenotypes but are produced by very different developmental mechanisms [<xref ref-type="bibr" rid="pcbi.1007177.ref006">6</xref>–<xref ref-type="bibr" rid="pcbi.1007177.ref009">9</xref>]. This cryptic “developmental system drift” [<xref ref-type="bibr" rid="pcbi.1007177.ref010">10</xref>, <xref ref-type="bibr" rid="pcbi.1007177.ref011">11</xref>] could be an important source of hybrid incompatibilities that cause reproductive isolation [<xref ref-type="bibr" rid="pcbi.1007177.ref012">12</xref>, <xref ref-type="bibr" rid="pcbi.1007177.ref013">13</xref>]. Developmental system drift is an example of a more general characteristic of biological systems where many genotypes can correspond to the same phenotype; this redundancy of the mapping from genotype to phenotype results in a number of non-trivial behaviours which do not arise on fitness landscapes which consider evolution of phenotypes or genotypes independently [<xref ref-type="bibr" rid="pcbi.1007177.ref014">14</xref>–<xref ref-type="bibr" rid="pcbi.1007177.ref025">25</xref>]. The degree of redundancy can be represented as the “sequence entropy”, corresponding to the log of the number of genotypes corresponding to a given phenotype, in analogy to the similar expression in statistical mechanics [<xref ref-type="bibr" rid="pcbi.1007177.ref017">17</xref>, <xref ref-type="bibr" rid="pcbi.1007177.ref025">25</xref>–<xref ref-type="bibr" rid="pcbi.1007177.ref027">27</xref>].</p>
<p>To explore the role of developmental system drift on speciation, we examine the growth of Dobzhansky-Muller incompatibilities using a simple genotype-phenotype map that models the development of spatial patterning of gene expression. The model, introduced by [<xref ref-type="bibr" rid="pcbi.1007177.ref017">17</xref>] allows for cryptic genetic variation and changes in molecular phenotypes while maintaining organismal phenotype under stabilising selection. In addition, we introduce a novel computational method to decompose hybrid DMIs so we can examine the behaviour of the fundamental pair-wise and higher order incompatibilities. We show that including biologically relevant elements gives rise to a number of novel phenomenon that could not arise with models based only on the fitness of genotypes or phenotypes. Our results show that small populations develop hybrid incompatibilities more quickly, due to the pressure of sequence entropy in small populations meaning the common ancestor harbours on average a larger drift load. For large populations, we find hybrid incompatibilities arise more slowly, with a growth law characteristic of a sub-diffusion of the hybrid binding energies, indicative of kinetic traps in the molecular substitution process due to roughness to the fitness landscape [<xref ref-type="bibr" rid="pcbi.1007177.ref017">17</xref>]. Strikingly, we find that for moderate population sizes it is the molecular phenotypes under weakest selection that give rise to earliest incompatibilities, since in the common ancestor they are more likely to be already maladapted. Finally, we find that unlike Orr’s prediction that complex DMIs should be abundant, pair-wise interactions between loci dominate the growth of DMIs, showing that biophysics provides a stronger constraint than pure combinatorics.</p>
<sec id="sec002">
<title>A simple genotype-phenotype map to model developmental system drift</title>
<p>The genotype-phenotype map we use is a modification of the one described in [<xref ref-type="bibr" rid="pcbi.1007177.ref017">17</xref>]. The evolutionary task set for the gene regulation module is to turn an exponentially decaying morphogen gradient (<italic>M</italic>) across a field of cells in an embryo into a sharp step function profile of a downstream transcription factor <italic>T</italic> with its transition at the mid-point of the embryo, as shown in <xref ref-type="fig" rid="pcbi.1007177.g001">Fig 1</xref>. This is accomplished by having the morphogen and an RNA Polymerase <italic>R</italic> bind to two adjacent non-overlapping binding sites in the cis-regulatory region (<italic>C</italic>) region of the transcription factor, the promoter <italic>P</italic>, and a single binding site <italic>B</italic> adjacent to it; transcription occurs whenever the polymerase binds to the promoter, although both proteins can bind to both binding sites dependent on their binding affinities. Binding to the regulatory region is cooperative due to stabilising interactions between the two proteins when bound at the two adjacent sites. The sequences of <italic>M</italic> and <italic>R</italic> at the DNA binding sites are represented by binary strings of length <italic>ℓ</italic><sub><italic>pd</italic></sub> = 10. The corresponding DNA binding sites <italic>B</italic> and <italic>P</italic> are also represented by binary strings of the same length. Interactions between a pair of proteins are similarly represented by binary strings of length <italic>ℓ</italic><sub><italic>pp</italic></sub> = 5. We assume an exponential morphogen concentration profile [<italic>M</italic>](<italic>x</italic>, <italic>α</italic>), as a function of the position of embryonic cells, <italic>x</italic>; the decay rate of the morphogen <italic>α</italic> is represented as a continuous variable, with a relative probability of mutation corresponding to an effective string of length <italic>ℓ</italic><sub><italic>α</italic></sub> = 10 bases. This results in a genome <italic><bold>G</bold></italic>, of total length <italic>ℓ</italic><sub><italic><bold>G</bold></italic></sub> = 60. Protein-DNA and protein-protein binding strengths are determined by the number of mismatches between corresponding strings on the two interacting molecules, where for protein-DNA binding the cost of a mismatch is <italic>ϵ</italic><sub><italic>pd</italic></sub> = 2<italic>k</italic><sub><italic>B</italic></sub><italic>T</italic> and for protein-protein interactions <italic>ϵ</italic><sub><italic>pp</italic></sub> = 1<italic>k</italic><sub><italic>B</italic></sub><italic>T</italic>, where <italic>k</italic><sub><italic>B</italic></sub><italic>T</italic> is Boltzmann’s constant multiplied by room temperature (298<italic>K</italic>). We assume that there is a fixed concentration [<italic>R</italic>] of polymerase, in each cell. We then follow [<xref ref-type="bibr" rid="pcbi.1007177.ref028">28</xref>] and assume that the concentration of the transcription factor in a cell at position <italic>x</italic> ([<italic>T</italic>](<italic>x</italic>)) is simply proportional to the probability of the polymerase being bound to the promoter, where this is calculated using standard methods of equilibrium statistical mechanics allowing for all configurations of protein species bound at these two binding sites, as well as none being bound (see <xref ref-type="sec" rid="sec021">Methods</xref> for details). The fitness contribution <italic>F</italic> of the overall patterning phenotype ranges from 0 to <italic>κ</italic><sub><italic>F</italic></sub> depending on how well expression of the transcription factor is confined to the anterior half of the embryo, as shown in <xref ref-type="fig" rid="pcbi.1007177.g001">Fig 1</xref> (bottom left), where <italic>κ</italic><sub><italic>F</italic></sub> is a measure of the relative contribution of this trait to the fitness of the organism. We define a population-scaled fitness contribution 2<italic>N</italic><sub><italic>e</italic></sub><italic>κ</italic><sub><italic>F</italic></sub>, where <italic>N</italic><sub><italic>e</italic></sub> is the effective population size; for 2<italic>N</italic><sub><italic>e</italic></sub> <italic>κ</italic><sub><italic>F</italic></sub> &lt; 1 the effects of selection are weak, and are conversely strong when 2<italic>Nκ</italic><sub><italic>F</italic></sub> &gt; 1. We also assume that there is a boundary at <italic>F</italic> = <italic>F</italic>*, below which the organism is unviable. We simulate evolution as continuous time Markov process. After evolving a single population for a given number of generations, we form two replicates of the population that evolve independently, representing the process of allopatric speciation. At various time points following this imposed isolation, we consider the fitness and viability of various outcrossings between the two populations. A DMI occurs when the fitness contribution of a particular hybrid drops below <italic>F</italic>*.</p>
<fig id="pcbi.1007177.g001" position="float">
<object-id pub-id-type="doi">10.1371/journal.pcbi.1007177.g001</object-id>
<label>Fig 1</label>
<caption>
<title>An overview of the genotype-phenotype map.</title>
<p>The gene regulatory module has as input a morphogen concentration [<italic>M</italic>](<italic>x</italic>) that varies approximately exponentially across a 1-dimensional embryo of length <italic>L</italic>, and outputs a transcription factor [<italic>T</italic>](<italic>x</italic>). Spatial gene regulation of <italic>T</italic> is achieved via a simple Hamming model of protein DNA binding as shown. Fitness is determined by weighting any gene expression in the anterior half of the embryo as positive, and any in the posterior half as negative (as shown bottom left). We show idealised expression profiles that give maximum fitness when gene expression is confined only to the anterior half (bottom middle), and minimum fitness when there is no discrimination between anterior and posterior (bottom right); these translate to log-fitnesses of <italic>F</italic> = 0 and <italic>F</italic> = −∞, respectively (see <xref ref-type="sec" rid="sec021">Methods</xref>).</p>
</caption>
<graphic mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pcbi.1007177.g001" xlink:type="simple"/>
</fig>
</sec>
</sec>
<sec id="sec003" sec-type="results">
<title>Results</title>
<sec id="sec004">
<title>Evolutionary properties of genotype-phenotype map on each lineage</title>
<p>The properties of a similar genotype-phenotype map have been previously explored [<xref ref-type="bibr" rid="pcbi.1007177.ref017">17</xref>]. An important property of this genotype-phenotype map is that only a single mechanism of patterning is found, in which the polymerase (<italic>R</italic>) binds with intermediate affinity to the promoter (<italic>P</italic>) but with high affinity to the morphogen (<italic>M</italic>), while the morphogen binds to the morphogen binding site (<italic>B</italic>) only above a critical morphogen concentration. This results in a spatial switch once the morphogen falls below this concentration; evolution then fine tunes the relationship between the protein-DNA binding energies, the protein-protein binding energy and the steepness of the morphogen gradient <italic>α</italic> to turn off transcription at the mid-point of the embryo. Despite a single global solution there are many different combinations of the protein-DNA and protein-protein binding energies and <italic>α</italic> that give good patterning, and each of these correspond to many possible genotypes (<italic><bold>G</bold></italic>). Of the different possible binding energies, we find that <inline-formula id="pcbi.1007177.e001"><alternatives><graphic id="pcbi.1007177.e001g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pcbi.1007177.e001" xlink:type="simple"/><mml:math display="inline" id="M1"><mml:mrow><mml:msub><mml:mi>E</mml:mi> <mml:mrow><mml:mi>M</mml:mi> <mml:mi>B</mml:mi></mml:mrow></mml:msub> <mml:mo>,</mml:mo> <mml:msub><mml:mi>E</mml:mi> <mml:mrow><mml:mi>R</mml:mi> <mml:mi>P</mml:mi></mml:mrow></mml:msub> <mml:mo>,</mml:mo> <mml:msub><mml:mover accent="true"><mml:mi>E</mml:mi> <mml:mo>˜</mml:mo></mml:mover> <mml:mrow><mml:mi>R</mml:mi> <mml:mi>M</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:math></alternatives></inline-formula> (binding energy of <italic>M</italic> to <italic>B</italic>, <italic>R</italic> to <italic>P</italic>, and <italic>R</italic> to <italic>M</italic>, respectively, calculated by the equivalent of <xref ref-type="disp-formula" rid="pcbi.1007177.e007">Eq 3</xref> in the <xref ref-type="sec" rid="sec021">Methods</xref>) are under strong selection, whilst the other possible binding energies are essentially neutral with weak selective effects. At large population sizes it is found that the evolutionary dynamics exhibits what is known as quenched-disorder in statistical physics, where energy phenotypes that are less constrained take different <italic>random</italic> values between independent evolutionary runs with no further substitutions; this indicates an underlying roughness to the fitness landscape and that these weakly selected traits are trapped in a local optimum [<xref ref-type="bibr" rid="pcbi.1007177.ref017">17</xref>].</p>
<p>A key property determining the rate at which incompatibilities arise is the distribution of common ancestor phenotypes as a function of the population-scaled fitness contribution 2<italic>N</italic><sub><italic>e</italic></sub> <italic>κ</italic><sub><italic>F</italic></sub>, as shown in <xref ref-type="fig" rid="pcbi.1007177.g002">Fig 2</xref>. For a given value of <italic>κ</italic><sub><italic>F</italic></sub>, we see that for large population sizes (2<italic>Nκ</italic><sub><italic>F</italic></sub> ≫ 10) the distribution is what we would expect from conventional evolutionary theory on a fitness landscape with a fitness maximum. In contrast, as the population size is decreased, we find the distribution shifts to lower fitness values to the point when selection is weak (2<italic>Nκ</italic><sub><italic>F</italic></sub> ≤ 1) the distribution is poised at the inviability boundary. This effect arises due to genetic drift at low population sizes pushing populations towards marginally fit phenotypes that correspond to the largest number of genotypes, that is, with the largest sequence entropy.</p>
<fig id="pcbi.1007177.g002" position="float">
<object-id pub-id-type="doi">10.1371/journal.pcbi.1007177.g002</object-id>
<label>Fig 2</label>
<caption>
<title>Histogram of the fitness of populations over single long runs as a function of the population scaled fitness contribution 2<italic>Nκ</italic><sub><italic>F</italic></sub>.</title>
</caption>
<graphic mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pcbi.1007177.g002" xlink:type="simple"/>
</fig>
</sec>
<sec id="sec005">
<title>Decomposition of DMIs</title>
<p>Our genome is composed of 4 loci: 1) the <italic>R</italic> locus corresponding to the polymerase sequence, 2) the Morphogen (<italic>M</italic>) locus, 3) the <italic>C</italic> locus which corresponds to the sequences for the cis-regulatory region of the transcription factor and 4) the <italic>α</italic> locus, which is the morphogen gradient steepness <italic>α</italic>. Hybrids between the two lineages are constructed by independent reassortment of these loci assuming complete linkage within each locus and no linkage between them. We define a hybrid genotype by a 4 letter string where each letter corresponds to one of the loci defined above and takes one of two cases correspond to whether the allele is from the 1st line or 2nd line; for example, the hybrid <monospace>rMCa</monospace> corresponds to <italic>R</italic> locus having an allele from the 1st lineage, <italic>M</italic> locus with the allele from the 2nd lineage, the transcription factor (cis-regulatory) <italic>C</italic> locus from the 2nd lineage and <italic>α</italic> locus the allele from the 1st lineage. Note that the underlying sequence of each hybrid changes as different substitutions are accepted in each lineage; the notation only refers to alleles fixed at any point in time. We can represent all combinations of the four loci drawn from the two parents (<monospace>RMCA</monospace>, <monospace>RMCa</monospace>, <monospace>RMcA</monospace>, etc.) as points on a four-dimensional Boolean hypercube. In total there are 2<sup>4</sup> − 2 = 14 hybrids.</p>
<p>In <xref ref-type="fig" rid="pcbi.1007177.g003">Fig 3</xref>, we plot a typical time series of how the fitness of two different hybrids (<monospace>Rmca</monospace>(a &amp; b) and <monospace>RMcA</monospace>(c &amp; d) changes over a divergence time <italic>μt</italic> separating a pair of lineages, for 2<italic>Nκ</italic><sub><italic>F</italic></sub> = 1 (a &amp; c) and 2<italic>Nκ</italic><sub><italic>F</italic></sub> = 10 (b &amp; d), where <italic>μ</italic> = <italic>ℓ</italic><sub><italic><bold>G</bold></italic></sub><italic>μ</italic><sub>0</sub> is the mutation rate for all base pairs in all loci. 2<italic>Nκ</italic><sub><italic>F</italic></sub> &gt; 1 indicates strong selection, whilst 2<italic>Nκ</italic><sub><italic>F</italic></sub> ≤ 1 indicates weak selection where genetic drift dominates (For reference, in human populations it has been estimated that ≈ 20 − 30% of mutations are weakly selected [<xref ref-type="bibr" rid="pcbi.1007177.ref029">29</xref>, <xref ref-type="bibr" rid="pcbi.1007177.ref030">30</xref>], compared to in <italic>Drosophila</italic> &lt; 10% [<xref ref-type="bibr" rid="pcbi.1007177.ref030">30</xref>].). We see that the fitness of hybrids generally decreases in a stochastic fashion; when the log-fitness of a hybrid drops below the threshold <italic>F</italic>* (indicated by the dashed line), a DMI arises as is indicated by a vertical log-fitness line (<italic>F</italic> = −∞) for that hybrid. As can be seen in <xref ref-type="fig" rid="pcbi.1007177.g003">Fig 3</xref>, at any given time a changing subset of the fourteen possible hybrids might be incompatible.</p>
<fig id="pcbi.1007177.g003" position="float">
<object-id pub-id-type="doi">10.1371/journal.pcbi.1007177.g003</object-id>
<label>Fig 3</label>
<caption>
<title>Plot of the times series of two hybrids <monospace>Rmca</monospace>(a &amp; b) and <monospace>Rmca</monospace>(c &amp; d) at population scaled fitness contributions of 2<italic>Nκ</italic><sub><italic>F</italic></sub> = 1 (a &amp; c) and 2<italic>Nκ</italic><sub><italic>F</italic></sub> = 10 (b &amp; d).</title>
<p>Times when the fitness of a hybrid drop below the critical value <italic>F</italic>* (dashed line) correspond to DMIs.</p>
</caption>
<graphic mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pcbi.1007177.g003" xlink:type="simple"/>
</fig>
<sec id="sec006">
<title>Total number and type of DMIs</title>
<p>To decompose the pattern of hybrid DMIs into fundamental pair-wise, 3-way and 4-way incompatibilities, we use a parsimonious method (<xref ref-type="sec" rid="sec021">Material &amp; Methods</xref>) which finds the minimum total number of fundamental DMIs types that can explain the pattern of DMIs observed. As shown in <xref ref-type="fig" rid="pcbi.1007177.g004">Fig 4a</xref>, on a 4-dimensional Boolean hypercube, a pair-wise incompatibility is represented by a face of the cube (blue square), a 3-way incompatibility by a single edge (green line) and a 4-way incompatibility by a single point (red circle). This arises because, for example, as in <xref ref-type="fig" rid="pcbi.1007177.g004">Fig 4a</xref>, a 2-point DMI <italic>I</italic><sub><monospace>Ca</monospace></sub> means any genotype which features this sub-genotype <monospace>Ca</monospace> must, by definition, also be a DMI; the alleles on the remaining loci not involved in the DMI, can take any value and so form a 2<italic>D</italic> subspace, which is a whole face of the Boolean 4-cube. Similarly, a 3-point DMI, such as <italic>I</italic><sub><monospace>mcA</monospace></sub> as shown, constrains the sub-genotype of 3 loci to be incompatible and the remaining locus can take any value forming an edge (<monospace>r → R</monospace> in the example) of a 4<italic>D</italic> Boolean hypercube. A 4-point DMI must be a single point in a 4<italic>D</italic> Boolean hypercube (e.g. <italic>I</italic><sub><monospace>rmCA</monospace></sub> as shown). In <xref ref-type="fig" rid="pcbi.1007177.g004">Fig 4b</xref>, we show an example where the pattern of hybrid incompatibilities, shown by red crosses, can be explained in three different ways, each with only 2 DMIs: 1) <italic>I</italic><sub><monospace>Ca</monospace></sub> + <italic>I</italic><sub><monospace>Rca</monospace></sub>, 2) <italic>I</italic><sub><monospace>Ra</monospace></sub> + <italic>I</italic><sub><monospace>rCa</monospace></sub>, 3) <italic>I</italic><sub><monospace>Ca</monospace></sub> + <italic>I</italic><sub><monospace>Ra</monospace></sub>; two is the minimum number of DMIs, as there is no way to explain the pattern seen with a single pair-wise, 3-way or 4-way DMI. We assume each of these is, a priori, equally likely and so the total number of pair-wise incompatibilities is calculated as an average over the different ways we can explain the observed pattern of hybrid DMIs; in the example in <xref ref-type="fig" rid="pcbi.1007177.g004">Fig 4b</xref>, we therefore have a total number of 2-way DMIs of <italic>n</italic><sub>2</sub> = 4/3 and 3-way DMIs <italic>n</italic><sub>3</sub> = 2/3, giving a total number of <italic>n</italic> = <italic>n</italic><sub>2</sub> + <italic>n</italic><sub>3</sub> = 2 DMIs, which is the minimum number of DMIs needed to explain the pattern of hybrid incompatibilities.</p>
<fig id="pcbi.1007177.g004" position="float">
<object-id pub-id-type="doi">10.1371/journal.pcbi.1007177.g004</object-id>
<label>Fig 4</label>
<caption>
<title>Decomposition of hybrid DMIs on a Boolean hyper 4-cube.</title>
<p>Each point on the 4-cube represent each possible hybrid genotype across 4 loci, including the genotype of each parental lineage, where each red cross represents an incompatible hybrid genotype. As shown in a) the fundamental types of DMIs, where a blue square or face identify a subspace of genotypes that correspond to a 2-way DMI, a single green edge or line corresponds to a 3-way DMI and a red open circle corresponds to a single isolated 4-way DMI. b) A more complicated pattern of hybrid DMIs and their decomposition into fundamental types.</p>
</caption>
<graphic mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pcbi.1007177.g004" xlink:type="simple"/>
</fig>
<p>Using this method, we plot the total number of each type of DMI versus divergence time in <xref ref-type="fig" rid="pcbi.1007177.g005">Fig 5</xref>, where the panels correspond to different population scaled fitness contributions from 2<italic>N</italic><sub><italic>e</italic></sub><italic>κ</italic><sub><italic>F</italic></sub> = 0.1 to 2<italic>N</italic><sub><italic>e</italic></sub><italic>κ</italic><sub><italic>F</italic></sub> = 100. We see clearly that as the population size is decreased the rate at which incompatibilities arise increases. This effect results from the shift in distribution of fitness to poorer values for smaller populations in <xref ref-type="fig" rid="pcbi.1007177.g002">Fig 2</xref>; this means that the common ancestor is more likely to be slightly maladapted (higher mutational load) for smaller populations, and so fewer substitutions are required before hybrid incompatibilities arise. This effect was also found for simple models of protein-DNA binding [<xref ref-type="bibr" rid="pcbi.1007177.ref026">26</xref>, <xref ref-type="bibr" rid="pcbi.1007177.ref027">27</xref>], but arose as a result of direct selection for high binding affinity, which also corresponds to low sequence entropy as there are exponentially fewer ways of binding with no or only a few mismatches between protein and DNA. In this work there is only selection on the overall patterning phenotype, yet remarkably we find analogous behaviour due to the effect of sequence entropy of this phenotype.</p>
<fig id="pcbi.1007177.g005" position="float">
<object-id pub-id-type="doi">10.1371/journal.pcbi.1007177.g005</object-id>
<label>Fig 5</label>
<caption>
<title>Plot of the total number of DMIs vs divergence time, together with their decomposition into the total number of 2-way, 3-way, 4-way DMIs, for various scaled populations sizes.</title>
<p>For 2<italic>Nκ</italic><sub><italic>F</italic></sub> ≤ 20 the solid lines correspond to fits of the simulation data to <xref ref-type="disp-formula" rid="pcbi.1007177.e002">Eq 1</xref>, while for 2<italic>Nκ</italic><sub><italic>F</italic></sub> ≥ 50 correspond to fits to <xref ref-type="disp-formula" rid="pcbi.1007177.e004">Eq 2</xref>.</p>
</caption>
<graphic mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pcbi.1007177.g005" xlink:type="simple"/>
</fig>
</sec>
<sec id="sec007">
<title>Pair-wise incompatibilities dominate reproductive isolation</title>
<p>As is clearly shown by <xref ref-type="fig" rid="pcbi.1007177.g005">Fig 5</xref>, pair-wise incompatibilities dominate for all population sizes, though at larger population sizes the difference is smaller, and particularly at shorter times. These results should be contrasted with the prediction of Orr that 2-way: 3-way: 4-way incompatibilities should arise in the ratio 12 : 24 : 14 (for <italic>L</italic> = 4 loci); so for example, there should be double the number of 3-way incompatibilities to pair-wise.</p>
<p>It is possible that this bias could arise by the development of a random set of incompatibilities that would preferentially decompose into sets of 2-way DMIs. In order to consider this possibility, we randomly assigned a set of incompatibilities and analysed them using our decomposition procedure. Contrary to the observed results,, we find that this decomposition results in the largest number of 4-way DMIs, followed by 3-way and then 2-way DMIs (<xref ref-type="supplementary-material" rid="pcbi.1007177.s001">S1 Text</xref>). This is as expected as when the probability that a hybrid is incompatible is small, by random chance, we should expect to see isolated incompatible hybrid genotypes, which would be explained by 4-way DMIs; the fact that our results show that 2-way DMIs are dominant, even at early times, means that whole faces of the Boolean hypercube are found to incompatible, which is not likely to arise in a random model. Hence overall, these results show that contrary to Orr’s prediction that higher order DMIs should be easier to evolve, higher order DMIs evolve more slowly and are in smaller number compared to pair-wise DMIs.</p>
</sec>
<sec id="sec008">
<title>Quantification of power law growth of DMIs for small populations</title>
<p>We find that for small population sizes 2-way, 3-way and 4-way DMIs all increase as a power law at small times, indicated by a straight line on a log-log plot, in agreement with [<xref ref-type="bibr" rid="pcbi.1007177.ref005">5</xref>, <xref ref-type="bibr" rid="pcbi.1007177.ref031">31</xref>], who predicted that <italic>n</italic>-way DMIs should increase as ∼ <italic>t</italic><sup><italic>n</italic></sup>. To more quantitatively assess the exponent, we fit the data for 2<italic>Nκ</italic><sub><italic>F</italic></sub> ≤ 20 using the phenomenological equation:
<disp-formula id="pcbi.1007177.e002"><alternatives><graphic id="pcbi.1007177.e002g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pcbi.1007177.e002" xlink:type="simple"/><mml:math display="block" id="M2"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="right"><mml:mrow><mml:mi>I</mml:mi> <mml:mrow><mml:mo>(</mml:mo> <mml:mi>t</mml:mi> <mml:mo>)</mml:mo></mml:mrow> <mml:mo>=</mml:mo> <mml:mfrac><mml:mrow><mml:msub><mml:mi>I</mml:mi> <mml:mn>0</mml:mn></mml:msub> <mml:mi>t</mml:mi></mml:mrow> <mml:mrow><mml:mi>T</mml:mi> <mml:mo>+</mml:mo> <mml:mi>t</mml:mi></mml:mrow></mml:mfrac> <mml:mo>(</mml:mo> <mml:mn>1</mml:mn> <mml:mo>-</mml:mo> <mml:mtext>exp</mml:mtext> <mml:mrow><mml:mo>-</mml:mo> <mml:msup><mml:mrow><mml:mo>(</mml:mo> <mml:mi>t</mml:mi> <mml:mo>/</mml:mo> <mml:mi>τ</mml:mi> <mml:mo>)</mml:mo></mml:mrow> <mml:mrow><mml:mi>γ</mml:mi> <mml:mo>-</mml:mo> <mml:mn>1</mml:mn></mml:mrow></mml:msup></mml:mrow> <mml:mo>)</mml:mo></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives> <label>(1)</label></disp-formula>
which has the asymptotic form of <italic>I</italic>(<italic>t</italic>) ∼ <italic>t</italic><sup><italic>γ</italic></sup> for <italic>t</italic> ≪ <italic>τ</italic> and <italic>t</italic> ≪ <italic>T</italic> and an opposite limit of <italic>I</italic>(<italic>t</italic> → ∞) = <italic>I</italic><sub>0</sub>. We see that for the total number of DMIs and for 2-way, 3-way and 4-way DMIs, this form fits the data well at intermediate and small population sizes. We tabulate the power law exponent derived from these fits in <xref ref-type="table" rid="pcbi.1007177.t001">Table 1</xref>. We see that the total number of DMIs and 2-way DMIs have a power law exponent close to <italic>γ</italic> = 2, which is consistent with the Orr model. The 4-way DMIs have a larger exponent than the 3-way DMIs, which is larger than the 2-way DMIs, also in agreement with Orr’s model, although the values of the exponent are substantially lower than <italic>n</italic> for the 3-way and 4-way DMIs.</p>
<table-wrap id="pcbi.1007177.t001" position="float">
<object-id pub-id-type="doi">10.1371/journal.pcbi.1007177.t001</object-id>
<label>Table 1</label>
<caption>
<title>Table of values of the exponent <italic>γ</italic> characterising the power law of growth of DMIs at short times and small scaled population sizes.</title>
</caption>
<alternatives>
<graphic id="pcbi.1007177.t001g" mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pcbi.1007177.t001" xlink:type="simple"/>
<table border="0" frame="box" rules="all">
<colgroup>
<col align="left" valign="middle"/>
<col align="left" valign="middle"/>
<col align="left" valign="middle"/>
<col align="left" valign="middle"/>
<col align="left" valign="middle"/>
<col align="left" valign="middle"/>
</colgroup>
<thead>
<tr>
<th align="center" style="border-bottom:thick">2<italic>Nκ</italic><sub><italic>F</italic></sub></th>
<th align="center" style="border-bottom:thick"/>
<th align="center" style="border-bottom:thick">0.1</th>
<th align="center" style="border-bottom:thick">1</th>
<th align="center" style="border-bottom:thick">10</th>
<th align="center" style="border-bottom:thick">20</th>
</tr>
</thead>
<tbody>
<tr>
<td align="center">Total</td>
<td align="center" rowspan="4"><italic>γ</italic></td>
<td align="center">1.94 ± 0.05</td>
<td align="center">1.99 ± 0.05</td>
<td align="center">1.95 ± 0.05</td>
<td align="center">2.00 ± 0.12</td>
</tr>
<tr>
<td align="center">2-way</td>
<td align="center">1.93 ± 0.05</td>
<td align="center">1.98 ± 0.06</td>
<td align="center">1.84 ± 0.06</td>
<td align="center">1.97 ± 0.13</td>
</tr>
<tr>
<td align="center">3-way</td>
<td align="center">2.66 ± 0.13</td>
<td align="center">2.81 ± 0.17</td>
<td align="center">2.76 ± 0.24</td>
<td align="center">2.14 ± 0.15</td>
</tr>
<tr>
<td align="center">4-way</td>
<td align="center">3.17 ± 0.19</td>
<td align="center">3.43 ± 0.41</td>
<td align="center">3.14 ± 0.24</td>
<td align="center">2.93 ± 0.19</td>
</tr>
</tbody>
</table>
</alternatives>
</table-wrap>
</sec>
<sec id="sec009">
<title>Sub-diffusive growth of DMIs for large populations</title>
<p>For large population sizes there is no clear power law, which is again consistent with previous simulations [<xref ref-type="bibr" rid="pcbi.1007177.ref027">27</xref>] and also theoretical calculations [<xref ref-type="bibr" rid="pcbi.1007177.ref026">26</xref>]; when high fitness corresponds to high binding affinity, so that the common ancestor distribution is peaked away from the inviability boundary, large populations have a small drift load, meaning that DMIs arise when hybrid energy traits diffuse to the boundary. One such analytically tractable model was investigated in [<xref ref-type="bibr" rid="pcbi.1007177.ref026">26</xref>] and predicted that the number of DMIs is a complementary error function, which has an asymptotic form <inline-formula id="pcbi.1007177.e003"><alternatives><graphic id="pcbi.1007177.e003g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pcbi.1007177.e003" xlink:type="simple"/><mml:math display="inline" id="M3"><mml:mrow><mml:mi>I</mml:mi> <mml:mrow><mml:mo>(</mml:mo> <mml:mi>t</mml:mi> <mml:mo>)</mml:mo></mml:mrow> <mml:mo>∼</mml:mo> <mml:mfrac><mml:msqrt><mml:mrow><mml:mn>4</mml:mn> <mml:mi>μ</mml:mi> <mml:mi>t</mml:mi></mml:mrow></mml:msqrt> <mml:msup><mml:mi>K</mml:mi> <mml:mo>*</mml:mo></mml:msup></mml:mfrac> <mml:msup><mml:mi>e</mml:mi> <mml:mrow><mml:mo>-</mml:mo> <mml:msup><mml:mrow><mml:mo>(</mml:mo> <mml:msup><mml:mi>K</mml:mi> <mml:mo>*</mml:mo></mml:msup> <mml:mo>)</mml:mo></mml:mrow> <mml:mn>2</mml:mn></mml:msup> <mml:mo>/</mml:mo> <mml:mn>4</mml:mn> <mml:mi>μ</mml:mi> <mml:mi>t</mml:mi></mml:mrow></mml:msup></mml:mrow></mml:math></alternatives></inline-formula>, which due to the essential singularity as <italic>t</italic> → 0 has the property of negative curvature on a log-log plot. However, neither this form nor its multidimensional generalization fit the simulation data well (not shown). A functional form that <italic>is</italic> a good fit to the data at large populations sizes is
<disp-formula id="pcbi.1007177.e004"><alternatives><graphic id="pcbi.1007177.e004g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pcbi.1007177.e004" xlink:type="simple"/><mml:math display="block" id="M4"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="right"><mml:mrow><mml:mi>I</mml:mi> <mml:mrow><mml:mo>(</mml:mo> <mml:mi>t</mml:mi> <mml:mo>)</mml:mo></mml:mrow> <mml:mo>=</mml:mo> <mml:mfrac><mml:msqrt><mml:mrow><mml:mn>4</mml:mn> <mml:msup><mml:mrow><mml:mo>(</mml:mo> <mml:mi>μ</mml:mi> <mml:mi>t</mml:mi> <mml:mo>)</mml:mo></mml:mrow> <mml:mi>β</mml:mi></mml:msup></mml:mrow></mml:msqrt> <mml:msup><mml:mi>K</mml:mi> <mml:mo>*</mml:mo></mml:msup></mml:mfrac> <mml:msup><mml:mi>e</mml:mi> <mml:mrow><mml:mo>-</mml:mo> <mml:msup><mml:mrow><mml:mo>(</mml:mo> <mml:msup><mml:mi>K</mml:mi> <mml:mo>*</mml:mo></mml:msup> <mml:mo>)</mml:mo></mml:mrow> <mml:mn>2</mml:mn></mml:msup> <mml:mo>/</mml:mo> <mml:mn>4</mml:mn> <mml:msup><mml:mrow><mml:mo>(</mml:mo> <mml:mi>μ</mml:mi> <mml:mi>t</mml:mi> <mml:mo>)</mml:mo></mml:mrow> <mml:mi>β</mml:mi></mml:msup></mml:mrow></mml:msup> <mml:mo>,</mml:mo></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives> <label>(2)</label></disp-formula>
which arises when considering fractional Brownian processes with exponent <italic>β</italic> [<xref ref-type="bibr" rid="pcbi.1007177.ref032">32</xref>]; normal diffusion or Brownian motion arises when <italic>β</italic> = 1, while <italic>β</italic> &lt; 1 corresponds to <italic>sub</italic>diffusive behaviour, while <italic>β</italic> &gt; 1 is <italic>super</italic>diffusive. It is clear by examining the exponent <italic>β</italic> in <xref ref-type="table" rid="pcbi.1007177.t002">Table 2</xref> from fits of the data in <xref ref-type="fig" rid="pcbi.1007177.g005">Fig 5</xref> at large population size (2<italic>Nκ</italic><sub><italic>F</italic></sub> ≥ 50) that the DMIs arise as a result of a sub-diffusive process, where 2-way, 3-way and 4-way DMIs have an exponent <italic>β</italic> ≈ 1/3 for 2<italic>Nκ</italic><sub><italic>F</italic></sub> = 50 and <italic>β</italic> ≈ 1/4 for 2<italic>Nκ</italic><sub><italic>F</italic></sub> = 100. The most likely mechanism that would give rise to sub-diffusive behaviour is a broad spectrum of times between substitutions; even though in the simulations the kinetic Monte Carlo scheme is based on a Poisson process for a given genotypic state <italic><bold>G</bold></italic>, the distribution of rates could vary significantly as populations explore the fitness landscape. This would be consistent with the results in [<xref ref-type="bibr" rid="pcbi.1007177.ref017">17</xref>], which reveal the underlying fitness landscape of this spatial patterning genotype-phenotype map to be rough, which could lead to broad distribution of substitution rates in each lineage and effective sub-diffusive behaviour of the hybrids. Finally as expected the average number of substitutions needed at large population sizes is large, with values of <italic>K</italic>* ranging from 6 to 9, and increases with increasing population size, as expected; it also increases very moderately with increasing <italic>n</italic>, which would be consistent with an increase in dimensionality of higher order DMIs. Interestingly, these values of <italic>K</italic>* would indicate that the fraction of viable genotypes is very small, <inline-formula id="pcbi.1007177.e005"><alternatives><graphic id="pcbi.1007177.e005g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pcbi.1007177.e005" xlink:type="simple"/><mml:math display="inline" id="M5"><mml:mrow><mml:mo>∼</mml:mo> <mml:msup><mml:mn>2</mml:mn> <mml:msup><mml:mi>K</mml:mi> <mml:mo>*</mml:mo></mml:msup></mml:msup> <mml:mo>/</mml:mo> <mml:msup><mml:mn>2</mml:mn> <mml:msub><mml:mi>ℓ</mml:mi> <mml:mi mathvariant="bold-italic">G</mml:mi></mml:msub></mml:msup> <mml:mo>∼</mml:mo> <mml:msup><mml:mn>10</mml:mn> <mml:mrow><mml:mo>-</mml:mo> <mml:mn>13</mml:mn></mml:mrow></mml:msup></mml:mrow></mml:math></alternatives></inline-formula>, where <italic>ℓ</italic><sub><italic><bold>G</bold></italic></sub> = 60 is the number of effective binary sites in this genotype-phenotype map.</p>
<table-wrap id="pcbi.1007177.t002" position="float">
<object-id pub-id-type="doi">10.1371/journal.pcbi.1007177.t002</object-id>
<label>Table 2</label>
<caption>
<title>Table of values of the parameters characterising the sub-diffusive growth of DMIs for large scaled population sizes; <italic>β</italic> = 1 corresponds to normal diffusive motion, <italic>β</italic> &lt; 1 to sub-diffusion and <italic>β</italic> &gt; 1 super-diffusion, while <italic>K</italic>* corresponds roughly to the number of substitutions required to reach the inviable region.</title>
</caption>
<alternatives>
<graphic id="pcbi.1007177.t002g" mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pcbi.1007177.t002" xlink:type="simple"/>
<table border="0" frame="box" rules="all">
<colgroup>
<col align="left" valign="middle"/>
<col align="left" valign="middle"/>
<col align="left" valign="middle"/>
<col align="left" valign="middle"/>
</colgroup>
<thead>
<tr>
<th align="center" style="border-bottom:thick">2<italic>Nκ</italic><sub><italic>F</italic></sub></th>
<th align="center" style="border-bottom:thick"/>
<th align="center" style="border-bottom:thick">50</th>
<th align="center" style="border-bottom:thick">100</th>
</tr>
</thead>
<tbody>
<tr>
<td align="center" rowspan="2">Total</td>
<td align="center"><italic>β</italic></td>
<td align="center">0.47 ± 0.03</td>
<td align="center">0.33 ± 0.02</td>
</tr>
<tr>
<td align="center"><italic>K</italic>*</td>
<td align="center">6.58 ± 0.12</td>
<td align="center">7.37 ± 0.26</td>
</tr>
<tr>
<td align="center" rowspan="2">2-way</td>
<td align="center"><italic>β</italic></td>
<td align="center">0.32 ± 0.01</td>
<td align="center">0.25 ± 0.01</td>
</tr>
<tr>
<td align="center"><italic>K</italic>*</td>
<td align="center">6.71 ± 0.07</td>
<td align="center">7.51 ± 0.18</td>
</tr>
<tr>
<td align="center" rowspan="2">3-way</td>
<td align="center"><italic>β</italic></td>
<td align="center">0.33 ± 0.01</td>
<td align="center">0.22 ± 0.01</td>
</tr>
<tr>
<td align="center"><italic>K</italic>*</td>
<td align="center">7.53 ± 0.10</td>
<td align="center">8.09 ± 0.27</td>
</tr>
<tr>
<td align="center" rowspan="2">4-way</td>
<td align="center"><italic>β</italic></td>
<td align="center">0.31 ± 0.02</td>
<td align="center">0.25 ± 0.02</td>
</tr>
<tr>
<td align="center"><italic>K</italic>*</td>
<td align="center">7.50 ± 0.28</td>
<td align="center">8.66 ± 0.39</td>
</tr>
</tbody>
</table>
</alternatives>
</table-wrap>
</sec>
<sec id="sec010">
<title>Molecular phenotypes under weakest selection dominate DMIs at larger population sizes</title>
<p>The DMI decomposition algorithm allows examination of the behaviour of different types of pair-wise, 3-way and 4-way DMIs. The different pair-wise DMIs can easily be identified with the different molecular binding energy phenotypes that combine together to form the overall organismal phenotype. The plot in <xref ref-type="fig" rid="pcbi.1007177.g006">Fig 6</xref> shows how the number of DMIs grows for the three most dominant pair-wise DMIs <italic>I</italic><sub><monospace>rm</monospace></sub>, <italic>I</italic><sub><monospace>rc</monospace></sub> and <italic>I</italic><sub><monospace>mc</monospace></sub> (pair-wise DMIs involving the <italic>α</italic> locus are orders of magnitude smaller—see <xref ref-type="supplementary-material" rid="pcbi.1007177.s001">S1 Text</xref>), as a function of the scaled divergence time <italic>ℓ</italic>′<italic>μt</italic>, where <italic>ℓ</italic>′ = 5 for <italic>I</italic><sub><monospace>rm</monospace></sub> and <italic>ℓ</italic>′ = 10 for <italic>I</italic><sub><monospace>rc</monospace></sub> and <italic>I</italic><sub><monospace>mc</monospace></sub>, cancelling how mutations are more likely to hit longer regions of the genome [<xref ref-type="bibr" rid="pcbi.1007177.ref027">27</xref>]. Strikingly, we find that contrary to what might seem intuitive, it is the molecular interactions under weakest selection that dominate the number of DMIs, particularly for larger population sizes. For 2<italic>Nκ</italic><sub><italic>F</italic></sub> &gt;= 50, we see at early times <italic>I</italic><sub><monospace>rc</monospace></sub> &gt; <italic>I</italic><sub><monospace>rm</monospace></sub> &gt; <italic>I</italic><sub><monospace>mc</monospace></sub>, which is the same order of increasing selective constraint on each of these molecular interactions (<xref ref-type="supplementary-material" rid="pcbi.1007177.s001">S1 Text</xref>). This has a simple explanation: at a sufficiently large population size such that none of the selective constraints on different molecular phenotypes is neutral, in the common ancestor the molecular interaction strengths under weakest selection will have the largest drift load and hence fewer substitutions are needed for incompatibilities to arise in hybrids. This is precisely as observed in simple models of transcription factor DNA binding, where the incompatibilities arise more quickly where binding is under weak selection for high affinity [<xref ref-type="bibr" rid="pcbi.1007177.ref027">27</xref>].</p>
<fig id="pcbi.1007177.g006" position="float">
<object-id pub-id-type="doi">10.1371/journal.pcbi.1007177.g006</object-id>
<label>Fig 6</label>
<caption>
<title>Plot of the spectrum 2-way DMIs vs scaled divergence time for different scaled population sizes.</title>
<p>Here the divergence time for each pair-wise DMI is scaled by the number of base-pairs involved in each interaction in order to remove the effect that interactions with a larger number of base-pairs mutate at a larger rate in proportion to their length; for <italic>I</italic><sub><monospace>rm</monospace></sub>, <italic>ℓ</italic>′ = 5, and for <italic>I</italic><sub><monospace>rc</monospace></sub> and <italic>I</italic><sub><monospace>mc</monospace></sub>, <italic>ℓ</italic>′ = 10.</p>
</caption>
<graphic mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pcbi.1007177.g006" xlink:type="simple"/>
</fig>
<p>In the converse limit, when population sizes are sufficiently small that all molecular phenotypes are neutral (up to the truncation threshold), we find only small differences between the rise of each of the pair-wise incompatibility types; this is again consistent with simple models of transcription factor DNA binding, where the phenotypic distribution of binding energies is dominated by their sequence entropy and not fitness at small population sizes and there is only a weak dependence on sequence length [<xref ref-type="bibr" rid="pcbi.1007177.ref027">27</xref>]. In the <xref ref-type="supplementary-material" rid="pcbi.1007177.s001">S1 Text</xref>, we show this is also true of the higher order DMIs, where it is purely the sequence-entropy constraints of each DMI type which controls the dynamics of incompatibilities and fitness has little bearing; however, as the population size is increased this degeneracy is lifted and each of the DMIs exhibits individual behaviour.</p>
</sec>
</sec>
</sec>
<sec id="sec011" sec-type="conclusions">
<title>Discussion</title>
<p>There is still very little understood about the underlying genetic basis that gives rise to reproductive isolation between lineages. Gene expression divergence is thought to be a strong determinant of the differences between species [<xref ref-type="bibr" rid="pcbi.1007177.ref033">33</xref>–<xref ref-type="bibr" rid="pcbi.1007177.ref037">37</xref>] with a growing body of evidence for their direct role in speciation, particularly through transcription factors [<xref ref-type="bibr" rid="pcbi.1007177.ref038">38</xref>–<xref ref-type="bibr" rid="pcbi.1007177.ref042">42</xref>]. In particular, transcription factors mediate the control of gene expression and the ultimately body plans of organisms through complicated gene regulatory networks. Studies in drosophila and nematodes have shown in closely diverged species conserved body plans yet plasticity in the underlying molecular architectures between them [<xref ref-type="bibr" rid="pcbi.1007177.ref007">7</xref>–<xref ref-type="bibr" rid="pcbi.1007177.ref011">11</xref>, <xref ref-type="bibr" rid="pcbi.1007177.ref043">43</xref>].</p>
<p>This evidence suggests that divergence in the regulatory networks controlling gene expression and body plans in allopatric lineages is likely to be an important mechanism of speciation in many higher organisms, yet we do not yet have a quantitative evolutionary framework to model such processes, which can then be used to make predictions. A key challenge is to link changes at the genetic level, where mutations arise, to their outcomes on changes in phenotype, where selection actually acts. Although in the past century we have made great strides in our understanding of evolution through the modern synthesis of Fisher, Wright, Kimura and many others [<xref ref-type="bibr" rid="pcbi.1007177.ref044">44</xref>–<xref ref-type="bibr" rid="pcbi.1007177.ref048">48</xref>], this has focussed on the evolution of either genotypes or phenotypes separately. However, in recent years there has been increasing attention on the development of more realistic fitness landscapes, and how this affects the evolutionary process. For example, in biologically realistic systems, often many genotypes correspond to the same phenotype; this redundancy of the mapping from genotype to phenotype results in a number of non-trivial and emergent behaviours which do not arise on fitness landscapes which consider evolution of phenotypes or genotypes independently [<xref ref-type="bibr" rid="pcbi.1007177.ref014">14</xref>–<xref ref-type="bibr" rid="pcbi.1007177.ref024">24</xref>].</p>
<sec id="sec012">
<title>Role of free fitness in genotype-phenotype maps</title>
<p>One important and well explored example is the evolution of transcription factor DNA binding [<xref ref-type="bibr" rid="pcbi.1007177.ref015">15</xref>, <xref ref-type="bibr" rid="pcbi.1007177.ref016">16</xref>, <xref ref-type="bibr" rid="pcbi.1007177.ref022">22</xref>, <xref ref-type="bibr" rid="pcbi.1007177.ref026">26</xref>, <xref ref-type="bibr" rid="pcbi.1007177.ref027">27</xref>, <xref ref-type="bibr" rid="pcbi.1007177.ref049">49</xref>, <xref ref-type="bibr" rid="pcbi.1007177.ref050">50</xref>], where the genotype-phenotype map from sequence to binding affinity can be explicitly enumerated under simplifying assumptions [<xref ref-type="bibr" rid="pcbi.1007177.ref051">51</xref>, <xref ref-type="bibr" rid="pcbi.1007177.ref052">52</xref>]. These investigations show that for small populations dominated by genetic drift, evolution does not optimise fitness. Rather, there is a trade off between the high fitness of a small number of sequences that bind well and the exponentially larger number of sequences that bind less well. The result is the maximisation of a combination of fitness and the number of sequences that correspond to that phenotype. We can take advantage of analogies with statistical mechanics and represent this combination as the “free fitness”, where the log of the number of sequences is the “sequence entropy” of a phenotype [<xref ref-type="bibr" rid="pcbi.1007177.ref015">15</xref>, <xref ref-type="bibr" rid="pcbi.1007177.ref026">26</xref>, <xref ref-type="bibr" rid="pcbi.1007177.ref027">27</xref>, <xref ref-type="bibr" rid="pcbi.1007177.ref053">53</xref>]. In this formulation, the effective population size is analogous to an inverse temperature for a physical system connected to a heat-bath, where decreasing population size increases the effect of drift and the importance of sequence entropy relative to fitness.</p>
<p>When the free fitness framework is applied to the role of transcription factor DNA binding in allopatric speciation, our previous work gave rise to a simple prediction: incompatibilities arise more quickly for smaller, drift-dominated, populations [<xref ref-type="bibr" rid="pcbi.1007177.ref026">26</xref>, <xref ref-type="bibr" rid="pcbi.1007177.ref027">27</xref>], supporting previous computational studies by Tulchinsky et al. [<xref ref-type="bibr" rid="pcbi.1007177.ref054">54</xref>], that showed decreased hybrid fitness for smaller populations. This can be understood as a result of the greater importance of sequence entropy for small populations, resulting in common ancestors with a higher drift load, which are therefore closer to incompatible regions. As a result, fewer substitutions are required for the development of hybrid incompatibilities [<xref ref-type="bibr" rid="pcbi.1007177.ref026">26</xref>, <xref ref-type="bibr" rid="pcbi.1007177.ref027">27</xref>]. Conversely, those transcription factor binding site pairs under weaker selection, at a fixed population size, will give rise to incompatibilities more quickly, as they are more susceptible to drift and in the common ancestor will have a larger drift load.</p>
<p>In this paper, we examine speciation in a more realistic genotype phenotype map. For the first time we examine how incompatibilities arise in allopatry for a simple evolutionary model of developmental system drift, where a higher level organismal spatial patterning phenotype is maintained by stabilising selection, whilst the underlying molecular binding energy phenotypes and ultimately the sequences that determine them, the genotype, are allowed to drift in the evolutionary simulations. Earlier analyses of this model demonstrated the evolution of a number of non-trivial features such as a balance between fitness and sequence entropy deciding the course of evolution at small population sizes and a roughness to the fitness landscape for phenotypes which have high fitness [<xref ref-type="bibr" rid="pcbi.1007177.ref017">17</xref>]. Importantly here, unlike in previous works [<xref ref-type="bibr" rid="pcbi.1007177.ref026">26</xref>, <xref ref-type="bibr" rid="pcbi.1007177.ref027">27</xref>] we do not directly select for high binding affinity, but only on the organismal level phenotype, but as we discuss, we find the same population size dependence, as well as a number of other novel phenomenon to the speciation process, which would not be obtainable by modelling selection only at the level of phenotypes or genotypes. The results show that biophysics and effective population size provide a much stronger constraint than previous simple modelling of the dynamics of hybrid incompatibilities would suggest [<xref ref-type="bibr" rid="pcbi.1007177.ref005">5</xref>, <xref ref-type="bibr" rid="pcbi.1007177.ref031">31</xref>].</p>
</sec>
<sec id="sec013">
<title>Small populations characterised by power law growth of incompatibilities, large populations by diffusive growth</title>
<p>A key result we find is that small populations are characterised by a power law growth of incompatibilities with time, vs large populations a diffusive law (discussed below). Thus we suggest that empirical evidence of power law growth in incompatibilities is a signature of allopatric speciation at small population sizes. The Orr model of the growth of hybrid incompatibilities predicts that incompatibilities grow as a power law of the divergence time between allopatric lineages [<xref ref-type="bibr" rid="pcbi.1007177.ref005">5</xref>, <xref ref-type="bibr" rid="pcbi.1007177.ref031">31</xref>], where the exponent represents the number of genes participating in the interaction (e.g. 2 for a 2-way incompatibility). The results of our model also yield this prediction, but only when populations sizes are sufficiently small. There is, however, an alternative model for the power law behaviour to the combinatoric argument made by Orr. As argued in [<xref ref-type="bibr" rid="pcbi.1007177.ref027">27</xref>], at small population sizes, where genetic drift is dominant and there is a large drift load, common ancestor populations are poised close to the incompatibility boundary and the growth of DMIs at short times is determined by the likelihood that a few critical substitutions arrive quickly, which is given by a Poisson process; if the critical number of substitutions is <italic>K</italic>* then for short times we would expect <inline-formula id="pcbi.1007177.e006"><alternatives><graphic id="pcbi.1007177.e006g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pcbi.1007177.e006" xlink:type="simple"/><mml:math display="inline" id="M6"><mml:mrow><mml:msub><mml:mi>P</mml:mi> <mml:mi>I</mml:mi></mml:msub> <mml:mrow><mml:mo>(</mml:mo> <mml:mi>t</mml:mi> <mml:mo>)</mml:mo></mml:mrow> <mml:mo>∼</mml:mo> <mml:msup><mml:mrow><mml:mo>(</mml:mo> <mml:mi>μ</mml:mi> <mml:mi>t</mml:mi> <mml:mo>)</mml:mo></mml:mrow> <mml:msup><mml:mi>K</mml:mi> <mml:mo>*</mml:mo></mml:msup></mml:msup></mml:mrow></mml:math></alternatives></inline-formula> and so given that at least <italic>n</italic> substitutions are needed for a <italic>n</italic>-way incompatibility, we would expect <italic>K</italic>* ≥ <italic>n</italic>. In this paper, we introduced a new method to decompose DMIs into their fundamental pair-wise, 3- and 4-way incompatibilities, and find that for more complex incompatibilities (more loci involved) the larger the exponent of their power law growth. However, we find the exponents we measure for 3- and 4-way incompatibilities are smaller than the predicted exponents of 3 and 4 respectively. We suggest this could be due, as shown in the <xref ref-type="supplementary-material" rid="pcbi.1007177.s001">S1 Text</xref>, to the greater number of higher order DMIs arising just by chance, leading to an overestimation of 3- and 4-way DMIs at short times, where at short times a <italic>smaller</italic> exponent corresponds to a larger number (i.e. <italic>τ</italic><sup><italic>n</italic>−1</sup> &gt; <italic>τ</italic><sup><italic>n</italic></sup> for <italic>τ</italic> &lt; 1, where <italic>τ</italic> is some dimensionless timescale).</p>
<p>Examining the growth of incompatibilities at large population sizes, we see there is a characteristic negative curvature on a log-log plot, predicted theoretically by [<xref ref-type="bibr" rid="pcbi.1007177.ref026">26</xref>], indicating that, as the number of substitutions needed for incompatibilities is large, the changes in the hybrid traits can be approximated by a diffusion process. However, we find that a simple model of diffusion does not fit the simulation data well; instead a model of sub-diffusion, that would arise if there are a number of kinetic traps giving a broad distribution of substitution times, does fit the data well. This is consistent with the finding that the genotype-phenotype map has a rough fitness landscape, which is only revealed at sufficiently large population sizes [<xref ref-type="bibr" rid="pcbi.1007177.ref017">17</xref>]. However, it is not clear whether we would observe quenched disorder and sub-diffusive behaviour with more realistic biophysical models that include a larger alphabet size with 20 amino acids and 4 nucleotides.</p>
</sec>
<sec id="sec014">
<title>Incompatibilities arise more rapidly in small populations</title>
<p>We also find that incompatibilities arise more rapidly in smaller populations, which is an emergent effect due to the genotype-phenotype map, giving a bias in degeneracy of different phenotypes; lower fitness and less sharp patterning organismal phenotypes have many more sequences than higher fitness, sharper patterning, phenotypes. In smaller drift-dominated populations, this means there is bias towards phenotypes of small sequence entropy (log degeneracy) that counteracts the tendency of natural selection to favour phenotypes of high fitness. Consequently, the common ancestor in small populations is more likely to be slightly maladapted and less substitutions are needed before hybrids develop incompatibilities. These predictions are consistent with empirical evidence for an inverse correlation of speciation rates with effective population size; the net rates of diversification from phylogenetic trees [<xref ref-type="bibr" rid="pcbi.1007177.ref055">55</xref>–<xref ref-type="bibr" rid="pcbi.1007177.ref057">57</xref>] indicate smaller populations speciate more quickly, as well from inferred times for post-zygotic isolation to arise [<xref ref-type="bibr" rid="pcbi.1007177.ref058">58</xref>–<xref ref-type="bibr" rid="pcbi.1007177.ref060">60</xref>], where for example mammals and cichlids, which have effective population sizes of order 10<sup>4</sup> [<xref ref-type="bibr" rid="pcbi.1007177.ref061">61</xref>– <xref ref-type="bibr" rid="pcbi.1007177.ref064">64</xref>], develop reproductive isolation more quickly than birds, which have effective populations sizes of order 10<sup>6</sup> [<xref ref-type="bibr" rid="pcbi.1007177.ref065">65</xref>]. This model and the similar results obtained for transcription factor DNA binding [<xref ref-type="bibr" rid="pcbi.1007177.ref026">26</xref>, <xref ref-type="bibr" rid="pcbi.1007177.ref027">27</xref>] provide a robust explanation of how stabilising selection can give rise to this population size effect in speciation, which do not require passing through fitness valleys as do models based on the founder effect [<xref ref-type="bibr" rid="pcbi.1007177.ref066">66</xref>–<xref ref-type="bibr" rid="pcbi.1007177.ref069">69</xref>].</p>
</sec>
<sec id="sec015">
<title>Universal phenomenon? Interplay between sequence entropy and specificity of fit phenotypes</title>
<p>However, the results for this genotype-phenotype map for developmental system drift are particularly noteworthy compared to the previous results on transcription factor DNA binding, as they are obtained without directly selecting for high affinity, low sequence entropy, binding phenotypes; here we only select on the organismal spatial patterning phenotype, but nonetheless we find small populations develop hybrid incompatibilities more quickly through a similar mechanism of the interplay between fitness, sequence entropy and populations size. Although studies with more complex genotype-phenotype maps will be required, we suggest this points towards a broad principle, where the specificity required of a phenotype to be functional and of high fitness will mean that it will be coded by fewer genotypes. For example, in simple models of protein stability, the empirical observation that all proteins tend to be marginally stable, can be explained by the fact that as the stability of a protein is increased the number of sequences that give that stability decreases rapidly [<xref ref-type="bibr" rid="pcbi.1007177.ref019">19</xref>]; assuming high fitness corresponds to maximum stability, this phenotype is highly specified, as only a few sequences will meet the requirement that all inter-chain interactions in the protein are favourable.</p>
</sec>
<sec id="sec016">
<title>Molecular phenotypes under weakest selection dominate DMIs at larger population sizes</title>
<p>Another property that emerges from this model not obtainable by simply modelling transcription factor DNA binding is that certain molecular phenotypes are more important than others in giving rise to incompatibilities. One particular feature of this model is that the selective constraints on the different molecular binding energy phenotypes emerge through the evolutionary process of stabilising selection on the organismal phenotype, and are not specified by the model. Most strikingly, and counterintuitively, the model predicts that molecular phenotypes that are under the weakest selective constraints (but not strictly neutral) dominate by giving rise to the earliest incompatibilities for intermediate and large population sizes. Remarkably, here this emerges as a consequence of stabilising selection on the organismal phenotype and not due to selection imposed for good binding affinity as in previous works [<xref ref-type="bibr" rid="pcbi.1007177.ref027">27</xref>].</p>
<p>We note that these results have been obtained by changing the population size whilst keeping the strength of selection on the organismal trait <italic>κ</italic><sub><italic>F</italic></sub> fixed. It would be tempting to use these results to suggest that overall those traits in a genome under weakest selection would give rise to the earliest incompatibilities and hence dominate allopatric speciation. However, the question of the how the dynamics of hybrid incompatibilities changes as the strength of selection changes is a subtle one, which we leave to future work; in this model a reduction in <italic>κ</italic><sub><italic>F</italic></sub> has the effect of changing the phenotypic regions of incompatibility, with non-trivial consequences. It should also be noted, the role of sequence entropy in giving a strong population size dependence to the rate of reproductive isolation; if we consider only a peaked phenotypic landscape without a sequence entropy bias, a reduction in population size would only lead to a broadening of the phenotypic distribution and not a change in the mean of the distribution, and so a much weaker effect, as the common ancestor will still be <italic>typically</italic> far from incompatible regions. On the other hand with strong (exponential) degeneracy biases, the mean phenotype of the common ancestor changes strongly giving the large population size effect seen, which is as demonstrated in <xref ref-type="fig" rid="pcbi.1007177.g002">Fig 2</xref>.</p>
</sec>
<sec id="sec017">
<title>Biophysics dominates combinatorics: Pair-wise incompatibilities dominate reproductive isolation</title>
<p>Another finding of significance is that pair-wise or 2-way DMIs dominate compared with higher order DMIs (3- and 4-way in this model with 4 loci). This is in contrast to Orr’s theoretical argument that predicts a very specific ratio of 2-way: 3-way: 4-way DMIs, equal to 12: 24: 14, which assumes that the fraction of viable paths from the common ancestor to the current day species increases as we consider higher order DMIs [<xref ref-type="bibr" rid="pcbi.1007177.ref005">5</xref>]. This argument partly rests on the assumption that the number of inviable genotypes remains fixed as a larger number of loci are considered, which would seem a very strong assumption. Despite its simplicity, the genotype-phenotype map in this paper has many of the key features required for higher levels of epistasis, with protein-DNA binding, protein-protein binding and control of the morphogen steepness, all interacting in a non-linear fashion to produce a single gene expression patterning phenotype and so there is clearly the potential for the Orr prediction to be verified; in contrast, we find the converse and our results show there is no bias towards 3-way DMIs, in fact showing instead that the ratio of 2-way to 3-way DMIs is at short times many orders of magnitude larger. This suggests, in this simple, but still relatively complex model, that biophysical constraints are far more important than a purely combinatorial argument would suggest. Evidence could be obtained from more detailed studies similar to [<xref ref-type="bibr" rid="pcbi.1007177.ref006">6</xref>, <xref ref-type="bibr" rid="pcbi.1007177.ref070">70</xref>], where a power law with an exponent greater than 2 would indicate higher-order DMIs are dominant; currently this evidence suggests a quadratic growth law, however, a study with more time-points or species-pairs would provide more confidence. An alternative approach would be to look for linkage disequilibrium between unlinked regions of hybrid genomes, such as was found with hybrids of two species of swordtail fish [<xref ref-type="bibr" rid="pcbi.1007177.ref071">71</xref>], and though computationally challenging and requiring large numbers of parallel datasets, compare this against evidence for pervasiveness of higher order epistasis. Although recent results of [<xref ref-type="bibr" rid="pcbi.1007177.ref072">72</xref>], would seem to contradict our conclusions, their finding of extensive complex epistasis relates to higher order interactions between sites within a single locus, coding for protein stability or enzymatic activity, whereas our work relates to epistasis between multiple loci. Similarly, the results of hybrid incompatibilities within RNA molecules [<xref ref-type="bibr" rid="pcbi.1007177.ref073">73</xref>], which show a ‘spiralling complexity’ of DMIs would appear to be of limited biological relevance to allopatric speciation in higher organisms, as these are related to epistasis within a single locus, which are unlikely to segregate into different recombinants in a hybrid.</p>
</sec>
<sec id="sec018">
<title>Symmetry breaking at large population sizes</title>
<p>Finally, for small populations we find clustering in the behaviours of growth of different types of DMIs, in particular, 3-way DMIs (<xref ref-type="supplementary-material" rid="pcbi.1007177.s001">S1 Text</xref>), which can be explained by the different sequence entropy constraints on different molecular phenotypes. This degeneracy is then lifted at larger population sizes and each <italic>n</italic>-way DMI takes on a different identity in their pattern of growth; this has strong analogy to physical phenomenon in statistical physics where constraints of symmetry dominate at large temperatures, in a regime where noise is important, but at smaller temperatures this symmetry is broken.</p>
</sec>
<sec id="sec019">
<title>Future directions</title>
<p>A clear future direction to investigate would be the effect of multiple transcription factors binding to enhancer regions to control gene expression [<xref ref-type="bibr" rid="pcbi.1007177.ref074">74</xref>–<xref ref-type="bibr" rid="pcbi.1007177.ref076">76</xref>] in large gene networks, where there is potential scope for complex epistasis across many loci coding for a large number of transcription factors. However, as our results show, despite the possibility and a prior expectation of a larger number of triplet interactions, pair-wise interactions dominate; for complex transcriptional control, if pair-wise interactions between proteins, and proteins and DNA dominate, for example in determining the binding affinity of transcriptional complexes, then our conclusions would hold. As we broaden the scope to large gene regulatory networks, there is no strong and direct empirical evidence for pervasive higher order epistasis in their function, which could give rise to higher order incompatibilities being dominant [<xref ref-type="bibr" rid="pcbi.1007177.ref077">77</xref>]. Specifically, although there is evidence that higher order incompatibilities have arisen in natural populations [<xref ref-type="bibr" rid="pcbi.1007177.ref078">78</xref>–<xref ref-type="bibr" rid="pcbi.1007177.ref081">81</xref>], nonetheless a survey of these findings suggest there is no evidence for their dominance [<xref ref-type="bibr" rid="pcbi.1007177.ref081">81</xref>] as would be predicted by Orr and would be consistent with our findings that point towards biophysics providing a stronger constraint.</p>
</sec>
<sec id="sec020">
<title>Conclusions</title>
<p>Overall, our results point to a basic principle, where developmental system drift or cryptic variation [<xref ref-type="bibr" rid="pcbi.1007177.ref007">7</xref>, <xref ref-type="bibr" rid="pcbi.1007177.ref010">10</xref>, <xref ref-type="bibr" rid="pcbi.1007177.ref011">11</xref>, <xref ref-type="bibr" rid="pcbi.1007177.ref043">43</xref>], play a key role in speciation; basic body plans or phenotypes are conserved, but co-evolution of the components and loci of complicated gene regulatory networks can change differently in different lineages, giving incompatibilities that grow in allopatry. Here, we suggest a universal mechanism, where the rate of growth of incompatibilities is controlled by the drift load, or distribution of phenotypic values, of the common ancestor, which in turn is determined by a balance between selection pushing populations towards phenotypes of higher fitness and genetic drift pushing them towards phenotypes that are more numerous (higher sequence entropy); this basic mechanism would predict in general that traits under weaker selection will dominant the initial development of reproductive isolation. In particular, although in principle more complicated regulation could give rise to more complex patterns of epistasis [<xref ref-type="bibr" rid="pcbi.1007177.ref005">5</xref>], our findings suggest that more simple, pair-wise, incompatibilities dominate the development of reproductive isolation between allopatric lineages under stabilising selection.</p>
</sec>
</sec>
<sec id="sec021" sec-type="materials|methods">
<title>Methods</title>
<sec id="sec022">
<title>Details of the GP map</title>
<p>We model the binding energies of proteins to DNA using the “two-state” approximation [<xref ref-type="bibr" rid="pcbi.1007177.ref051">51</xref>, <xref ref-type="bibr" rid="pcbi.1007177.ref052">52</xref>], which assumes that the binding energy of each amino acid-nucleotide interaction at the binding interface is additive and to a good approximation controlled by the number of mismatches, which each have the same penalty in binding affinity. The various protein-DNA binding energies in the main text are then given by the Hamming distance between the respective sequences. We assume these energies <italic>E</italic> are measured relative the background free energy of specific and non-specific binding all other sites in the genome, such that the probability of a given transcription factor being bound to a single site is <italic>p</italic> = 1/(1+<italic>e</italic><sup>(<italic>E</italic>−<italic>μ</italic>)/<italic>k</italic><sub><italic>B</italic></sub><italic>T</italic></sup>), where <italic>μ</italic> is the chemical potential (∼log(concentration)) of the TF [<xref ref-type="bibr" rid="pcbi.1007177.ref017">17</xref>, <xref ref-type="bibr" rid="pcbi.1007177.ref026">26</xref>, <xref ref-type="bibr" rid="pcbi.1007177.ref082">82</xref>]. For example, the binding energy between the morphogen (<italic>M</italic>) and the first binding site (<italic>B</italic>) is given by 
<disp-formula id="pcbi.1007177.e007"><alternatives><graphic id="pcbi.1007177.e007g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pcbi.1007177.e007" xlink:type="simple"/><mml:math display="block" id="M7"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="right"><mml:mrow><mml:msub><mml:mi>E</mml:mi> <mml:mrow><mml:mi>M</mml:mi> <mml:mi>B</mml:mi></mml:mrow></mml:msub> <mml:mo>=</mml:mo> <mml:msub><mml:mi>ϵ</mml:mi> <mml:mrow><mml:mi>p</mml:mi> <mml:mi>d</mml:mi></mml:mrow></mml:msub> <mml:mspace width="0.166667em"/><mml:mi>ρ</mml:mi> <mml:mrow><mml:mo>(</mml:mo> <mml:msub><mml:mi mathvariant="bold">g</mml:mi> <mml:mi>m</mml:mi></mml:msub> <mml:mo>,</mml:mo> <mml:msub><mml:mi mathvariant="bold">g</mml:mi> <mml:mi>B</mml:mi></mml:msub> <mml:mo>)</mml:mo></mml:mrow></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives> <label>(3)</label></disp-formula>
where <italic>ρ</italic>(<italic><bold>g</bold></italic><sub><italic>m</italic></sub>, <italic><bold>g</bold></italic><sub><italic>B</italic></sub>) is the Hamming distance between the protein binding sequence (<italic><bold>g</bold></italic><sub><italic>m</italic></sub>) for the morphogen and the sequence for a first regulatory binding site (<italic><bold>g</bold></italic><sub><italic>B</italic></sub>), where <italic>ϵ</italic><sub><italic>pd</italic></sub> is the cost in energy for each mismatch. We assume <italic>ϵ</italic><sub><italic>pd</italic></sub> = 2<italic>k</italic><sub><italic>B</italic></sub><italic>T</italic> as a typical value for the mis-match energy, which are found to be in the range 1−3<italic>k</italic><sub><italic>B</italic></sub><italic>T</italic> [<xref ref-type="bibr" rid="pcbi.1007177.ref051">51</xref>, <xref ref-type="bibr" rid="pcbi.1007177.ref052">52</xref>]. Similarly the co-operative protein-protein binding energy, for example between RNAP and the morphogen is <inline-formula id="pcbi.1007177.e008"><alternatives><graphic id="pcbi.1007177.e008g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pcbi.1007177.e008" xlink:type="simple"/><mml:math display="inline" id="M8"><mml:msub><mml:mover accent="true"><mml:mi>E</mml:mi> <mml:mo>˜</mml:mo></mml:mover> <mml:mrow><mml:mi>R</mml:mi> <mml:mi>M</mml:mi></mml:mrow></mml:msub></mml:math></alternatives></inline-formula> is
<disp-formula id="pcbi.1007177.e009"><alternatives><graphic id="pcbi.1007177.e009g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pcbi.1007177.e009" xlink:type="simple"/><mml:math display="block" id="M9"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="right"><mml:mrow><mml:msub><mml:mover accent="true"><mml:mi>E</mml:mi> <mml:mo>˜</mml:mo></mml:mover> <mml:mrow><mml:mi>R</mml:mi> <mml:mi>M</mml:mi></mml:mrow></mml:msub> <mml:mo>=</mml:mo> <mml:msub><mml:mi>ϵ</mml:mi> <mml:mrow><mml:mi>p</mml:mi> <mml:mi>p</mml:mi></mml:mrow></mml:msub> <mml:mrow><mml:mo>(</mml:mo> <mml:msub><mml:mi>ℓ</mml:mi> <mml:mrow><mml:mi>p</mml:mi> <mml:mi>p</mml:mi></mml:mrow></mml:msub> <mml:mo>-</mml:mo> <mml:mi>ρ</mml:mi> <mml:mrow><mml:mo>(</mml:mo> <mml:msub><mml:mi mathvariant="bold">g</mml:mi> <mml:mi>R</mml:mi></mml:msub> <mml:mo>,</mml:mo> <mml:mover accent="true"><mml:msub><mml:mi mathvariant="bold">g</mml:mi> <mml:mi>M</mml:mi></mml:msub> <mml:mo>˘</mml:mo></mml:mover> <mml:mo>)</mml:mo></mml:mrow> <mml:mo>)</mml:mo></mml:mrow></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives> <label>(4)</label></disp-formula>
where <italic><bold>g</bold></italic><sub><italic>R</italic></sub> is the sequence involved in protein-protein interactions for the polymerase, and <inline-formula id="pcbi.1007177.e010"><alternatives><graphic id="pcbi.1007177.e010g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pcbi.1007177.e010" xlink:type="simple"/><mml:math display="inline" id="M10"><mml:mover accent="true"><mml:msub><mml:mi mathvariant="bold-italic">g</mml:mi> <mml:mi>M</mml:mi></mml:msub> <mml:mo>˘</mml:mo></mml:mover></mml:math></alternatives></inline-formula> represents the equivalent binary sequence for the morphogen, flipped about its centre, which mimics the chirality of real proteins and prevents the co-operative stability from always being maximum for homo-dimers. The parameter <italic>ϵ</italic><sub><italic>pp</italic></sub> is the stability added for each favourable hydrophobic interaction between amino acids, which we assume to be <italic>ϵ</italic><sub><italic>pp</italic></sub> = −<italic>k</italic><sub><italic>B</italic></sub><italic>T</italic>. Given <italic>ℓ</italic><sub><italic>pp</italic></sub> = 5 this gives interactions consistent with typical literature values of −2 to −7<italic>k</italic><sub><italic>B</italic></sub><italic>T</italic> for hydrophobic interactions between proteins [<xref ref-type="bibr" rid="pcbi.1007177.ref028">28</xref>, <xref ref-type="bibr" rid="pcbi.1007177.ref083">83</xref>].</p>
<p>The morphogen concentration profile is approximately exponential; the exact profile we use is
<disp-formula id="pcbi.1007177.e011"><alternatives><graphic id="pcbi.1007177.e011g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pcbi.1007177.e011" xlink:type="simple"/><mml:math display="block" id="M11"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="right"><mml:mrow><mml:mrow><mml:mo>[</mml:mo> <mml:mi>M</mml:mi> <mml:mo>]</mml:mo></mml:mrow> <mml:mrow><mml:mo>(</mml:mo> <mml:mi>x</mml:mi> <mml:mo>)</mml:mo></mml:mrow> <mml:mo>=</mml:mo> <mml:mrow><mml:mo>[</mml:mo> <mml:msub><mml:mi>M</mml:mi> <mml:mn>0</mml:mn></mml:msub> <mml:mo>]</mml:mo></mml:mrow> <mml:mfrac><mml:mrow><mml:mtext>cosh</mml:mtext> <mml:mo>(</mml:mo> <mml:mi>α</mml:mi> <mml:mo>(</mml:mo> <mml:mi>x</mml:mi> <mml:mo>-</mml:mo> <mml:mi>L</mml:mi> <mml:mo>)</mml:mo> <mml:mo>)</mml:mo></mml:mrow> <mml:mrow><mml:mtext>sinh</mml:mtext> <mml:mo>(</mml:mo> <mml:mi>α</mml:mi> <mml:mi>L</mml:mi> <mml:mo>)</mml:mo></mml:mrow></mml:mfrac></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives> <label>(5)</label></disp-formula>
where this arises from solving the reaction-diffusion equation with reflecting boundary conditions and is valid for all <italic>α</italic>.</p>
</sec>
<sec id="sec023">
<title>Probability of RNAP being bound to promoter</title>
<p>To calculate this probability, we use the canonical ensemble of statistical mechanics, for which the partition function <inline-formula id="pcbi.1007177.e012"><alternatives><graphic id="pcbi.1007177.e012g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pcbi.1007177.e012" xlink:type="simple"/><mml:math display="inline" id="M12"><mml:mi mathvariant="script">Z</mml:mi></mml:math></alternatives></inline-formula> is most simply expressed in terms of a spin-like variable, which represents the occupation of each binding site, <inline-formula id="pcbi.1007177.e013"><alternatives><graphic id="pcbi.1007177.e013g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pcbi.1007177.e013" xlink:type="simple"/><mml:math display="inline" id="M13"><mml:mrow><mml:msub><mml:mi>σ</mml:mi> <mml:mi>j</mml:mi></mml:msub> <mml:mo>=</mml:mo> <mml:mrow><mml:mo>{</mml:mo> <mml:mn mathvariant="sans-serif">0</mml:mn> <mml:mo>,</mml:mo> <mml:mi>R</mml:mi> <mml:mo>,</mml:mo> <mml:mi>M</mml:mi> <mml:mo>}</mml:mo></mml:mrow></mml:mrow></mml:math></alternatives></inline-formula>,
<disp-formula id="pcbi.1007177.e014"><alternatives><graphic id="pcbi.1007177.e014g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pcbi.1007177.e014" xlink:type="simple"/><mml:math display="block" id="M14"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="right"><mml:mrow><mml:mi mathvariant="script">Z</mml:mi> <mml:mo>=</mml:mo> <mml:munder><mml:mo>∑</mml:mo> <mml:msub><mml:mi>σ</mml:mi> <mml:mi>P</mml:mi></mml:msub></mml:munder> <mml:munder><mml:mo>∑</mml:mo> <mml:msub><mml:mi>σ</mml:mi> <mml:mi>B</mml:mi></mml:msub></mml:munder> <mml:msup><mml:mi>e</mml:mi> <mml:mrow><mml:mo>-</mml:mo> <mml:mrow><mml:mo>(</mml:mo> <mml:msub><mml:mi>E</mml:mi> <mml:mrow><mml:msub><mml:mi>σ</mml:mi> <mml:mi>P</mml:mi></mml:msub> <mml:mi>P</mml:mi></mml:mrow></mml:msub> <mml:mo>+</mml:mo> <mml:msub><mml:mi>E</mml:mi> <mml:mrow><mml:msub><mml:mi>σ</mml:mi> <mml:mi>B</mml:mi></mml:msub> <mml:mi>B</mml:mi></mml:mrow></mml:msub> <mml:mo>-</mml:mo> <mml:msub><mml:mi>μ</mml:mi> <mml:msub><mml:mi>σ</mml:mi> <mml:mi>P</mml:mi></mml:msub></mml:msub> <mml:mo>-</mml:mo> <mml:msub><mml:mi>μ</mml:mi> <mml:msub><mml:mi>σ</mml:mi> <mml:mi>B</mml:mi></mml:msub></mml:msub> <mml:mo>+</mml:mo> <mml:msub><mml:mover accent="true"><mml:mi>E</mml:mi> <mml:mo>˜</mml:mo></mml:mover> <mml:mrow><mml:msub><mml:mi>σ</mml:mi> <mml:mi>P</mml:mi></mml:msub> <mml:msub><mml:mi>σ</mml:mi> <mml:mi>B</mml:mi></mml:msub></mml:mrow></mml:msub> <mml:mo>)</mml:mo></mml:mrow> <mml:mo>/</mml:mo> <mml:msub><mml:mi>k</mml:mi> <mml:mi>B</mml:mi></mml:msub> <mml:mi>T</mml:mi></mml:mrow></mml:msup></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives></disp-formula>
with <inline-formula id="pcbi.1007177.e015"><alternatives><graphic id="pcbi.1007177.e015g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pcbi.1007177.e015" xlink:type="simple"/><mml:math display="inline" id="M15"><mml:mrow><mml:msub><mml:mi>E</mml:mi> <mml:mrow><mml:mn mathvariant="sans-serif">0</mml:mn> <mml:mi>j</mml:mi></mml:mrow></mml:msub> <mml:mo>=</mml:mo> <mml:mn>0</mml:mn></mml:mrow></mml:math></alternatives></inline-formula>, <inline-formula id="pcbi.1007177.e016"><alternatives><graphic id="pcbi.1007177.e016g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pcbi.1007177.e016" xlink:type="simple"/><mml:math display="inline" id="M16"><mml:mrow><mml:msub><mml:mover accent="true"><mml:mi>E</mml:mi> <mml:mo>˜</mml:mo></mml:mover> <mml:mrow><mml:mi>i</mml:mi> <mml:msup><mml:mi>i</mml:mi> <mml:mo>′</mml:mo></mml:msup></mml:mrow></mml:msub> <mml:mo>=</mml:mo> <mml:mn>0</mml:mn></mml:mrow></mml:math></alternatives></inline-formula>, for either <italic>i</italic> = 0 or <italic>i</italic>′ = 0 and <italic>μ</italic><sub>0</sub> = 0, where <inline-formula id="pcbi.1007177.e017"><alternatives><graphic id="pcbi.1007177.e017g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pcbi.1007177.e017" xlink:type="simple"/><mml:math display="inline" id="M17"><mml:mrow><mml:msub><mml:mi>μ</mml:mi> <mml:msub><mml:mi>σ</mml:mi> <mml:mi>j</mml:mi></mml:msub></mml:msub> <mml:mo>=</mml:mo> <mml:msub><mml:mi>k</mml:mi> <mml:mi>B</mml:mi></mml:msub> <mml:mi>T</mml:mi> <mml:mo form="prefix">ln</mml:mo> <mml:mrow><mml:mo>[</mml:mo> <mml:msub><mml:mi>σ</mml:mi> <mml:mi>j</mml:mi></mml:msub> <mml:mo>]</mml:mo></mml:mrow></mml:mrow></mml:math></alternatives></inline-formula> represents the chemical potentials of the protein species at the <italic>j</italic><sup><italic>th</italic></sup> binding site with [<italic>σ</italic><sub><italic>j</italic></sub>] being the concentration of species <italic>σ</italic><sub><italic>j</italic></sub> and 0 represents a free binding site. Formally this construction is known as a 3−state Pott’s model. So given a ‘genome’ <italic><bold>G</bold></italic> = [<italic><bold>g</bold></italic><sub><italic>R</italic></sub>, <italic><bold>g</bold></italic><sub><italic>r</italic></sub>, <italic><bold>g</bold></italic><sub><italic>M</italic></sub>, <italic><bold>g</bold></italic><sub><italic>m</italic></sub> <italic><bold>g</bold></italic><sub><italic>P</italic></sub>, <italic><bold>g</bold></italic><sub><italic>B</italic></sub>] from which the protein-DNA and protein-protein binding energies are calculated (<italic>E</italic><sub><italic>ij</italic></sub> and <inline-formula id="pcbi.1007177.e019"><alternatives><graphic id="pcbi.1007177.e019g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pcbi.1007177.e019" xlink:type="simple"/><mml:math display="inline" id="M19"><mml:msub><mml:mover accent="true"><mml:mi>E</mml:mi> <mml:mo>˜</mml:mo></mml:mover> <mml:mrow><mml:mi>i</mml:mi> <mml:msup><mml:mi>i</mml:mi> <mml:mo>′</mml:mo></mml:msup></mml:mrow></mml:msub></mml:math></alternatives></inline-formula>, respectively), <italic>p</italic><sub><italic>RP</italic></sub> is given schematically by
<disp-formula id="pcbi.1007177.e020"><alternatives><graphic id="pcbi.1007177.e020g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pcbi.1007177.e020" xlink:type="simple"/><mml:math display="block" id="M20"><mml:mrow><mml:mtable><mml:mtr><mml:mtd><mml:mrow><mml:msub><mml:mi>p</mml:mi><mml:mrow><mml:mi>R</mml:mi><mml:mi>P</mml:mi></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:mi>p</mml:mi><mml:mrow><mml:mo>(</mml:mo><mml:mrow><mml:msub><mml:mi>σ</mml:mi><mml:mi>B</mml:mi></mml:msub><mml:mo>−</mml:mo><mml:mi>R</mml:mi><mml:mspace width="2pt"/><mml:mo>↱</mml:mo></mml:mrow><mml:mo>)</mml:mo></mml:mrow><mml:mo>=</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:mi mathvariant="script">Z</mml:mi></mml:mfrac><mml:mrow><mml:mo>(</mml:mo><mml:mrow><mml:mrow><mml:mo>(</mml:mo><mml:mrow><mml:mn>0</mml:mn><mml:mo>−</mml:mo><mml:mi>R</mml:mi><mml:mspace width="2pt"/><mml:mo>↱</mml:mo></mml:mrow><mml:mo>)</mml:mo></mml:mrow><mml:mo>+</mml:mo><mml:mrow><mml:mo>(</mml:mo><mml:mrow><mml:mi>M</mml:mi><mml:mo>−</mml:mo><mml:mi>R</mml:mi><mml:mspace width="2pt"/><mml:mo>↱</mml:mo></mml:mrow><mml:mo>)</mml:mo></mml:mrow><mml:mo>+</mml:mo><mml:mrow><mml:mo>(</mml:mo><mml:mrow><mml:mi>R</mml:mi><mml:mo>−</mml:mo><mml:mi>R</mml:mi><mml:mspace width="2pt"/><mml:mo>↱</mml:mo></mml:mrow><mml:mo>)</mml:mo></mml:mrow></mml:mrow><mml:mo>)</mml:mo></mml:mrow></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:mrow></mml:math></alternatives> <label>(6)</label></disp-formula>
where, for example,
<disp-formula id="pcbi.1007177.e021"><alternatives><graphic id="pcbi.1007177.e021g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pcbi.1007177.e021" xlink:type="simple"/><mml:math display="block" id="M21"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="right"><mml:mrow><mml:mrow><mml:mo>(</mml:mo> <mml:mstyle displaystyle="false" scriptlevel="1"><mml:mrow><mml:mi>M</mml:mi> <mml:mo>-</mml:mo> <mml:mi>R</mml:mi></mml:mrow></mml:mstyle> <mml:mo>↱</mml:mo> <mml:mo>)</mml:mo></mml:mrow> <mml:mo>≡</mml:mo> <mml:msup><mml:mi>e</mml:mi> <mml:mrow><mml:mo>-</mml:mo> <mml:mrow><mml:mo>(</mml:mo> <mml:msub><mml:mi>E</mml:mi> <mml:mrow><mml:mi>R</mml:mi> <mml:mi>P</mml:mi></mml:mrow></mml:msub> <mml:mo>+</mml:mo> <mml:msub><mml:mi>E</mml:mi> <mml:mrow><mml:mi>M</mml:mi> <mml:mi>B</mml:mi></mml:mrow></mml:msub> <mml:mo>-</mml:mo> <mml:msub><mml:mi>μ</mml:mi> <mml:mi>R</mml:mi></mml:msub> <mml:mo>-</mml:mo> <mml:msub><mml:mi>μ</mml:mi> <mml:mi>M</mml:mi></mml:msub> <mml:mo>+</mml:mo> <mml:msub><mml:mover accent="true"><mml:mi>E</mml:mi> <mml:mo>˜</mml:mo></mml:mover> <mml:mrow><mml:mi>R</mml:mi> <mml:mi>M</mml:mi></mml:mrow></mml:msub> <mml:mo>)</mml:mo></mml:mrow> <mml:mo>/</mml:mo> <mml:msub><mml:mi>k</mml:mi> <mml:mi>B</mml:mi></mml:msub> <mml:mi>T</mml:mi></mml:mrow></mml:msup></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives></disp-formula>
is the Boltzmann factor for co-operative binding of the morphogen and RNAP to <inline-formula id="pcbi.1007177.e022"><alternatives><graphic id="pcbi.1007177.e022g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pcbi.1007177.e022" xlink:type="simple"/><mml:math display="inline" id="M22"><mml:mi mathvariant="script">R</mml:mi></mml:math></alternatives></inline-formula>. Note that we ignore in the partition sum protein-protein binding when not bound to DNA, since these co-operative binding energies tend to be relatively weak compared to DNA binding.</p>
</sec>
<sec id="sec024">
<title>Monte Carlo scheme for speciation simulations</title>
<p>We use a kinetic Monte Carlo scheme to simulate the evolutionary process for the genome <italic><bold>G</bold></italic> and <italic>α</italic> on two independent lineages, assuming a fixed effective population size of <italic>N</italic>, and that we are in the regime of small effective population size (<italic>ℓ</italic><sub><italic><bold>G</bold></italic></sub> <italic>μ</italic><sub>0</sub><italic>N</italic> ≪ 1, where <italic>μ</italic><sub>0</sub> is the base-pair mutation rate). This means the population is represented by a single fixed sequence (or number for <italic>α</italic>) for all of the loci at each time-point, where effectively mutations are either instantly fixed or eliminated. Specifically, we use the Gillespie algorithm [<xref ref-type="bibr" rid="pcbi.1007177.ref084">84</xref>], to simulate evolution as a continuous time Markov process; at each step of the simulation the rate of fixation of all one-step mutations from the currently fixed alleles (wild type) is calculated, and one of these mutations is selected randomly in proportion to their relative rate. Time is then progressed by <italic>K</italic><sup>−1</sup> ln(<italic>u</italic>), where <italic>K</italic> is the sum of the rates of all one-step mutants and <italic>u</italic> is a random number drawn independently between 0 and 1, which ensures the times at which substitutions occur is Poisson distributed, as we would be expected for a random substitution process. The rates are based upon the Kimura probability of fixation [<xref ref-type="bibr" rid="pcbi.1007177.ref085">85</xref>]:
<disp-formula id="pcbi.1007177.e023"><alternatives><graphic id="pcbi.1007177.e023g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pcbi.1007177.e023" xlink:type="simple"/><mml:math display="block" id="M23"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="right"><mml:mrow><mml:mi>k</mml:mi> <mml:mo>=</mml:mo> <mml:msub><mml:mi>μ</mml:mi> <mml:mn>0</mml:mn></mml:msub> <mml:mi>N</mml:mi> <mml:mfrac><mml:mrow><mml:mn>1</mml:mn> <mml:mo>-</mml:mo> <mml:msup><mml:mi>e</mml:mi> <mml:mrow><mml:mo>-</mml:mo> <mml:mn>2</mml:mn> <mml:mi>δ</mml:mi> <mml:mi>F</mml:mi></mml:mrow></mml:msup></mml:mrow> <mml:mrow><mml:mn>1</mml:mn> <mml:mo>-</mml:mo> <mml:msup><mml:mi>e</mml:mi> <mml:mrow><mml:mo>-</mml:mo> <mml:mn>2</mml:mn> <mml:mi>N</mml:mi> <mml:mi>δ</mml:mi> <mml:mi>F</mml:mi></mml:mrow></mml:msup></mml:mrow></mml:mfrac> <mml:mo>≈</mml:mo> <mml:msub><mml:mi>μ</mml:mi> <mml:mn>0</mml:mn></mml:msub> <mml:mfrac><mml:mrow><mml:mn>2</mml:mn> <mml:mi>N</mml:mi> <mml:mi>δ</mml:mi> <mml:mi>F</mml:mi></mml:mrow> <mml:mrow><mml:mn>1</mml:mn> <mml:mo>-</mml:mo> <mml:msup><mml:mi>e</mml:mi> <mml:mrow><mml:mo>-</mml:mo> <mml:mn>2</mml:mn> <mml:mi>N</mml:mi> <mml:mi>δ</mml:mi> <mml:mi>F</mml:mi></mml:mrow></mml:msup></mml:mrow></mml:mfrac> <mml:mo>,</mml:mo></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives> <label>(7)</label></disp-formula>
where <italic>δF</italic> is the change of fitness of a mutation at a particular location, given by fitness function defined in the main text, and <italic>μ</italic><sub>0</sub><italic>N</italic> is the rate at which mutations arise in the population; the latter approximation in <xref ref-type="disp-formula" rid="pcbi.1007177.e023">Eq 7</xref> assumes <italic>δF</italic> ≪ 1. Note that although in the simulations we use the full form for the fixation probability, fitness effects are typically small (<italic>δF</italic> ≪ 1) in the simulations, so the substitution rates only depend on the population-scaled fitness changes 2<italic>NδF</italic> which, for a given mutation, is proportional to 2<italic>Nκ</italic><sub><italic>F</italic></sub>. Finally, we allow continuous ‘mutations’ in the morphogen steepness parameter <italic>α</italic>, chosen from a Gaussian distribution of standard deviation <italic>δα</italic> = 0.5 and assign it an 10 effective base-pairs, which are used when assigning relative weight in the kinetic Monte Carlo scheme, where the total number of base-pairs is <italic>ℓ</italic><sub><italic><bold>G</bold></italic></sub> = 60.</p>
<p>We determine the Malthusian or log fitness of the spatial gene regulation, from the resulting concentration profile [<italic>TF</italic>](<italic>x</italic>) by use of a functional that promotes expression of the<italic>TF</italic> in the anterior half, whilst penalising expression in the posterior half, with truncation selection below a critical value <italic>F</italic>*:
<disp-formula id="pcbi.1007177.e024"><alternatives><graphic id="pcbi.1007177.e024g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pcbi.1007177.e024" xlink:type="simple"/><mml:math display="block" id="M24"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="right"><mml:mrow><mml:mi>F</mml:mi> <mml:mo>=</mml:mo> <mml:mo>{</mml:mo> <mml:mtable><mml:mtr><mml:mtd><mml:mrow><mml:msub><mml:mi>κ</mml:mi> <mml:mi>F</mml:mi></mml:msub> <mml:mo form="prefix">ln</mml:mo> <mml:mrow><mml:mo>(</mml:mo> <mml:mi mathvariant="script">W</mml:mi> <mml:mo>)</mml:mo></mml:mrow> <mml:mspace width="1.em"/><mml:mtext>if</mml:mtext> <mml:mspace width="4pt"/><mml:msub><mml:mi>κ</mml:mi> <mml:mi>F</mml:mi></mml:msub> <mml:mo form="prefix">ln</mml:mo> <mml:mrow><mml:mo>(</mml:mo> <mml:mi mathvariant="script">W</mml:mi> <mml:mo>)</mml:mo></mml:mrow> <mml:mo>&gt;</mml:mo> <mml:msup><mml:mi>F</mml:mi> <mml:mo>*</mml:mo></mml:msup></mml:mrow></mml:mtd></mml:mtr> <mml:mtr><mml:mtd><mml:mrow><mml:mo>-</mml:mo> <mml:mi>∞</mml:mi> <mml:mspace width="1.em"/><mml:mtext>if</mml:mtext> <mml:mspace width="4pt"/><mml:msub><mml:mi>κ</mml:mi> <mml:mi>F</mml:mi></mml:msub> <mml:mo form="prefix">ln</mml:mo> <mml:mrow><mml:mo>(</mml:mo> <mml:mi mathvariant="script">W</mml:mi> <mml:mo>)</mml:mo></mml:mrow> <mml:mo>&lt;</mml:mo> <mml:msup><mml:mi>F</mml:mi> <mml:mo>*</mml:mo></mml:msup></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives> <label>(8)</label></disp-formula>
where,
<disp-formula id="pcbi.1007177.e025"><alternatives><graphic id="pcbi.1007177.e025g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pcbi.1007177.e025" xlink:type="simple"/><mml:math display="block" id="M25"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="right"><mml:mrow><mml:mi mathvariant="script">W</mml:mi> <mml:mrow><mml:mo>[</mml:mo> <mml:mrow><mml:mo>[</mml:mo> <mml:mi>T</mml:mi> <mml:mi>F</mml:mi> <mml:mo>]</mml:mo></mml:mrow> <mml:mrow><mml:mo>(</mml:mo> <mml:mi>x</mml:mi> <mml:mo>)</mml:mo></mml:mrow> <mml:mo>]</mml:mo></mml:mrow> <mml:mo>=</mml:mo> <mml:mfrac><mml:mrow><mml:msubsup><mml:mo>∫</mml:mo> <mml:mn>0</mml:mn> <mml:mrow><mml:mi mathvariant="script">L</mml:mi> <mml:mo>/</mml:mo> <mml:mn>2</mml:mn></mml:mrow></mml:msubsup> <mml:mrow><mml:mo>[</mml:mo> <mml:mi>T</mml:mi> <mml:mi>F</mml:mi> <mml:mo>]</mml:mo></mml:mrow> <mml:mrow><mml:mo>(</mml:mo> <mml:mi>x</mml:mi> <mml:mo>)</mml:mo></mml:mrow> <mml:mi mathvariant="normal">d</mml:mi> <mml:mi>x</mml:mi> <mml:mo>-</mml:mo> <mml:msubsup><mml:mo>∫</mml:mo> <mml:mrow><mml:mi mathvariant="script">L</mml:mi> <mml:mo>/</mml:mo> <mml:mn>2</mml:mn></mml:mrow> <mml:mi mathvariant="script">L</mml:mi></mml:msubsup> <mml:mrow><mml:mo>[</mml:mo> <mml:mi>T</mml:mi> <mml:mi>F</mml:mi> <mml:mo>]</mml:mo></mml:mrow> <mml:mrow><mml:mo>(</mml:mo> <mml:mi>x</mml:mi> <mml:mo>)</mml:mo></mml:mrow> <mml:mi mathvariant="normal">d</mml:mi> <mml:mi>x</mml:mi></mml:mrow> <mml:mrow><mml:mfrac><mml:mi mathvariant="script">L</mml:mi> <mml:mn>2</mml:mn></mml:mfrac> <mml:msub><mml:mo form="prefix" movablelimits="true">max</mml:mo> <mml:mi>x</mml:mi></mml:msub> <mml:mrow><mml:mo>{</mml:mo> <mml:mrow><mml:mo>[</mml:mo> <mml:mi>T</mml:mi> <mml:mi>F</mml:mi> <mml:mo>]</mml:mo></mml:mrow> <mml:mrow><mml:mo>(</mml:mo> <mml:mi>x</mml:mi> <mml:mo>)</mml:mo></mml:mrow> <mml:mo>}</mml:mo></mml:mrow></mml:mrow></mml:mfrac> <mml:mo>.</mml:mo></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives> <label>(9)</label></disp-formula>
where we use a value of <italic>F</italic>* = −1.6 × 10<sup>−3</sup>, which corresponds a value of <inline-formula id="pcbi.1007177.e026"><alternatives><graphic id="pcbi.1007177.e026g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pcbi.1007177.e026" xlink:type="simple"/><mml:math display="inline" id="M26"><mml:mrow><mml:mi mathvariant="script">W</mml:mi> <mml:mo>≈</mml:mo> <mml:mn>0</mml:mn> <mml:mo>.</mml:mo> <mml:mn>2</mml:mn></mml:mrow></mml:math></alternatives></inline-formula>, when <italic>κ</italic><sub><italic>F</italic></sub> = 10<sup>−3</sup>. Strictly, an inviability on a lineage or a hybrid should correspond to <inline-formula id="pcbi.1007177.e027"><alternatives><graphic id="pcbi.1007177.e027g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pcbi.1007177.e027" xlink:type="simple"/><mml:math display="inline" id="M27"><mml:mrow><mml:mi mathvariant="script">W</mml:mi> <mml:mo>=</mml:mo> <mml:mn>0</mml:mn></mml:mrow></mml:math></alternatives></inline-formula> or <italic>F</italic>* = −∞, however, these values were chosen to so that a reasonable number of incompatibilities arise in a simulation; for comparison the typical maximum of the integral <inline-formula id="pcbi.1007177.e028"><alternatives><graphic id="pcbi.1007177.e028g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pcbi.1007177.e028" xlink:type="simple"/><mml:math display="inline" id="M28"><mml:mrow><mml:mi mathvariant="script">W</mml:mi> <mml:mo>≈</mml:mo> <mml:mn>0</mml:mn> <mml:mo>.</mml:mo> <mml:mn>6</mml:mn></mml:mrow></mml:math></alternatives></inline-formula>. In this paper, we explore how the changing the population scaled strength of selection (2<italic>Nκ</italic><sub><italic>F</italic></sub>) affects the rate of reproductive isolation, by keeping <italic>κ</italic><sub><italic>F</italic></sub> fixed and varying<italic>N</italic> accordingly. Note that although here the exact form of the fitness is slightly different to the one used in [<xref ref-type="bibr" rid="pcbi.1007177.ref017">17</xref>], the qualitative behaviour is the same (<xref ref-type="supplementary-material" rid="pcbi.1007177.s001">S1 Text</xref>).</p>
<p>The speciation simulations consist of two replicate simulations starting with the same common ancestor and with the same fitness function. We draw the common ancestor from the equilibrium distribution for <italic><bold>G</bold></italic> and <italic>α</italic>. To do this we start from a random initial genome, and run one long simulation for 100,000 substitutions for a fixed scaled population size 2<italic>Nκ</italic><sub><italic>F</italic></sub>, in order to effectively equilibrate the system (typically 10,000 substitutions are required to adapt to an ensemble of fit states). This represents a reference equilibrium state; different random draws from the equilibrium distribution then consist of running the simulation for a further 100 substitutions.</p>
</sec>
<sec id="sec025">
<title>Decomposing DMIs</title>
<p>Given a pattern of hybrid incompatibilities, for example, as shown in <xref ref-type="fig" rid="pcbi.1007177.g004">Fig 4</xref>, if there is a 2-way DMI (e.g. between <italic>C</italic> and <italic>α</italic> loci, which we denote <italic>I</italic><sub><monospace>Ca</monospace></sub>), then all four hybrid-genotypes containing this DMI (e.g. <monospace>RMCa</monospace>, <monospace>RmCa</monospace>, <monospace>rMCa</monospace>, <monospace>rmCa</monospace>) are inviable; these genotypes define a two-dimensional subspace (or face) of the hypercube. Similarly, the points (e.g. <monospace>rmcA</monospace>, <monospace>RmcA</monospace>, which we denote <italic>I</italic><sub><monospace>mcA</monospace></sub>) containing a 3-way DMI form a one-dimensional subspace (or line), while a 4-way DMI takes up only a single point in the four-dimensional hypercube. These different 2-way, 3-way and 4-way DMIs are the fundamental incompatibility types which we seek to explain the pattern of hybrid inviable genotypes observed, for example, as in <xref ref-type="fig" rid="pcbi.1007177.g004">Fig 4a</xref>.</p>
<p>However, this decomposition is hugely underdetermined, as there are only 2<sup>4</sup> − 2 = 14 possible hybrids (not including the well-adapted genotypes of line 1 and line 2) and a total of <italic>I</italic><sub><italic>max</italic></sub> = 3<sup><italic>L</italic></sup> + 1 − 2<sup><italic>L</italic>+1</sup> = 50, different fundamental incompatibilities, for <italic>L</italic> = 4 loci. This arises as the total number of <italic>n</italic>−point DMIs is <inline-formula id="pcbi.1007177.e029"><alternatives><graphic id="pcbi.1007177.e029g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pcbi.1007177.e029" xlink:type="simple"/><mml:math display="inline" id="M29"><mml:mrow><mml:mrow><mml:mo>(</mml:mo> <mml:msup><mml:mn>2</mml:mn> <mml:mi>n</mml:mi></mml:msup> <mml:mo>-</mml:mo> <mml:mn>2</mml:mn> <mml:mo>)</mml:mo></mml:mrow> <mml:mo>(</mml:mo> <mml:mfrac linethickness="0pt"><mml:mi>L</mml:mi> <mml:mi>n</mml:mi></mml:mfrac> <mml:mo>)</mml:mo></mml:mrow></mml:math></alternatives></inline-formula>, as there are <inline-formula id="pcbi.1007177.e030"><alternatives><graphic id="pcbi.1007177.e030g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pcbi.1007177.e030" xlink:type="simple"/><mml:math display="inline" id="M30"><mml:mo>(</mml:mo> <mml:mfrac linethickness="0pt"><mml:mi>L</mml:mi> <mml:mi>n</mml:mi></mml:mfrac> <mml:mo>)</mml:mo></mml:math></alternatives></inline-formula> combinations of<italic>N</italic> loci amongst <italic>L</italic> total loci and then considering a binary choice of alleles across both lines, there are a total of 2<sup><italic>n</italic></sup> allelic combinations or states, 2 of which are the fit allelic combinations where all alleles come from one lineage or the other giving 2<sup><italic>n</italic></sup> − 2. For example, between each pair of loci there are 2<sup>2</sup> − 2 = 2 mismatching combinations of alleles (e.g. <monospace>rM</monospace> and <monospace>Rm</monospace>) that could give DMIs and <inline-formula id="pcbi.1007177.e031"><alternatives><graphic id="pcbi.1007177.e031g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pcbi.1007177.e031" xlink:type="simple"/><mml:math display="inline" id="M31"><mml:mrow><mml:mo>(</mml:mo> <mml:mfrac linethickness="0pt"><mml:mi>L</mml:mi> <mml:mn>2</mml:mn></mml:mfrac> <mml:mo>)</mml:mo> <mml:mo>=</mml:mo> <mml:mi>L</mml:mi> <mml:mrow><mml:mo>(</mml:mo> <mml:mi>L</mml:mi> <mml:mo>-</mml:mo> <mml:mn>1</mml:mn> <mml:mo>)</mml:mo></mml:mrow> <mml:mo>/</mml:mo> <mml:mn>2</mml:mn> <mml:mo>=</mml:mo> <mml:mn>6</mml:mn></mml:mrow></mml:math></alternatives></inline-formula> pairwise interactions. A similar argument would give a total of 24 3-way DMIs as there are 2<sup>3</sup> − 2 = 6 mismatching combinations of alleles at 3 loci (e.g., excluding <monospace>rmc</monospace> and <monospace>RMC</monospace>) and <inline-formula id="pcbi.1007177.e032"><alternatives><graphic id="pcbi.1007177.e032g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pcbi.1007177.e032" xlink:type="simple"/><mml:math display="inline" id="M32"><mml:mrow><mml:mo>(</mml:mo> <mml:mfrac linethickness="0pt"><mml:mi>L</mml:mi> <mml:mn>3</mml:mn></mml:mfrac> <mml:mo>)</mml:mo> <mml:mo>=</mml:mo> <mml:mn>4</mml:mn></mml:mrow></mml:math></alternatives></inline-formula> 3-way interactions and similarly, <inline-formula id="pcbi.1007177.e033"><alternatives><graphic id="pcbi.1007177.e033g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pcbi.1007177.e033" xlink:type="simple"/><mml:math display="inline" id="M33"><mml:mrow><mml:mn>14</mml:mn> <mml:mo>(</mml:mo> <mml:mfrac linethickness="0pt"><mml:mi>L</mml:mi> <mml:mn>4</mml:mn></mml:mfrac> <mml:mo>)</mml:mo> <mml:mo>=</mml:mo> <mml:mn>14</mml:mn></mml:mrow></mml:math></alternatives></inline-formula> for 4-way interactions. In total, the max number of DMIs is <inline-formula id="pcbi.1007177.e018"><alternatives><graphic id="pcbi.1007177.e018g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pcbi.1007177.e018" xlink:type="simple"/><mml:math display="inline" id="M18"><mml:mrow><mml:msub><mml:mi>I</mml:mi> <mml:mrow><mml:mi>m</mml:mi> <mml:mi>a</mml:mi> <mml:mi>x</mml:mi></mml:mrow></mml:msub> <mml:mo>=</mml:mo> <mml:msubsup><mml:mo>∑</mml:mo> <mml:mrow><mml:mi>n</mml:mi> <mml:mo>=</mml:mo> <mml:mn>2</mml:mn></mml:mrow> <mml:mi>L</mml:mi></mml:msubsup> <mml:mrow><mml:mo>(</mml:mo> <mml:msup><mml:mn>2</mml:mn> <mml:mi>n</mml:mi></mml:msup> <mml:mo>-</mml:mo> <mml:mn>2</mml:mn> <mml:mo>)</mml:mo></mml:mrow> <mml:mo>(</mml:mo> <mml:mfrac linethickness="0pt"><mml:mi>L</mml:mi> <mml:mi>n</mml:mi></mml:mfrac> <mml:mo>)</mml:mo> <mml:mo>=</mml:mo> <mml:msup><mml:mn>3</mml:mn> <mml:mi>L</mml:mi></mml:msup> <mml:mo>+</mml:mo> <mml:mn>1</mml:mn> <mml:mo>-</mml:mo> <mml:msup><mml:mn>2</mml:mn> <mml:mrow><mml:mi>L</mml:mi> <mml:mo>+</mml:mo> <mml:mn>1</mml:mn></mml:mrow></mml:msup></mml:mrow></mml:math></alternatives></inline-formula>, which for <italic>L</italic> = 4 loci is <italic>I</italic><sub><italic>max</italic></sub> = 50.</p>
<p>The approach we take is to find only those combinations of fundamental DMIs that have the smallest total number that can explain the pattern of hybrid incompatibilities, which from a Bayesian perspective would have the smallest Occam factors [<xref ref-type="bibr" rid="pcbi.1007177.ref086">86</xref>]; for instance, as shown in <xref ref-type="fig" rid="pcbi.1007177.g004">Fig 4b</xref> the list of 6 incompatible hybrid genotypes <monospace>rmCa</monospace>, <monospace>rMCa</monospace>,<monospace>RmCa</monospace>,<monospace>RMCa</monospace>,<monospace>Rmca</monospace>,<monospace>RMca</monospace>, shown by red crosses, can be explained most parsimoniously by three different minimal combinations of fundamental DMIs, each with only 2 DMIs (see main text).</p>
</sec>
</sec>
<sec id="sec026">
<title>Supporting information</title>
<supplementary-material id="pcbi.1007177.s001" mimetype="application/pdf" position="float" xlink:href="info:doi/10.1371/journal.pcbi.1007177.s001" xlink:type="simple">
<label>S1 Text</label>
<caption>
<title>Supporting figures and results.</title>
<p>(PDF)</p>
</caption>
</supplementary-material>
</sec>
</body>
<back>
<ack>
<p>We would like to thank Davis Pollock for initial discussions.</p>
</ack>
<ref-list>
<title>References</title>
<ref id="pcbi.1007177.ref001">
<label>1</label>
<mixed-citation publication-type="book" xlink:type="simple">
<name name-style="western"><surname>Darwin</surname> <given-names>CR</given-names></name>. <chapter-title>The Origin of Species</chapter-title>. <publisher-name>J. Murray</publisher-name>, <publisher-loc>London</publisher-loc>; <year>1859</year>.</mixed-citation>
</ref>
<ref id="pcbi.1007177.ref002">
<label>2</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Dobzhansky</surname> <given-names>T</given-names></name>. <article-title>Studies on Hybrid Sterility. II. Localization of Sterility Factors in Drosophila Pseudoobscura Hybrids</article-title>. <source>Genetics</source>. <year>1936</year>;<volume>21</volume>(<issue>2</issue>):<fpage>113</fpage>–<lpage>135</lpage>. <object-id pub-id-type="pmid">17246786</object-id></mixed-citation>
</ref>
<ref id="pcbi.1007177.ref003">
<label>3</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Muller</surname> <given-names>HJ</given-names></name>. <article-title>Isolating mechanisms, evolution and temperature</article-title>. <source>Biol Symp</source>. <year>1942</year>;<volume>6</volume>:<fpage>71</fpage>–<lpage>125</lpage>.</mixed-citation>
</ref>
<ref id="pcbi.1007177.ref004">
<label>4</label>
<mixed-citation publication-type="book" xlink:type="simple">
<name name-style="western"><surname>Bateson</surname> <given-names>W</given-names></name>. In: <name name-style="western"><surname>Seward</surname> <given-names>AC</given-names></name>, editor. <source>Darwin and Modern Science</source>. <publisher-name>Cambridge University Press</publisher-name>; <year>1909</year>. p. <fpage>85</fpage>–<lpage>101</lpage>.</mixed-citation>
</ref>
<ref id="pcbi.1007177.ref005">
<label>5</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Orr</surname> <given-names>HA</given-names></name>. <article-title>The population genetics of speciation: the evolution of hybrid incompatibilities</article-title>. <source>Genetics</source>. <year>1995</year>;<volume>139</volume>(<issue>4</issue>):<fpage>1805</fpage>–<lpage>1813</lpage>. <object-id pub-id-type="pmid">7789779</object-id></mixed-citation>
</ref>
<ref id="pcbi.1007177.ref006">
<label>6</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Matute</surname> <given-names>DR</given-names></name>, <name name-style="western"><surname>Coyne</surname> <given-names>JA</given-names></name>. <article-title>Intrinsic reproductive isolation between two sister species of Drosophila</article-title>. <source>Evolution</source>. <year>2010</year>;<volume>64</volume>(<issue>4</issue>):<fpage>903</fpage>–<lpage>920</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1111/j.1558-5646.2009.00879.x" xlink:type="simple">10.1111/j.1558-5646.2009.00879.x</ext-link></comment> <object-id pub-id-type="pmid">19891626</object-id></mixed-citation>
</ref>
<ref id="pcbi.1007177.ref007">
<label>7</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Verster</surname> <given-names>AJ</given-names></name>, <name name-style="western"><surname>Ramani</surname> <given-names>AK</given-names></name>, <name name-style="western"><surname>McKay</surname> <given-names>SJ</given-names></name>, <name name-style="western"><surname>Fraser</surname> <given-names>AG</given-names></name>. <article-title>Comparative RNAi screens in C. elegans and C. briggsae reveal the impact of developmental system drift on gene function</article-title>. <source>PLoS genetics</source>. <year>2014</year>;<volume>10</volume>(<issue>2</issue>):<fpage>e1004077</fpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1371/journal.pgen.1004077" xlink:type="simple">10.1371/journal.pgen.1004077</ext-link></comment> <object-id pub-id-type="pmid">24516395</object-id></mixed-citation>
</ref>
<ref id="pcbi.1007177.ref008">
<label>8</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Wotton</surname> <given-names>KR</given-names></name>, <name name-style="western"><surname>Jiménez-Guri</surname> <given-names>E</given-names></name>, <name name-style="western"><surname>Crombach</surname> <given-names>A</given-names></name>, <name name-style="western"><surname>Janssens</surname> <given-names>H</given-names></name>, <name name-style="western"><surname>Alcaine-Colet</surname> <given-names>A</given-names></name>, <name name-style="western"><surname>Lemke</surname> <given-names>S</given-names></name>, <etal>et al</etal>. <article-title>Quantitative system drift compensates for altered maternal inputs to the gap gene network of the scuttle fly Megaselia abdita</article-title>. <source>eLife</source>. <year>2015</year>;<volume>4</volume>:<fpage>e04785</fpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.7554/eLife.04785" xlink:type="simple">10.7554/eLife.04785</ext-link></comment></mixed-citation>
</ref>
<ref id="pcbi.1007177.ref009">
<label>9</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Crombach</surname> <given-names>A</given-names></name>, <name name-style="western"><surname>Wotton</surname> <given-names>KR</given-names></name>, <name name-style="western"><surname>Jiménez-Guri</surname> <given-names>E</given-names></name>, <name name-style="western"><surname>Jaeger</surname> <given-names>J</given-names></name>. <article-title>Gap Gene Regulatory Dynamics Evolve along a Genotype Network</article-title>. <source>Molecular Biology and Evolution</source>. <year>2016</year>;<volume>33</volume>(<issue>5</issue>):<fpage>1293</fpage>–<lpage>1307</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1093/molbev/msw013" xlink:type="simple">10.1093/molbev/msw013</ext-link></comment> <object-id pub-id-type="pmid">26796549</object-id></mixed-citation>
</ref>
<ref id="pcbi.1007177.ref010">
<label>10</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>True</surname> <given-names>JR</given-names></name>, <name name-style="western"><surname>Haag</surname> <given-names>ES</given-names></name>. <article-title>Developmental system drift and flexibility in evolutionary trajectories</article-title>. <source>Evolution &amp; development</source>. <year>2001</year>;<volume>3</volume>(<issue>2</issue>):<fpage>109</fpage>–<lpage>119</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1046/j.1525-142x.2001.003002109.x" xlink:type="simple">10.1046/j.1525-142x.2001.003002109.x</ext-link></comment></mixed-citation>
</ref>
<ref id="pcbi.1007177.ref011">
<label>11</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Haag</surname> <given-names>ES</given-names></name>. <article-title>The same but different: worms reveal the pervasiveness of developmental system drift</article-title>. <source>PLoS Genet</source>. <year>2014</year>;<volume>10</volume>(<issue>2</issue>):<fpage>e1004150</fpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1371/journal.pgen.1004150" xlink:type="simple">10.1371/journal.pgen.1004150</ext-link></comment> <object-id pub-id-type="pmid">24516407</object-id></mixed-citation>
</ref>
<ref id="pcbi.1007177.ref012">
<label>12</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Johnson</surname> <given-names>NA</given-names></name>, <name name-style="western"><surname>Porter</surname> <given-names>AH</given-names></name>. <article-title>Rapid speciation via parallel, directional selection on regulatory genetic pathways</article-title>. <source>Journal of Theoretical Biology</source>. <year>2000</year>;<volume>205</volume>(<issue>4</issue>):<fpage>527</fpage>–<lpage>542</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1006/jtbi.2000.2070" xlink:type="simple">10.1006/jtbi.2000.2070</ext-link></comment> <object-id pub-id-type="pmid">10931750</object-id></mixed-citation>
</ref>
<ref id="pcbi.1007177.ref013">
<label>13</label>
<mixed-citation publication-type="book" xlink:type="simple">
<name name-style="western"><surname>Johnson</surname> <given-names>NA</given-names></name>, <name name-style="western"><surname>Porter</surname> <given-names>AH</given-names></name>. <chapter-title>Toward a new synthesis: population genetics and evolutionary developmental biology</chapter-title>. In: <source>Microevolution Rate, Pattern, Process</source>. <publisher-name>Springer</publisher-name>; <year>2001</year>. p. <fpage>45</fpage>–<lpage>58</lpage>.</mixed-citation>
</ref>
<ref id="pcbi.1007177.ref014">
<label>14</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Fontana</surname> <given-names>W</given-names></name>. <article-title>Modelling’evo-devo’ with RNA</article-title>. <source>Bioessays</source>. <year>2002</year>;<volume>24</volume>(<issue>12</issue>):<fpage>1164</fpage>–<lpage>1177</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1002/bies.10190" xlink:type="simple">10.1002/bies.10190</ext-link></comment></mixed-citation>
</ref>
<ref id="pcbi.1007177.ref015">
<label>15</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Berg</surname> <given-names>J</given-names></name>, <name name-style="western"><surname>Willmann</surname> <given-names>S</given-names></name>, <name name-style="western"><surname>Lässig</surname> <given-names>M</given-names></name>. <article-title>Adaptive evolution of transcription factor binding sites</article-title>. <source>BMC Evol Biol</source>. <year>2004</year>;<volume>4</volume>(<issue>1</issue>):<fpage>42</fpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1186/1471-2148-4-42" xlink:type="simple">10.1186/1471-2148-4-42</ext-link></comment> <object-id pub-id-type="pmid">15511291</object-id></mixed-citation>
</ref>
<ref id="pcbi.1007177.ref016">
<label>16</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Mustonen</surname> <given-names>V</given-names></name>, <name name-style="western"><surname>Kinney</surname> <given-names>J</given-names></name>, <name name-style="western"><surname>Callan</surname> <given-names>CG</given-names></name>, <name name-style="western"><surname>Lässig</surname> <given-names>M</given-names></name>. <article-title>Energy-dependent fitness: a quantitative model for the evolution of yeast transcription factor binding sites</article-title>. <source>Proceedings of the National Academy of Sciences</source>. <year>2008</year>;<volume>105</volume>(<issue>34</issue>):<fpage>12376</fpage>–<lpage>12381</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1073/pnas.0805909105" xlink:type="simple">10.1073/pnas.0805909105</ext-link></comment></mixed-citation>
</ref>
<ref id="pcbi.1007177.ref017">
<label>17</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Khatri</surname> <given-names>BS</given-names></name>, <name name-style="western"><surname>McLeish</surname> <given-names>TCB</given-names></name>, <name name-style="western"><surname>Sear</surname> <given-names>RP</given-names></name>. <article-title>Statistical mechanics of convergent evolution in spatial patterning</article-title>. <source>Proc Natl Acad Sci U S A</source>. <year>2009</year>;<volume>106</volume>(<issue>24</issue>):<fpage>9564</fpage>–<lpage>9569</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1073/pnas.0812260106" xlink:type="simple">10.1073/pnas.0812260106</ext-link></comment> <object-id pub-id-type="pmid">19497876</object-id></mixed-citation>
</ref>
<ref id="pcbi.1007177.ref018">
<label>18</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Hayden</surname> <given-names>EJ</given-names></name>, <name name-style="western"><surname>Ferrada</surname> <given-names>E</given-names></name>, <name name-style="western"><surname>Wagner</surname> <given-names>A</given-names></name>. <article-title>Cryptic genetic variation promotes rapid evolutionary adaptation in an RNA enzyme</article-title>. <source>Nature</source>. <year>2011</year>;<volume>474</volume>(<issue>7349</issue>):<fpage>92</fpage>–<lpage>95</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1038/nature10083" xlink:type="simple">10.1038/nature10083</ext-link></comment> <object-id pub-id-type="pmid">21637259</object-id></mixed-citation>
</ref>
<ref id="pcbi.1007177.ref019">
<label>19</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Goldstein</surname> <given-names>RA</given-names></name>. <article-title>The evolution and evolutionary consequences of marginal thermostability in proteins</article-title>. <source>Proteins: Structure, Function, and Bioinformatics</source>. <year>2011</year>;<volume>79</volume>(<issue>5</issue>):<fpage>1396</fpage>–<lpage>1407</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1002/prot.22964" xlink:type="simple">10.1002/prot.22964</ext-link></comment></mixed-citation>
</ref>
<ref id="pcbi.1007177.ref020">
<label>20</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Schaper</surname> <given-names>S</given-names></name>, <name name-style="western"><surname>Louis</surname> <given-names>AA</given-names></name>. <article-title>The arrival of the frequent: how bias in genotype-phenotype maps can steer populations to local optima</article-title>. <source>PloS one</source>. <year>2014</year>;<volume>9</volume>(<issue>2</issue>):<fpage>e86635</fpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1371/journal.pone.0086635" xlink:type="simple">10.1371/journal.pone.0086635</ext-link></comment> <object-id pub-id-type="pmid">24505262</object-id></mixed-citation>
</ref>
<ref id="pcbi.1007177.ref021">
<label>21</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Greenbury</surname> <given-names>SF</given-names></name>, <name name-style="western"><surname>Johnston</surname> <given-names>IG</given-names></name>, <name name-style="western"><surname>Louis</surname> <given-names>AA</given-names></name>, <name name-style="western"><surname>Ahnert</surname> <given-names>SE</given-names></name>. <article-title>A tractable genotype–phenotype map modelling the self-assembly of protein quaternary structure</article-title>. <source>Journal of The Royal Society Interface</source>. <year>2014</year>;<volume>11</volume>(<issue>95</issue>):<fpage>20140249</fpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1098/rsif.2014.0249" xlink:type="simple">10.1098/rsif.2014.0249</ext-link></comment></mixed-citation>
</ref>
<ref id="pcbi.1007177.ref022">
<label>22</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Lynch</surname> <given-names>M</given-names></name>, <name name-style="western"><surname>Hagner</surname> <given-names>K</given-names></name>. <article-title>Evolutionary meandering of intermolecular interactions along the drift barrier</article-title>. <source>Proceedings of the National Academy of Sciences</source>. <year>2015</year>;<volume>112</volume>(<issue>1</issue>):<fpage>E30</fpage>–<lpage>E38</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1073/pnas.1421641112" xlink:type="simple">10.1073/pnas.1421641112</ext-link></comment></mixed-citation>
</ref>
<ref id="pcbi.1007177.ref023">
<label>23</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Manrubia</surname> <given-names>S</given-names></name>, <name name-style="western"><surname>Cuesta</surname> <given-names>JA</given-names></name>. <article-title>Evolution on neutral networks accelerates the ticking rate of the molecular clock</article-title>. <source>Journal of The Royal Society Interface</source>. <year>2015</year>;<volume>12</volume>(<issue>102</issue>):<fpage>20141010</fpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1098/rsif.2014.1010" xlink:type="simple">10.1098/rsif.2014.1010</ext-link></comment></mixed-citation>
</ref>
<ref id="pcbi.1007177.ref024">
<label>24</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Greenbury</surname> <given-names>SF</given-names></name>, <name name-style="western"><surname>Schaper</surname> <given-names>S</given-names></name>, <name name-style="western"><surname>Ahnert</surname> <given-names>SE</given-names></name>, <name name-style="western"><surname>Louis</surname> <given-names>AA</given-names></name>. <article-title>Genetic correlations greatly increase mutational robustness and can both reduce and enhance evolvability</article-title>. <source>PLoS Comput Biol</source>. <year>2016</year>;<volume>12</volume>(<issue>3</issue>):<fpage>e1004773</fpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1371/journal.pcbi.1004773" xlink:type="simple">10.1371/journal.pcbi.1004773</ext-link></comment> <object-id pub-id-type="pmid">26937652</object-id></mixed-citation>
</ref>
<ref id="pcbi.1007177.ref025">
<label>25</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Goldstein</surname> <given-names>RA</given-names></name>, <name name-style="western"><surname>Pollock</surname> <given-names>DD</given-names></name>. <article-title>Sequence entropy of folding and the absolute rate of amino acid substitutions</article-title>. <source>Nature ecology &amp; evolution</source>. <year>2017</year>;<volume>1</volume>(<issue>12</issue>):<fpage>1923</fpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1038/s41559-017-0338-9" xlink:type="simple">10.1038/s41559-017-0338-9</ext-link></comment></mixed-citation>
</ref>
<ref id="pcbi.1007177.ref026">
<label>26</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Khatri</surname> <given-names>BS</given-names></name>, <name name-style="western"><surname>Goldstein</surname> <given-names>RA</given-names></name>. <article-title>A coarse-grained biophysical model of sequence evolution and the population size dependence of the speciation rate</article-title>. <source>Journal of theoretical biology</source>. <year>2015</year>;<volume>378</volume>:<fpage>56</fpage>–<lpage>64</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1016/j.jtbi.2015.04.027" xlink:type="simple">10.1016/j.jtbi.2015.04.027</ext-link></comment> <object-id pub-id-type="pmid">25936759</object-id></mixed-citation>
</ref>
<ref id="pcbi.1007177.ref027">
<label>27</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Khatri</surname> <given-names>BS</given-names></name>, <name name-style="western"><surname>Goldstein</surname> <given-names>RA</given-names></name>. <article-title>Simple biophysical model predicts faster accumulation of hybrid incompatibilities in small populations under stabilizing selection</article-title>. <source>Genetics</source>. <year>2015</year>;<volume>201</volume>(<issue>4</issue>):<fpage>1525</fpage>–<lpage>1537</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1534/genetics.115.181685" xlink:type="simple">10.1534/genetics.115.181685</ext-link></comment> <object-id pub-id-type="pmid">26434721</object-id></mixed-citation>
</ref>
<ref id="pcbi.1007177.ref028">
<label>28</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Shea</surname> <given-names>MA</given-names></name>, <name name-style="western"><surname>Ackers</surname> <given-names>GK</given-names></name>. <article-title>The OR control system of bacteriophage lambda. A physical-chemical model for gene regulation</article-title>. <source>J Mol Biol</source>. <year>1985</year>;<volume>181</volume>(<issue>2</issue>):<fpage>211</fpage>–<lpage>230</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1016/0022-2836(85)90086-5" xlink:type="simple">10.1016/0022-2836(85)90086-5</ext-link></comment> <object-id pub-id-type="pmid">3157005</object-id></mixed-citation>
</ref>
<ref id="pcbi.1007177.ref029">
<label>29</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Eyre-Walker</surname> <given-names>A</given-names></name>, <name name-style="western"><surname>Woolfit</surname> <given-names>M</given-names></name>, <name name-style="western"><surname>Phelps</surname> <given-names>T</given-names></name>. <article-title>The distribution of fitness effects of new deleterious amino acid mutations in humans</article-title>. <source>Genetics</source>. <year>2006</year>;<volume>173</volume>(<issue>2</issue>):<fpage>891</fpage>–<lpage>900</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1534/genetics.106.057570" xlink:type="simple">10.1534/genetics.106.057570</ext-link></comment> <object-id pub-id-type="pmid">16547091</object-id></mixed-citation>
</ref>
<ref id="pcbi.1007177.ref030">
<label>30</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Huber</surname> <given-names>CD</given-names></name>, <name name-style="western"><surname>Kim</surname> <given-names>BY</given-names></name>, <name name-style="western"><surname>Marsden</surname> <given-names>CD</given-names></name>, <name name-style="western"><surname>Lohmueller</surname> <given-names>KE</given-names></name>. <article-title>Determining the factors driving selective effects of new nonsynonymous mutations</article-title>. <source>Proceedings of the National Academy of Sciences</source>. <year>2017</year>;<volume>114</volume>(<issue>17</issue>):<fpage>4465</fpage>–<lpage>4470</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1073/pnas.1619508114" xlink:type="simple">10.1073/pnas.1619508114</ext-link></comment></mixed-citation>
</ref>
<ref id="pcbi.1007177.ref031">
<label>31</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Orr</surname> <given-names>HA</given-names></name>, <name name-style="western"><surname>Turelli</surname> <given-names>M</given-names></name>. <article-title>The evolution of postzygotic isolation: accumulating Dobzhansky-Muller incompatibilities</article-title>. <source>Evolution</source>. <year>2001</year>;<volume>55</volume>(<issue>6</issue>):<fpage>1085</fpage>–<lpage>1094</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1111/j.0014-3820.2001.tb00628.x" xlink:type="simple">10.1111/j.0014-3820.2001.tb00628.x</ext-link></comment> <object-id pub-id-type="pmid">11475044</object-id></mixed-citation>
</ref>
<ref id="pcbi.1007177.ref032">
<label>32</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Bertin</surname> <given-names>E</given-names></name>, <name name-style="western"><surname>Bouchaud</surname> <given-names>JP</given-names></name>. <article-title>Subdiffusion and localization in the one-dimensional trap model</article-title>. <source>Physical Review E</source>. <year>2003</year>;<volume>67</volume>(<issue>2</issue>):<fpage>026128</fpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1103/PhysRevE.67.026128" xlink:type="simple">10.1103/PhysRevE.67.026128</ext-link></comment></mixed-citation>
</ref>
<ref id="pcbi.1007177.ref033">
<label>33</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>King</surname> <given-names>MC</given-names></name>, <name name-style="western"><surname>Wilson</surname> <given-names>AC</given-names></name>. <article-title>Evolution at two levels in humans and chimpanzees</article-title>. <source>Science</source>. <year>1975</year>;<volume>188</volume>(<issue>4184</issue>):<fpage>107</fpage>–<lpage>116</lpage>.</mixed-citation>
</ref>
<ref id="pcbi.1007177.ref034">
<label>34</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Wolf</surname> <given-names>JB</given-names></name>, <name name-style="western"><surname>Lindell</surname> <given-names>J</given-names></name>, <name name-style="western"><surname>Backström</surname> <given-names>N</given-names></name>. <source>Speciation genetics: current status and evolving approaches</source>; <year>2010</year>. </mixed-citation>
</ref>
<ref id="pcbi.1007177.ref035">
<label>35</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Wray</surname> <given-names>GA</given-names></name>. <article-title>The evolutionary significance of cis-regulatory mutations</article-title>. <source>Nature Reviews Genetics</source>. <year>2007</year>;<volume>8</volume>(<issue>3</issue>):<fpage>206</fpage>–<lpage>216</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1038/nrg2063" xlink:type="simple">10.1038/nrg2063</ext-link></comment> <object-id pub-id-type="pmid">17304246</object-id></mixed-citation>
</ref>
<ref id="pcbi.1007177.ref036">
<label>36</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Abzhanov</surname> <given-names>A</given-names></name>, <name name-style="western"><surname>Kuo</surname> <given-names>WP</given-names></name>, <name name-style="western"><surname>Hartmann</surname> <given-names>C</given-names></name>, <name name-style="western"><surname>Grant</surname> <given-names>BR</given-names></name>, <name name-style="western"><surname>Grant</surname> <given-names>PR</given-names></name>, <name name-style="western"><surname>Tabin</surname> <given-names>CJ</given-names></name>. <article-title>The calmodulin pathway and evolution of elongated beak morphology in Darwin’s finches</article-title>. <source>Nature</source>. <year>2006</year>;<volume>442</volume>(<issue>7102</issue>):<fpage>563</fpage>–<lpage>567</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1038/nature04843" xlink:type="simple">10.1038/nature04843</ext-link></comment></mixed-citation>
</ref>
<ref id="pcbi.1007177.ref037">
<label>37</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Wittkopp</surname> <given-names>PJ</given-names></name>, <name name-style="western"><surname>Haerum</surname> <given-names>BK</given-names></name>, <name name-style="western"><surname>Clark</surname> <given-names>AG</given-names></name>. <article-title>Regulatory changes underlying expression differences within and between Drosophila species</article-title>. <source>Nature genetics</source>. <year>2008</year>;<volume>40</volume>(<issue>3</issue>):<fpage>346</fpage>–<lpage>350</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1038/ng.77" xlink:type="simple">10.1038/ng.77</ext-link></comment> <object-id pub-id-type="pmid">18278046</object-id></mixed-citation>
</ref>
<ref id="pcbi.1007177.ref038">
<label>38</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Ting</surname> <given-names>CT</given-names></name>, <name name-style="western"><surname>Tsaur</surname> <given-names>SC</given-names></name>, <name name-style="western"><surname>Wu</surname> <given-names>ML</given-names></name>, <name name-style="western"><surname>Wu</surname> <given-names>CI</given-names></name>. <article-title>A rapidly evolving homeobox at the site of a hybrid sterility gene</article-title>. <source>Science</source>. <year>1998</year>;<volume>282</volume>(<issue>5393</issue>):<fpage>1501</fpage>–<lpage>1504</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1126/science.282.5393.1501" xlink:type="simple">10.1126/science.282.5393.1501</ext-link></comment> <object-id pub-id-type="pmid">9822383</object-id></mixed-citation>
</ref>
<ref id="pcbi.1007177.ref039">
<label>39</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Brideau</surname> <given-names>NJ</given-names></name>, <name name-style="western"><surname>Flores</surname> <given-names>HA</given-names></name>, <name name-style="western"><surname>Wang</surname> <given-names>J</given-names></name>, <name name-style="western"><surname>Maheshwari</surname> <given-names>S</given-names></name>, <name name-style="western"><surname>Wang</surname> <given-names>X</given-names></name>, <name name-style="western"><surname>Barbash</surname> <given-names>DA</given-names></name>. <article-title>Two Dobzhansky-Muller genes interact to cause hybrid lethality in Drosophila</article-title>. <source>science</source>. <year>2006</year>;<volume>314</volume>(<issue>5803</issue>):<fpage>1292</fpage>–<lpage>1295</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1126/science.1133953" xlink:type="simple">10.1126/science.1133953</ext-link></comment> <object-id pub-id-type="pmid">17124320</object-id></mixed-citation>
</ref>
<ref id="pcbi.1007177.ref040">
<label>40</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Bayes</surname> <given-names>JJ</given-names></name>, <name name-style="western"><surname>Malik</surname> <given-names>HS</given-names></name>. <article-title>Altered heterochromatin binding by a hybrid sterility protein in Drosophila sibling species</article-title>. <source>Science</source>. <year>2009</year>;<volume>326</volume>(<issue>5959</issue>):<fpage>1538</fpage>–<lpage>1541</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1126/science.1181756" xlink:type="simple">10.1126/science.1181756</ext-link></comment> <object-id pub-id-type="pmid">19933102</object-id></mixed-citation>
</ref>
<ref id="pcbi.1007177.ref041">
<label>41</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Liénard</surname> <given-names>MA</given-names></name>, <name name-style="western"><surname>Araripe</surname> <given-names>LO</given-names></name>, <name name-style="western"><surname>Hartl</surname> <given-names>DL</given-names></name>. <article-title>Neighboring genes for DNA-binding proteins rescue male sterility in Drosophila hybrids</article-title>. <source>Proceedings of the National Academy of Sciences</source>. <year>2016</year>;<volume>113</volume>(<issue>29</issue>):<fpage>E4200</fpage>–<lpage>E4207</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1073/pnas.1608337113" xlink:type="simple">10.1073/pnas.1608337113</ext-link></comment></mixed-citation>
</ref>
<ref id="pcbi.1007177.ref042">
<label>42</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Mack</surname> <given-names>KL</given-names></name>, <name name-style="western"><surname>Nachman</surname> <given-names>MW</given-names></name>. <article-title>Gene Regulation and Speciation</article-title>. <source>Trends in Genetics</source>. <year>2016</year>;. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1016/j.tig.2016.11.003" xlink:type="simple">10.1016/j.tig.2016.11.003</ext-link></comment> <object-id pub-id-type="pmid">27914620</object-id></mixed-citation>
</ref>
<ref id="pcbi.1007177.ref043">
<label>43</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Gavin-Smyth</surname> <given-names>J</given-names></name>, <name name-style="western"><surname>Matute</surname> <given-names>DR</given-names></name>. <article-title>Embryonic lethality leads to hybrid male inviability in hybrids between Drosophila melanogaster and D. santomea</article-title>. <source>Ecology and evolution</source>. <year>2013</year>;<volume>3</volume>(<issue>6</issue>):<fpage>1580</fpage>–<lpage>1589</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1002/ece3.573" xlink:type="simple">10.1002/ece3.573</ext-link></comment> <object-id pub-id-type="pmid">23789069</object-id></mixed-citation>
</ref>
<ref id="pcbi.1007177.ref044">
<label>44</label>
<mixed-citation publication-type="book" xlink:type="simple">
<name name-style="western"><surname>Fisher</surname> <given-names>RA</given-names></name>. <source>The Genetical Theory of Natural Selection</source>. <publisher-loc>Oxford</publisher-loc>: <publisher-name>Oxford Univ. Press</publisher-name>; <year>1930</year>.</mixed-citation>
</ref>
<ref id="pcbi.1007177.ref045">
<label>45</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Wright</surname> <given-names>S</given-names></name>. <article-title>Evolution in Mendelian Populations</article-title>. <source>Genetics</source>. <year>1931</year>;<volume>16</volume>(<issue>2</issue>):<fpage>97</fpage>–<lpage>159</lpage>. <object-id pub-id-type="pmid">17246615</object-id></mixed-citation>
</ref>
<ref id="pcbi.1007177.ref046">
<label>46</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Kimura</surname> <given-names>M</given-names></name>. <article-title>Diffusion models in population genetics</article-title>. <source>Journal of Applied Probability</source>. <year>1964</year>;<volume>1</volume>(<issue>2</issue>):<fpage>177</fpage>–<lpage>232</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.2307/3211856" xlink:type="simple">10.2307/3211856</ext-link></comment></mixed-citation>
</ref>
<ref id="pcbi.1007177.ref047">
<label>47</label>
<mixed-citation publication-type="book" xlink:type="simple">
<name name-style="western"><surname>Crow</surname> <given-names>JF</given-names></name>, <name name-style="western"><surname>Kimura</surname> <given-names>M</given-names></name>. <chapter-title>An Introduction to Population Genetics Theory</chapter-title>. <publisher-name>Harper &amp; Row</publisher-name>; <year>1970</year>.</mixed-citation>
</ref>
<ref id="pcbi.1007177.ref048">
<label>48</label>
<mixed-citation publication-type="book" xlink:type="simple">
<name name-style="western"><surname>Ewens</surname> <given-names>WJ</given-names></name>. <chapter-title>Mathematical Population Genetics</chapter-title>: 1. <source>A Theoretical Introduction</source>. <publisher-name>Springer</publisher-name>; <year>2010</year>.</mixed-citation>
</ref>
<ref id="pcbi.1007177.ref049">
<label>49</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Mustonen</surname> <given-names>V</given-names></name>, <name name-style="western"><surname>Lässig</surname> <given-names>M</given-names></name>. <article-title>Evolutionary population genetics of promoters: predicting binding sites and functional phylogenies</article-title>. <source>Proceedings of the National Academy of Sciences of the United States of America</source>. <year>2005</year>;<volume>102</volume>(<issue>44</issue>):<fpage>15936</fpage>–<lpage>15941</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1073/pnas.0505537102" xlink:type="simple">10.1073/pnas.0505537102</ext-link></comment> <object-id pub-id-type="pmid">16236723</object-id></mixed-citation>
</ref>
<ref id="pcbi.1007177.ref050">
<label>50</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Haldane</surname> <given-names>A</given-names></name>, <name name-style="western"><surname>Manhart</surname> <given-names>M</given-names></name>, <name name-style="western"><surname>Morozov</surname> <given-names>AV</given-names></name>. <article-title>Biophysical fitness landscapes for transcription factor binding sites</article-title>. <source>PLoS computational biology</source>. <year>2014</year>;<volume>10</volume>(<issue>7</issue>):<fpage>e1003683</fpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1371/journal.pcbi.1003683" xlink:type="simple">10.1371/journal.pcbi.1003683</ext-link></comment> <object-id pub-id-type="pmid">25010228</object-id></mixed-citation>
</ref>
<ref id="pcbi.1007177.ref051">
<label>51</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>von Hippel</surname> <given-names>PH</given-names></name>, <name name-style="western"><surname>Berg</surname> <given-names>OG</given-names></name>. <article-title>On the specificity of DNA-protein interactions</article-title>. <source>Proc Natl Acad Sci U S A</source>. <year>1986</year>;<volume>83</volume>(<issue>6</issue>):<fpage>1608</fpage>–<lpage>1612</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1073/pnas.83.6.1608" xlink:type="simple">10.1073/pnas.83.6.1608</ext-link></comment> <object-id pub-id-type="pmid">3456604</object-id></mixed-citation>
</ref>
<ref id="pcbi.1007177.ref052">
<label>52</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Gerland</surname> <given-names>U</given-names></name>, <name name-style="western"><surname>Moroz</surname> <given-names>JD</given-names></name>, <name name-style="western"><surname>Hwa</surname> <given-names>T</given-names></name>. <article-title>Physical constraints and functional characteristics of transcription factor-DNA interaction</article-title>. <source>Proc Natl Acad Sci U S A</source>. <year>2002</year>;<volume>99</volume>(<issue>19</issue>):<fpage>12015</fpage>–<lpage>12020</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1073/pnas.192693599" xlink:type="simple">10.1073/pnas.192693599</ext-link></comment> <object-id pub-id-type="pmid">12218191</object-id></mixed-citation>
</ref>
<ref id="pcbi.1007177.ref053">
<label>53</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Iwasa</surname> <given-names>Y</given-names></name>. <article-title>Free fitness that always increases in evolution</article-title>. <source>Journal of Theoretical Biology</source>. <year>1988</year>;<volume>135</volume>(<issue>3</issue>):<fpage>265</fpage>—<lpage>281</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1016/S0022-5193(88)80243-1" xlink:type="simple">10.1016/S0022-5193(88)80243-1</ext-link></comment> <object-id pub-id-type="pmid">3256719</object-id></mixed-citation>
</ref>
<ref id="pcbi.1007177.ref054">
<label>54</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Tulchinsky</surname> <given-names>AY</given-names></name>, <name name-style="western"><surname>Johnson</surname> <given-names>NA</given-names></name>, <name name-style="western"><surname>Watt</surname> <given-names>WB</given-names></name>, <name name-style="western"><surname>Porter</surname> <given-names>AH</given-names></name>. <article-title>Hybrid incompatibility arises in a sequence-based bioenergetic model of transcription factor binding</article-title>. <source>Genetics</source>. <year>2014</year>;<volume>198</volume>(<issue>3</issue>):<fpage>1155</fpage>–<lpage>1166</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1534/genetics.114.168112" xlink:type="simple">10.1534/genetics.114.168112</ext-link></comment> <object-id pub-id-type="pmid">25173845</object-id></mixed-citation>
</ref>
<ref id="pcbi.1007177.ref055">
<label>55</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Coyne</surname> <given-names>JA</given-names></name>, <name name-style="western"><surname>Orr</surname> <given-names>HA</given-names></name>. <article-title>The evolutionary genetics of speciation</article-title>. <source>Philos Trans R Soc Lond B Biol Sci</source>. <year>1998</year>;<volume>353</volume>(<issue>1366</issue>):<fpage>287</fpage>–<lpage>305</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1098/rstb.1998.0210" xlink:type="simple">10.1098/rstb.1998.0210</ext-link></comment> <object-id pub-id-type="pmid">9533126</object-id></mixed-citation>
</ref>
<ref id="pcbi.1007177.ref056">
<label>56</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Barraclough</surname> <given-names>TG</given-names></name>, <name name-style="western"><surname>Nee</surname> <given-names>S</given-names></name>. <article-title>Phylogenetics and speciation</article-title>. <source>Trends in Ecology &amp; Evolution</source>. <year>2001</year>;<volume>16</volume>(<issue>7</issue>):<fpage>391</fpage>–<lpage>399</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1016/S0169-5347(01)02161-9" xlink:type="simple">10.1016/S0169-5347(01)02161-9</ext-link></comment></mixed-citation>
</ref>
<ref id="pcbi.1007177.ref057">
<label>57</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Nee</surname> <given-names>S</given-names></name>. <article-title>Inferring speciation rates from phylogenies</article-title>. <source>Evolution</source>. <year>2001</year>;<volume>55</volume>(<issue>4</issue>):<fpage>661</fpage>–<lpage>668</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1554/0014-3820(2001)055%5B0661:ISRFP%5D2.0.CO;2" xlink:type="simple">10.1554/0014-3820(2001)055%5B0661:ISRFP%5D2.0.CO;2</ext-link></comment> <object-id pub-id-type="pmid">11392383</object-id></mixed-citation>
</ref>
<ref id="pcbi.1007177.ref058">
<label>58</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Fitzpatrick</surname> <given-names>BM</given-names></name>. <article-title>Rates of evolution of hybrid inviability in birds and mammals</article-title>. <source>Evolution</source>. <year>2004</year>;<volume>58</volume>(<issue>8</issue>):<fpage>1865</fpage>–<lpage>1870</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1554/04-190" xlink:type="simple">10.1554/04-190</ext-link></comment> <object-id pub-id-type="pmid">15446440</object-id></mixed-citation>
</ref>
<ref id="pcbi.1007177.ref059">
<label>59</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Stelkens</surname> <given-names>RB</given-names></name>, <name name-style="western"><surname>Young</surname> <given-names>KA</given-names></name>, <name name-style="western"><surname>Seehausen</surname> <given-names>O</given-names></name>. <article-title>The accumulation of reproductive incompatibilities in African cichlid fish</article-title>. <source>Evolution</source>. <year>2010</year>;<volume>64</volume>(<issue>3</issue>):<fpage>617</fpage>–<lpage>633</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1111/j.1558-5646.2009.00849.x" xlink:type="simple">10.1111/j.1558-5646.2009.00849.x</ext-link></comment> <object-id pub-id-type="pmid">19796149</object-id></mixed-citation>
</ref>
<ref id="pcbi.1007177.ref060">
<label>60</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Cooper</surname> <given-names>A</given-names></name>, <name name-style="western"><surname>Penny</surname> <given-names>D</given-names></name>. <article-title>Mass survival of birds across the Cretaceous-Tertiary boundary: molecular evidence</article-title>. <source>Science</source>. <year>1997</year>;<volume>275</volume>(<issue>5303</issue>):<fpage>1109</fpage>–<lpage>1113</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1126/science.275.5303.1109" xlink:type="simple">10.1126/science.275.5303.1109</ext-link></comment> <object-id pub-id-type="pmid">9027308</object-id></mixed-citation>
</ref>
<ref id="pcbi.1007177.ref061">
<label>61</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Van Oppen</surname> <given-names>MH</given-names></name>, <name name-style="western"><surname>Turner</surname> <given-names>G</given-names></name>, <name name-style="western"><surname>Rico</surname> <given-names>C</given-names></name>, <name name-style="western"><surname>Deutsch</surname> <given-names>J</given-names></name>, <name name-style="western"><surname>Ibrahim</surname> <given-names>K</given-names></name>, <name name-style="western"><surname>Robinson</surname> <given-names>R</given-names></name>, <etal>et al</etal>. <article-title>Unusually fine–scale genetic structuring found in rapidly speciating Malawi cichlid fishes</article-title>. <source>Proceedings of the Royal Society of London B: Biological Sciences</source>. <year>1997</year>;<volume>264</volume>(<issue>1389</issue>):<fpage>1803</fpage>–<lpage>1812</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1098/rspb.1997.0248" xlink:type="simple">10.1098/rspb.1997.0248</ext-link></comment></mixed-citation>
</ref>
<ref id="pcbi.1007177.ref062">
<label>62</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Fiumera</surname> <given-names>A</given-names></name>, <name name-style="western"><surname>Parker</surname> <given-names>P</given-names></name>, <name name-style="western"><surname>Fuerst</surname> <given-names>P</given-names></name>. <article-title>Effective population size and maintenance of genetic diversity in captive-bred populations of a lake Victoria cichlid</article-title>. <source>Conservation Biology</source>. <year>2000</year>;<volume>14</volume>(<issue>3</issue>):<fpage>886</fpage>–<lpage>892</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1046/j.1523-1739.2000.97337.x" xlink:type="simple">10.1046/j.1523-1739.2000.97337.x</ext-link></comment></mixed-citation>
</ref>
<ref id="pcbi.1007177.ref063">
<label>63</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Jorde</surname> <given-names>LB</given-names></name>, <name name-style="western"><surname>Bamshad</surname> <given-names>M</given-names></name>, <name name-style="western"><surname>Rogers</surname> <given-names>AR</given-names></name>. <article-title>Using mitochondrial and nuclear DNA markers to reconstruct human evolution</article-title>. <source>Bioessays</source>. <year>1998</year>;<volume>20</volume>(<issue>2</issue>):<fpage>126</fpage>–<lpage>136</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1002/(SICI)1521-1878(199802)20:2&lt;126::AID-BIES5&gt;3.0.CO;2-R" xlink:type="simple">10.1002/(SICI)1521-1878(199802)20:2&lt;126::AID-BIES5&gt;3.0.CO;2-R</ext-link></comment> <object-id pub-id-type="pmid">9631658</object-id></mixed-citation>
</ref>
<ref id="pcbi.1007177.ref064">
<label>64</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Gattepaille</surname> <given-names>L</given-names></name>, <name name-style="western"><surname>Günther</surname> <given-names>T</given-names></name>, <name name-style="western"><surname>Jakobsson</surname> <given-names>M</given-names></name>. <article-title>Inferring past effective population size from distributions of coalescent times</article-title>. <source>Genetics</source>. <year>2016</year>;<volume>204</volume>(<issue>3</issue>):<fpage>1191</fpage>–<lpage>1206</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1534/genetics.115.185058" xlink:type="simple">10.1534/genetics.115.185058</ext-link></comment> <object-id pub-id-type="pmid">27638421</object-id></mixed-citation>
</ref>
<ref id="pcbi.1007177.ref065">
<label>65</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Sawai</surname> <given-names>H</given-names></name>, <name name-style="western"><surname>Kim</surname> <given-names>HL</given-names></name>, <name name-style="western"><surname>Kuno</surname> <given-names>K</given-names></name>, <name name-style="western"><surname>Suzuki</surname> <given-names>S</given-names></name>, <name name-style="western"><surname>Gotoh</surname> <given-names>H</given-names></name>, <name name-style="western"><surname>Takada</surname> <given-names>M</given-names></name>, <etal>et al</etal>. <article-title>The origin and genetic variation of domestic chickens with special reference to junglefowls Gallus g. gallus and G. varius</article-title>. <source>PloS one</source>. <year>2010</year>;<volume>5</volume>(<issue>5</issue>):<fpage>e10639</fpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1371/journal.pone.0010639" xlink:type="simple">10.1371/journal.pone.0010639</ext-link></comment> <object-id pub-id-type="pmid">20502703</object-id></mixed-citation>
</ref>
<ref id="pcbi.1007177.ref066">
<label>66</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Lande</surname> <given-names>R</given-names></name>. <article-title>Effective deme sizes during long-term evolution estimated from rates of chromosomal rearrangement</article-title>. <source>Evolution</source>. <year>1979</year>;<volume>33</volume>(<issue>1Part1</issue>):<fpage>234</fpage>–<lpage>251</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1111/j.1558-5646.1979.tb04678.x" xlink:type="simple">10.1111/j.1558-5646.1979.tb04678.x</ext-link></comment> <object-id pub-id-type="pmid">28568063</object-id></mixed-citation>
</ref>
<ref id="pcbi.1007177.ref067">
<label>67</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Lande</surname> <given-names>R</given-names></name>. <article-title>Expected time for random genetic drift of a population between stable phenotypic states</article-title>. <source>Proc Natl Acad Sci U S A</source>. <year>1985</year>;<volume>82</volume>(<issue>22</issue>):<fpage>7641</fpage>–<lpage>7645</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1073/pnas.82.22.7641" xlink:type="simple">10.1073/pnas.82.22.7641</ext-link></comment> <object-id pub-id-type="pmid">3865184</object-id></mixed-citation>
</ref>
<ref id="pcbi.1007177.ref068">
<label>68</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Barton</surname> <given-names>NH</given-names></name>, <name name-style="western"><surname>Charlesworth</surname> <given-names>B</given-names></name>. <article-title>Genetic Revolutions, Founder Effects, and Speciation</article-title>. <source>Annual Review of Ecology and Systematics</source>. <year>1984</year>;<volume>15</volume>(<issue>1</issue>):<fpage>133</fpage>–<lpage>164</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1146/annurev.es.15.110184.001025" xlink:type="simple">10.1146/annurev.es.15.110184.001025</ext-link></comment></mixed-citation>
</ref>
<ref id="pcbi.1007177.ref069">
<label>69</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Barton</surname> <given-names>N</given-names></name>, <name name-style="western"><surname>Rouhani</surname> <given-names>S</given-names></name>. <article-title>The frequency of shifts between alternative equilibria</article-title>. <source>Journal of theoretical biology</source>. <year>1987</year>;<volume>125</volume>(<issue>4</issue>):<fpage>397</fpage>–<lpage>418</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1016/S0022-5193(87)80210-2" xlink:type="simple">10.1016/S0022-5193(87)80210-2</ext-link></comment> <object-id pub-id-type="pmid">3657219</object-id></mixed-citation>
</ref>
<ref id="pcbi.1007177.ref070">
<label>70</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Moyle</surname> <given-names>LC</given-names></name>, <name name-style="western"><surname>Nakazato</surname> <given-names>T</given-names></name>. <article-title>Hybrid incompatibility “snowballs” between Solanum species</article-title>. <source>Science</source>. <year>2010</year>;<volume>329</volume>(<issue>5998</issue>):<fpage>1521</fpage>–<lpage>1523</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1126/science.1193063" xlink:type="simple">10.1126/science.1193063</ext-link></comment></mixed-citation>
</ref>
<ref id="pcbi.1007177.ref071">
<label>71</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Schumer</surname> <given-names>M</given-names></name>, <name name-style="western"><surname>Cui</surname> <given-names>R</given-names></name>, <name name-style="western"><surname>Powell</surname> <given-names>DL</given-names></name>, <name name-style="western"><surname>Dresner</surname> <given-names>R</given-names></name>, <name name-style="western"><surname>Rosenthal</surname> <given-names>GG</given-names></name>, <name name-style="western"><surname>Andolfatto</surname> <given-names>P</given-names></name>. <article-title>High-resolution mapping reveals hundreds of genetic incompatibilities in hybridizing fish species</article-title>. <source>Elife</source>. <year>2014</year>;<volume>3</volume>:<fpage>e02535</fpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.7554/eLife.02535" xlink:type="simple">10.7554/eLife.02535</ext-link></comment></mixed-citation>
</ref>
<ref id="pcbi.1007177.ref072">
<label>72</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Weinreich</surname> <given-names>DM</given-names></name>, <name name-style="western"><surname>Lan</surname> <given-names>Y</given-names></name>, <name name-style="western"><surname>Wylie</surname> <given-names>CS</given-names></name>, <name name-style="western"><surname>Heckendorn</surname> <given-names>RB</given-names></name>. <source>Should evolutionary geneticists worry about higher-order epistasis? Current opinion in genetics &amp; development</source>. <year>2013</year>;<volume>23</volume>(<issue>6</issue>):<fpage>700</fpage>–<lpage>707</lpage>.</mixed-citation>
</ref>
<ref id="pcbi.1007177.ref073">
<label>73</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Kalirad</surname> <given-names>A</given-names></name>, <name name-style="western"><surname>Azevedo</surname> <given-names>RB</given-names></name>. <article-title>Spiraling complexity: a test of the snowball effect in a computational model of RNA folding</article-title>. <source>Genetics</source>. <year>2017</year>;<volume>206</volume>(<issue>1</issue>):<fpage>377</fpage>–<lpage>388</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1534/genetics.116.196030" xlink:type="simple">10.1534/genetics.116.196030</ext-link></comment> <object-id pub-id-type="pmid">28007889</object-id></mixed-citation>
</ref>
<ref id="pcbi.1007177.ref074">
<label>74</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Bintu</surname> <given-names>L</given-names></name>, <name name-style="western"><surname>Buchler</surname> <given-names>NE</given-names></name>, <name name-style="western"><surname>Garcia</surname> <given-names>HG</given-names></name>, <name name-style="western"><surname>Gerland</surname> <given-names>U</given-names></name>, <name name-style="western"><surname>Hwa</surname> <given-names>T</given-names></name>, <name name-style="western"><surname>Kondev</surname> <given-names>J</given-names></name>, <etal>et al</etal>. <article-title>Transcriptional regulation by the numbers: models</article-title>. <source>Curr Opin Genet Dev</source>. <year>2005</year>;<volume>15</volume>(<issue>2</issue>):<fpage>116</fpage>–<lpage>124</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1016/j.gde.2005.02.007" xlink:type="simple">10.1016/j.gde.2005.02.007</ext-link></comment> <object-id pub-id-type="pmid">15797194</object-id></mixed-citation>
</ref>
<ref id="pcbi.1007177.ref075">
<label>75</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Spitz</surname> <given-names>F</given-names></name>, <name name-style="western"><surname>Furlong</surname> <given-names>EE</given-names></name>. <article-title>Transcription factors: from enhancer binding to developmental control</article-title>. <source>Nature Reviews Genetics</source>. <year>2012</year>;<volume>13</volume>(<issue>9</issue>):<fpage>613</fpage>–<lpage>626</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1038/nrg3207" xlink:type="simple">10.1038/nrg3207</ext-link></comment> <object-id pub-id-type="pmid">22868264</object-id></mixed-citation>
</ref>
<ref id="pcbi.1007177.ref076">
<label>76</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Levo</surname> <given-names>M</given-names></name>, <name name-style="western"><surname>Segal</surname> <given-names>E</given-names></name>. <article-title>In pursuit of design principles of regulatory sequences</article-title>. <source>Nature Reviews Genetics</source>. <year>2014</year>;<volume>15</volume>(<issue>7</issue>):<fpage>453</fpage>–<lpage>468</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1038/nrg3684" xlink:type="simple">10.1038/nrg3684</ext-link></comment> <object-id pub-id-type="pmid">24913666</object-id></mixed-citation>
</ref>
<ref id="pcbi.1007177.ref077">
<label>77</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Taylor</surname> <given-names>MB</given-names></name>, <name name-style="western"><surname>Ehrenreich</surname> <given-names>IM</given-names></name>. <article-title>Higher-order genetic interactions and their contribution to complex traits</article-title>. <source>Trends in genetics</source>. <year>2015</year>;<volume>31</volume>(<issue>1</issue>):<fpage>34</fpage>–<lpage>40</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1016/j.tig.2014.09.001" xlink:type="simple">10.1016/j.tig.2014.09.001</ext-link></comment> <object-id pub-id-type="pmid">25284288</object-id></mixed-citation>
</ref>
<ref id="pcbi.1007177.ref078">
<label>78</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Orr</surname> <given-names>HA</given-names></name>, <name name-style="western"><surname>Irving</surname> <given-names>S</given-names></name>. <article-title>Complex epistasis and the genetic basis of hybrid sterility in the Drosophila pseudoobscura Bogota-USA hybridization</article-title>. <source>Genetics</source>. <year>2001</year>;<volume>158</volume>(<issue>3</issue>):<fpage>1089</fpage>–<lpage>1100</lpage>. <object-id pub-id-type="pmid">11454758</object-id></mixed-citation>
</ref>
<ref id="pcbi.1007177.ref079">
<label>79</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Cabot</surname> <given-names>EL</given-names></name>, <name name-style="western"><surname>Davis</surname> <given-names>AW</given-names></name>, <name name-style="western"><surname>Johnson</surname> <given-names>NA</given-names></name>, <name name-style="western"><surname>Wu</surname> <given-names>CI</given-names></name>. <article-title>Genetics of reproductive isolation in the Drosophila simulans clade: complex epistasis underlying hybrid male sterility</article-title>. <source>Genetics</source>. <year>1994</year>;<volume>137</volume>(<issue>1</issue>):<fpage>175</fpage>–<lpage>189</lpage>. <object-id pub-id-type="pmid">8056308</object-id></mixed-citation>
</ref>
<ref id="pcbi.1007177.ref080">
<label>80</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Palopoli</surname> <given-names>MF</given-names></name>, <name name-style="western"><surname>Wu</surname> <given-names>CI</given-names></name>. <article-title>Genetics of hybrid male sterility between drosophila sibling species: a complex web of epistasis is revealed in interspecific studies</article-title>. <source>Genetics</source>. <year>1994</year>;<volume>138</volume>(<issue>2</issue>):<fpage>329</fpage>–<lpage>341</lpage>. <object-id pub-id-type="pmid">7828817</object-id></mixed-citation>
</ref>
<ref id="pcbi.1007177.ref081">
<label>81</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Fraïsse</surname> <given-names>C</given-names></name>, <name name-style="western"><surname>Elderfield</surname> <given-names>J</given-names></name>, <name name-style="western"><surname>Welch</surname> <given-names>J</given-names></name>. <article-title>The genetics of speciation: are complex incompatibilities easier to evolve?</article-title> <source>Journal of evolutionary biology</source>. <year>2014</year>;<volume>27</volume>(<issue>4</issue>):<fpage>688</fpage>–<lpage>699</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1111/jeb.12339" xlink:type="simple">10.1111/jeb.12339</ext-link></comment></mixed-citation>
</ref>
<ref id="pcbi.1007177.ref082">
<label>82</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Lässig</surname> <given-names>M</given-names></name>. <article-title>From biophysics to evolutionary genetics: statistical aspects of gene regulation</article-title>. <source>BMC Bioinformatics</source>. <year>2007</year>;<volume>8</volume> <issue>Suppl 6</issue>:<fpage>S7</fpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1186/1471-2105-8-S6-S7" xlink:type="simple">10.1186/1471-2105-8-S6-S7</ext-link></comment> <object-id pub-id-type="pmid">17903288</object-id></mixed-citation>
</ref>
<ref id="pcbi.1007177.ref083">
<label>83</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Buchler</surname> <given-names>NE</given-names></name>, <name name-style="western"><surname>Gerland</surname> <given-names>U</given-names></name>, <name name-style="western"><surname>Hwa</surname> <given-names>T</given-names></name>. <article-title>On schemes of combinatorial transcription logic</article-title>. <source>Proc Natl Acad Sci U S A</source>. <year>2003</year>;<volume>100</volume>(<issue>9</issue>):<fpage>5136</fpage>–<lpage>5141</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1073/pnas.0930314100" xlink:type="simple">10.1073/pnas.0930314100</ext-link></comment> <object-id pub-id-type="pmid">12702751</object-id></mixed-citation>
</ref>
<ref id="pcbi.1007177.ref084">
<label>84</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Gillespie</surname> <given-names>DT</given-names></name>. <article-title>A general method for numerically simulating the stochastic time evolution of coupled chemical reactions</article-title>. <source>Journal of computational physics</source>. <year>1976</year>;<volume>22</volume>(<issue>4</issue>):<fpage>403</fpage>–<lpage>434</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1016/0021-9991(76)90041-3" xlink:type="simple">10.1016/0021-9991(76)90041-3</ext-link></comment></mixed-citation>
</ref>
<ref id="pcbi.1007177.ref085">
<label>85</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Kimura</surname> <given-names>M</given-names></name>. <article-title>On the probability of fixation of mutant genes in a population</article-title>. <source>Genetics</source>. <year>1962</year>;<volume>47</volume>:<fpage>713</fpage>–<lpage>719</lpage>. <object-id pub-id-type="pmid">14456043</object-id></mixed-citation>
</ref>
<ref id="pcbi.1007177.ref086">
<label>86</label>
<mixed-citation publication-type="book" xlink:type="simple">
<name name-style="western"><surname>MacKay</surname> <given-names>DJC</given-names></name>. IV. In: <source>Information Theory, Inference, and Learning Algorithms</source>. <publisher-name>Cambridge University Press</publisher-name>; <year>2007</year>. p. <fpage>343</fpage>.</mixed-citation>
</ref>
</ref-list>
</back>
</article>