<?xml version="1.0" encoding="utf-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD v1.1d3 20150301//EN" "http://jats.nlm.nih.gov/publishing/1.1d3/JATS-journalpublishing1.dtd">
<article article-type="research-article" dtd-version="1.1d3" xml:lang="en" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink">
<front>
<journal-meta>
<journal-id journal-id-type="nlm-ta">PLoS Comput Biol</journal-id>
<journal-id journal-id-type="publisher-id">plos</journal-id>
<journal-id journal-id-type="pmc">ploscomp</journal-id>
<journal-title-group>
<journal-title>PLOS Computational Biology</journal-title>
</journal-title-group>
<issn pub-type="ppub">1553-734X</issn>
<issn pub-type="epub">1553-7358</issn>
<publisher>
<publisher-name>Public Library of Science</publisher-name>
<publisher-loc>San Francisco, CA USA</publisher-loc>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="publisher-id">PCOMPBIOL-D-18-01929</article-id>
<article-id pub-id-type="doi">10.1371/journal.pcbi.1006650</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Research Article</subject>
</subj-group>
</article-categories>
<title-group>
<article-title>BEAST 2.5: An advanced software platform for Bayesian evolutionary analysis</article-title>
<alt-title alt-title-type="running-head">BEAST 2.5 for Bayesian evolutionary analysis</alt-title>
</title-group>
<contrib-group>
<contrib contrib-type="author" corresp="yes" xlink:type="simple">
<contrib-id authenticated="true" contrib-id-type="orcid">http://orcid.org/0000-0001-6765-3813</contrib-id>
<name name-style="western">
<surname>Bouckaert</surname> <given-names>Remco</given-names></name>
<role content-type="http://credit.casrai.org/">Formal analysis</role>
<role content-type="http://credit.casrai.org/">Investigation</role>
<role content-type="http://credit.casrai.org/">Methodology</role>
<role content-type="http://credit.casrai.org/">Project administration</role>
<role content-type="http://credit.casrai.org/">Software</role>
<role content-type="http://credit.casrai.org/">Validation</role>
<role content-type="http://credit.casrai.org/">Visualization</role>
<role content-type="http://credit.casrai.org/">Writing – original draft</role>
<role content-type="http://credit.casrai.org/">Writing – review &amp; editing</role>
<xref ref-type="aff" rid="aff001"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff002"><sup>2</sup></xref>
<xref ref-type="corresp" rid="cor001">*</xref>
</contrib>
<contrib contrib-type="author" xlink:type="simple">
<name name-style="western">
<surname>Vaughan</surname> <given-names>Timothy G.</given-names></name>
<role content-type="http://credit.casrai.org/">Software</role>
<role content-type="http://credit.casrai.org/">Writing – original draft</role>
<role content-type="http://credit.casrai.org/">Writing – review &amp; editing</role>
<xref ref-type="aff" rid="aff003"><sup>3</sup></xref>
<xref ref-type="aff" rid="aff004"><sup>4</sup></xref>
</contrib>
<contrib contrib-type="author" xlink:type="simple">
<contrib-id authenticated="true" contrib-id-type="orcid">http://orcid.org/0000-0002-5220-5468</contrib-id>
<name name-style="western">
<surname>Barido-Sottani</surname> <given-names>Joëlle</given-names></name>
<role content-type="http://credit.casrai.org/">Software</role>
<xref ref-type="aff" rid="aff003"><sup>3</sup></xref>
<xref ref-type="aff" rid="aff004"><sup>4</sup></xref>
</contrib>
<contrib contrib-type="author" xlink:type="simple">
<contrib-id authenticated="true" contrib-id-type="orcid">http://orcid.org/0000-0002-2863-0907</contrib-id>
<name name-style="western">
<surname>Duchêne</surname> <given-names>Sebastián</given-names></name>
<role content-type="http://credit.casrai.org/">Software</role>
<xref ref-type="aff" rid="aff005"><sup>5</sup></xref>
</contrib>
<contrib contrib-type="author" xlink:type="simple">
<contrib-id authenticated="true" contrib-id-type="orcid">http://orcid.org/0000-0001-8153-9822</contrib-id>
<name name-style="western">
<surname>Fourment</surname> <given-names>Mathieu</given-names></name>
<role content-type="http://credit.casrai.org/">Software</role>
<xref ref-type="aff" rid="aff006"><sup>6</sup></xref>
</contrib>
<contrib contrib-type="author" xlink:type="simple">
<name name-style="western">
<surname>Gavryushkina</surname> <given-names>Alexandra</given-names></name>
<role content-type="http://credit.casrai.org/">Investigation</role>
<role content-type="http://credit.casrai.org/">Software</role>
<role content-type="http://credit.casrai.org/">Validation</role>
<role content-type="http://credit.casrai.org/">Writing – review &amp; editing</role>
<xref ref-type="aff" rid="aff007"><sup>7</sup></xref>
</contrib>
<contrib contrib-type="author" xlink:type="simple">
<contrib-id authenticated="true" contrib-id-type="orcid">http://orcid.org/0000-0002-2403-7997</contrib-id>
<name name-style="western">
<surname>Heled</surname> <given-names>Joseph</given-names></name>
<role content-type="http://credit.casrai.org/">Software</role>
<xref ref-type="aff" rid="aff008"><sup>8</sup></xref>
</contrib>
<contrib contrib-type="author" xlink:type="simple">
<contrib-id authenticated="true" contrib-id-type="orcid">http://orcid.org/0000-0002-9686-5871</contrib-id>
<name name-style="western">
<surname>Jones</surname> <given-names>Graham</given-names></name>
<role content-type="http://credit.casrai.org/">Software</role>
<role content-type="http://credit.casrai.org/">Writing – review &amp; editing</role>
<xref ref-type="aff" rid="aff009"><sup>9</sup></xref>
</contrib>
<contrib contrib-type="author" xlink:type="simple">
<contrib-id authenticated="true" contrib-id-type="orcid">http://orcid.org/0000-0002-5657-018X</contrib-id>
<name name-style="western">
<surname>Kühnert</surname> <given-names>Denise</given-names></name>
<role content-type="http://credit.casrai.org/">Software</role>
<xref ref-type="aff" rid="aff002"><sup>2</sup></xref>
</contrib>
<contrib contrib-type="author" xlink:type="simple">
<contrib-id authenticated="true" contrib-id-type="orcid">http://orcid.org/0000-0002-1776-8564</contrib-id>
<name name-style="western">
<surname>De Maio</surname> <given-names>Nicola</given-names></name>
<role content-type="http://credit.casrai.org/">Software</role>
<role content-type="http://credit.casrai.org/">Writing – original draft</role>
<role content-type="http://credit.casrai.org/">Writing – review &amp; editing</role>
<xref ref-type="aff" rid="aff010"><sup>10</sup></xref>
</contrib>
<contrib contrib-type="author" xlink:type="simple">
<name name-style="western">
<surname>Matschiner</surname> <given-names>Michael</given-names></name>
<role content-type="http://credit.casrai.org/">Data curation</role>
<role content-type="http://credit.casrai.org/">Software</role>
<role content-type="http://credit.casrai.org/">Visualization</role>
<role content-type="http://credit.casrai.org/">Writing – review &amp; editing</role>
<xref ref-type="aff" rid="aff011"><sup>11</sup></xref>
</contrib>
<contrib contrib-type="author" xlink:type="simple">
<contrib-id authenticated="true" contrib-id-type="orcid">http://orcid.org/0000-0001-6204-7208</contrib-id>
<name name-style="western">
<surname>Mendes</surname> <given-names>Fábio K.</given-names></name>
<role content-type="http://credit.casrai.org/">Software</role>
<role content-type="http://credit.casrai.org/">Writing – review &amp; editing</role>
<xref ref-type="aff" rid="aff001"><sup>1</sup></xref>
</contrib>
<contrib contrib-type="author" xlink:type="simple">
<name name-style="western">
<surname>Müller</surname> <given-names>Nicola F.</given-names></name>
<role content-type="http://credit.casrai.org/">Formal analysis</role>
<role content-type="http://credit.casrai.org/">Software</role>
<role content-type="http://credit.casrai.org/">Visualization</role>
<role content-type="http://credit.casrai.org/">Writing – original draft</role>
<xref ref-type="aff" rid="aff003"><sup>3</sup></xref>
<xref ref-type="aff" rid="aff004"><sup>4</sup></xref>
</contrib>
<contrib contrib-type="author" xlink:type="simple">
<contrib-id authenticated="true" contrib-id-type="orcid">http://orcid.org/0000-0003-1589-6885</contrib-id>
<name name-style="western">
<surname>Ogilvie</surname> <given-names>Huw A.</given-names></name>
<role content-type="http://credit.casrai.org/">Software</role>
<role content-type="http://credit.casrai.org/">Writing – original draft</role>
<role content-type="http://credit.casrai.org/">Writing – review &amp; editing</role>
<xref ref-type="aff" rid="aff012"><sup>12</sup></xref>
</contrib>
<contrib contrib-type="author" xlink:type="simple">
<name name-style="western">
<surname>du Plessis</surname> <given-names>Louis</given-names></name>
<role content-type="http://credit.casrai.org/">Formal analysis</role>
<role content-type="http://credit.casrai.org/">Software</role>
<role content-type="http://credit.casrai.org/">Visualization</role>
<role content-type="http://credit.casrai.org/">Writing – review &amp; editing</role>
<xref ref-type="aff" rid="aff013"><sup>13</sup></xref>
</contrib>
<contrib contrib-type="author" xlink:type="simple">
<name name-style="western">
<surname>Popinga</surname> <given-names>Alex</given-names></name>
<role content-type="http://credit.casrai.org/">Software</role>
<xref ref-type="aff" rid="aff001"><sup>1</sup></xref>
</contrib>
<contrib contrib-type="author" xlink:type="simple">
<name name-style="western">
<surname>Rambaut</surname> <given-names>Andrew</given-names></name>
<role content-type="http://credit.casrai.org/">Conceptualization</role>
<xref ref-type="aff" rid="aff014"><sup>14</sup></xref>
</contrib>
<contrib contrib-type="author" xlink:type="simple">
<name name-style="western">
<surname>Rasmussen</surname> <given-names>David</given-names></name>
<role content-type="http://credit.casrai.org/">Software</role>
<xref ref-type="aff" rid="aff015"><sup>15</sup></xref>
</contrib>
<contrib contrib-type="author" xlink:type="simple">
<contrib-id authenticated="true" contrib-id-type="orcid">http://orcid.org/0000-0003-2595-3062</contrib-id>
<name name-style="western">
<surname>Siveroni</surname> <given-names>Igor</given-names></name>
<role content-type="http://credit.casrai.org/">Software</role>
<xref ref-type="aff" rid="aff016"><sup>16</sup></xref>
</contrib>
<contrib contrib-type="author" xlink:type="simple">
<contrib-id authenticated="true" contrib-id-type="orcid">http://orcid.org/0000-0001-9818-479X</contrib-id>
<name name-style="western">
<surname>Suchard</surname> <given-names>Marc A.</given-names></name>
<role content-type="http://credit.casrai.org/">Conceptualization</role>
<xref ref-type="aff" rid="aff017"><sup>17</sup></xref>
</contrib>
<contrib contrib-type="author" xlink:type="simple">
<name name-style="western">
<surname>Wu</surname> <given-names>Chieh-Hsi</given-names></name>
<role content-type="http://credit.casrai.org/">Software</role>
<xref ref-type="aff" rid="aff018"><sup>18</sup></xref>
</contrib>
<contrib contrib-type="author" xlink:type="simple">
<name name-style="western">
<surname>Xie</surname> <given-names>Dong</given-names></name>
<role content-type="http://credit.casrai.org/">Software</role>
<xref ref-type="aff" rid="aff001"><sup>1</sup></xref>
</contrib>
<contrib contrib-type="author" xlink:type="simple">
<contrib-id authenticated="true" contrib-id-type="orcid">http://orcid.org/0000-0001-6009-5273</contrib-id>
<name name-style="western">
<surname>Zhang</surname> <given-names>Chi</given-names></name>
<role content-type="http://credit.casrai.org/">Software</role>
<role content-type="http://credit.casrai.org/">Visualization</role>
<role content-type="http://credit.casrai.org/">Writing – review &amp; editing</role>
<xref ref-type="aff" rid="aff019"><sup>19</sup></xref>
</contrib>
<contrib contrib-type="author" xlink:type="simple">
<contrib-id authenticated="true" contrib-id-type="orcid">http://orcid.org/0000-0001-6431-535X</contrib-id>
<name name-style="western">
<surname>Stadler</surname> <given-names>Tanja</given-names></name>
<role content-type="http://credit.casrai.org/">Conceptualization</role>
<role content-type="http://credit.casrai.org/">Methodology</role>
<role content-type="http://credit.casrai.org/">Supervision</role>
<role content-type="http://credit.casrai.org/">Writing – original draft</role>
<role content-type="http://credit.casrai.org/">Writing – review &amp; editing</role>
<xref ref-type="aff" rid="aff003"><sup>3</sup></xref>
<xref ref-type="aff" rid="aff004"><sup>4</sup></xref>
</contrib>
<contrib contrib-type="author" corresp="yes" xlink:type="simple">
<contrib-id authenticated="true" contrib-id-type="orcid">http://orcid.org/0000-0003-4454-2576</contrib-id>
<name name-style="western">
<surname>Drummond</surname> <given-names>Alexei J.</given-names></name>
<role content-type="http://credit.casrai.org/">Conceptualization</role>
<role content-type="http://credit.casrai.org/">Funding acquisition</role>
<role content-type="http://credit.casrai.org/">Methodology</role>
<role content-type="http://credit.casrai.org/">Project administration</role>
<role content-type="http://credit.casrai.org/">Resources</role>
<role content-type="http://credit.casrai.org/">Software</role>
<role content-type="http://credit.casrai.org/">Supervision</role>
<role content-type="http://credit.casrai.org/">Visualization</role>
<role content-type="http://credit.casrai.org/">Writing – original draft</role>
<role content-type="http://credit.casrai.org/">Writing – review &amp; editing</role>
<xref ref-type="aff" rid="aff001"><sup>1</sup></xref>
<xref ref-type="corresp" rid="cor001">*</xref>
</contrib>
</contrib-group>
<aff id="aff001">
<label>1</label>
<addr-line>Centre of Computational Evolution, University of Auckland, Auckland, New Zealand</addr-line>
</aff>
<aff id="aff002">
<label>2</label>
<addr-line>Max Planck Institute for the Science of Human History, Jena, Germany</addr-line>
</aff>
<aff id="aff003">
<label>3</label>
<addr-line>ETH Zürich, Department of Biosystems Science and Engineering, 4058 Basel, Switzerland</addr-line>
</aff>
<aff id="aff004">
<label>4</label>
<addr-line>Swiss Institute of Bioinformatics, Lausanne, Switzerland</addr-line>
</aff>
<aff id="aff005">
<label>5</label>
<addr-line>Department of Biochemistry and Molecular Biology, University of Melbourne, Melbourne, Victoria, Australia</addr-line>
</aff>
<aff id="aff006">
<label>6</label>
<addr-line>ithree institute, University of Technology Sydney, Sydney, Australia</addr-line>
</aff>
<aff id="aff007">
<label>7</label>
<addr-line>Department of Biochemistry, University of Otago, Dunedin 9016, New Zealand</addr-line>
</aff>
<aff id="aff008">
<label>8</label>
<addr-line>Independent researcher, Auckland, New Zealand</addr-line>
</aff>
<aff id="aff009">
<label>9</label>
<addr-line>Department of Biological and Environmental Sciences, University of Gothenburg, Box 461, SE 405 30 Göteborg, Sweden</addr-line>
</aff>
<aff id="aff010">
<label>10</label>
<addr-line>European Molecular Biology Laboratory, European Bioinformatics Institute (EMBL-EBI), Cambridgeshire, UK</addr-line>
</aff>
<aff id="aff011">
<label>11</label>
<addr-line>Department of Environmental Sciences, University of Basel, 4051 Basel, Switzerland</addr-line>
</aff>
<aff id="aff012">
<label>12</label>
<addr-line>Department of Computer Science, Rice University, Houston, TX 77005-1892, USA</addr-line>
</aff>
<aff id="aff013">
<label>13</label>
<addr-line>Department of Zoology, University of Oxford, Oxford, OX1 3PS, UK</addr-line>
</aff>
<aff id="aff014">
<label>14</label>
<addr-line>Institute of Evolutionary Biology, University of Edinburgh, Ashworth Laboratories, Edinburgh, EH9 3FL UK</addr-line>
</aff>
<aff id="aff015">
<label>15</label>
<addr-line>Department of Entomology and Plant Pathology, North Carolina State University, Raleigh, NC 27695, USA</addr-line>
</aff>
<aff id="aff016">
<label>16</label>
<addr-line>Department of Infectious Disease Epidemiology, Imperial College London, Norfolk Place, W2 1PG, UK</addr-line>
</aff>
<aff id="aff017">
<label>17</label>
<addr-line>Department of Biomathematics, David Geffen School of Medicine, University of California, Los Angeles, CA, USA</addr-line>
</aff>
<aff id="aff018">
<label>18</label>
<addr-line>Department of Statistics, University of Oxford, OX1 3LB, UK</addr-line>
</aff>
<aff id="aff019">
<label>19</label>
<addr-line>Institute of Vertebrate Paleontology and Paleoanthropology, Chinese Academy of Sciences, Beijing, China</addr-line>
</aff>
<contrib-group>
<contrib contrib-type="editor" xlink:type="simple">
<name name-style="western">
<surname>Pertea</surname> <given-names>Mihaela</given-names></name>
<role>Editor</role>
<xref ref-type="aff" rid="edit1"/>
</contrib>
</contrib-group>
<aff id="edit1">
<addr-line>Johns Hopkins University, UNITED STATES</addr-line>
</aff>
<author-notes>
<fn fn-type="conflict" id="coi001">
<p>The authors have declared that no competing interests exist.</p>
</fn>
<corresp id="cor001">* E-mail: <email xlink:type="simple">r.bouckaert@auckland.ac.nz</email> (RB); <email xlink:type="simple">alexei@cs.auckland.ac.nz</email> (AJD)</corresp>
</author-notes>
<pub-date pub-type="collection">
<month>4</month>
<year>2019</year>
</pub-date>
<pub-date pub-type="epub">
<day>8</day>
<month>4</month>
<year>2019</year>
</pub-date>
<volume>15</volume>
<issue>4</issue>
<elocation-id>e1006650</elocation-id>
<history>
<date date-type="received">
<day>14</day>
<month>11</month>
<year>2018</year>
</date>
<date date-type="accepted">
<day>4</day>
<month>2</month>
<year>2019</year>
</date>
</history>
<permissions>
<copyright-year>2019</copyright-year>
<copyright-holder>Bouckaert et al</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/" xlink:type="simple">
<license-p>This is an open access article distributed under the terms of the <ext-link ext-link-type="uri" xlink:href="http://creativecommons.org/licenses/by/4.0/" xlink:type="simple">Creative Commons Attribution License</ext-link>, which permits unrestricted use, distribution, and reproduction in any medium, provided the original author and source are credited.</license-p>
</license>
</permissions>
<self-uri content-type="pdf" xlink:href="info:doi/10.1371/journal.pcbi.1006650"/>
<abstract>
<p>Elaboration of Bayesian phylogenetic inference methods has continued at pace in recent years with major new advances in nearly all aspects of the joint modelling of evolutionary data. It is increasingly appreciated that some evolutionary questions can only be adequately answered by combining evidence from multiple independent sources of data, including genome sequences, sampling dates, phenotypic data, radiocarbon dates, fossil occurrences, and biogeographic range information among others. Including all relevant data into a single joint model is very challenging both conceptually and computationally. Advanced computational software packages that allow robust development of compatible (sub-)models which can be composed into a full model hierarchy have played a key role in these developments. Developing such software frameworks is increasingly a major scientific activity in its own right, and comes with specific challenges, from practical software design, development and engineering challenges to statistical and conceptual modelling challenges. BEAST 2 is one such computational software platform, and was first announced over 4 years ago. Here we describe a series of major new developments in the BEAST 2 core platform and model hierarchy that have occurred since the first release of the software, culminating in the recent 2.5 release.</p>
</abstract>
<abstract abstract-type="summary">
<title>Author summary</title>
<p>Bayesian phylogenetic inference methods have undergone considerable development in recent years, and joint modelling of rich evolutionary data, including genomes, phenotypes and fossil occurrences, is increasingly common. Advanced computational software packages that allow robust development of compatible (sub-)models which can be composed into a full model hierarchy have played a key role in these developments. Developing scientific software is increasingly crucial to advancement in many fields of biology. The challenges range from practical software development and engineering, distributed team coordination, conceptual development and statistical modelling, to validation and testing. BEAST 2 is one such computational software platform for phylogenetics, population genetics and phylodynamics, and was first announced over 4 years ago. Here we describe the full range of new tools and models available on the BEAST 2.5 platform, which expand joint evolutionary inference in many new directions, especially for joint inference over multiple data types, non-tree models and complex phylodynamics.</p>
</abstract>
<funding-group>
<award-group id="award001">
<funding-source>
<institution-wrap>
<institution-id institution-id-type="funder-id">http://dx.doi.org/10.13039/501100009193</institution-id>
<institution>Marsden Fund</institution>
</institution-wrap>
</funding-source>
<award-id>16-UOA-277</award-id>
<principal-award-recipient>
<contrib-id authenticated="true" contrib-id-type="orcid">http://orcid.org/0000-0003-4454-2576</contrib-id>
<name name-style="western">
<surname>Drummond</surname> <given-names>Alexei J.</given-names></name>
</principal-award-recipient>
</award-group>
<funding-statement>AJD would like to acknowledge support from a Royal Society of New Zealand Marsden award (#UOA1611; 16-UOA-277). LdP would like to acknowledge support from the European Research Council under the Seventh Framework Programme of the European Commission (PATHPHYLODYN: grant agreement number 614725). IS would like to acknowledge support from the NIH MIDAS U01 GM110749 grant. NFM and TS are funded in part by the Swiss National Science Foundation (SNF; grant number CR32I3 166258). TS, JB-S, LdP, TGV, and CZ were supported in part by the European Research Council under the Seventh Framework Programme of the European Commission (PhyPD: grant agreement number 335529). DK would like to acknowledge support from the Max Planck Society. NDM was supported by EMBL. MM acknowledges support from the Swiss National Science Foundation (SNF; grant number PBBSP3-138680). The funders had no role in study design, data collection and analysis, decision to publish, or preparation of the manuscript.</funding-statement>
</funding-group>
<counts>
<fig-count count="6"/>
<table-count count="1"/>
<page-count count="28"/>
</counts>
<custom-meta-group>
<custom-meta>
<meta-name>PLOS Publication Stage</meta-name>
<meta-value>vor-update-to-uncorrected-proof</meta-value>
</custom-meta>
<custom-meta>
<meta-name>Publication Update</meta-name>
<meta-value>2019-04-18</meta-value>
</custom-meta>
<custom-meta id="data-availability">
<meta-name>Data Availability</meta-name>
<meta-value>The XML file and log files used for the bModelTest analyses shown in <xref ref-type="fig" rid="pcbi.1006650.g002">Fig 2</xref> are available from <ext-link ext-link-type="uri" xlink:href="http://www.doi.org/10.5281/zenodo.1475369" xlink:type="simple">http://www.doi.org/10.5281/zenodo.1475369</ext-link>. The XML file, log file, MCC tree and post-processing scripts for the bdsky analyses shown in <xref ref-type="fig" rid="pcbi.1006650.g003">Fig 3</xref> are available from <ext-link ext-link-type="uri" xlink:href="http://www.doi.org/10.5281/zenodo.1476124" xlink:type="simple">http://www.doi.org/10.5281/zenodo.1476124</ext-link>. The alignments, XML files, log files and post processing scripts for the AIM analysis shown in <xref ref-type="fig" rid="pcbi.1006650.g005">Fig 5</xref> can be found at <ext-link ext-link-type="uri" xlink:href="https://github.com/nicfel/Neolamprologus" xlink:type="simple">https://github.com/nicfel/Neolamprologus</ext-link>. The XML files and a script to generate the TreeModelAdequacy analyses shown in <xref ref-type="fig" rid="pcbi.1006650.g006">Fig 6</xref> are available from <ext-link ext-link-type="uri" xlink:href="http://doi.org/10.5281/zenodo.1473852" xlink:type="simple">http://doi.org/10.5281/zenodo.1473852</ext-link>.</meta-value>
</custom-meta>
</custom-meta-group>
</article-meta>
</front>
<body>
<disp-quote>
<p>This is a PLOS Computational Biology Software paper.</p>
</disp-quote>
<sec id="sec001" sec-type="intro">
<title>Introduction</title>
<p>Bayesian Evolutionary Analysis by Sampling Trees (BEAST) is a software package for performing Bayesian phylogenetic and phylodynamic analyses. BEAST samples from the posterior distribution of trees (or networks) and parameters given the input data using the Markov chain Monte Carlo (MCMC) algorithm. Four years ago, BEAST 2 [<xref ref-type="bibr" rid="pcbi.1006650.ref001">1</xref>, <xref ref-type="bibr" rid="pcbi.1006650.ref002">2</xref>] was published as a complete rewrite of the original BEAST software. A main goal of this rewrite was to develop a more modular software framework, one that could be easily extended by third parties. The software platform is comprised of various standalone programs including BEAUti (a graphical user interface [GUI] for setting up an analysis), BEAST to run MCMC analysis, and post processing tools such as LogAnalyser, LogCombiner, TreeAnnotator, DensiTree [<xref ref-type="bibr" rid="pcbi.1006650.ref003">3</xref>], as well as a package manager.</p>
<p>Shortly after its release, a number of packages were added, such as MASTER for simulating stochastic population dynamics models [<xref ref-type="bibr" rid="pcbi.1006650.ref004">4</xref>], MultiTypeTree for inferring structured coalescent models [<xref ref-type="bibr" rid="pcbi.1006650.ref005">5</xref>], RBS for reversible jump across substitution models [<xref ref-type="bibr" rid="pcbi.1006650.ref006">6</xref>], SNAPP for multispecies coalescent over SNP data [<xref ref-type="bibr" rid="pcbi.1006650.ref007">7</xref>], subst-bma for Bayesian model averaging over site models [<xref ref-type="bibr" rid="pcbi.1006650.ref008">8</xref>], and BDSKY for the birth-death skyline tree model [<xref ref-type="bibr" rid="pcbi.1006650.ref009">9</xref>]. All these packages have been very popular in their own right, and since the initial release of BEAST 2 a large amount of functionality and many further packages have been added, showing the success of the approach. In this paper, we summarize the significant advances that have been made.</p>
<sec id="sec002">
<title>What is BEAST?</title>
<p>BEAST is a package for conducting Bayesian phylogenetic inference using MCMC. At its core are rooted time trees (or time networks in latest developments), which can be inferred from multiple sources of data. BEAST supports sequence data for nucleotides, amino acids, codon models, discrete and continuous morphological features, language, microsatellites and SNPs as well as user-defined discrete and biogeographical data. Bayesian inference allows the incorporation of many sources of information in the same analysis, such as DNA sequences from extant and extinct species, combined with information from the fossil record. Apart from inferring rooted time trees, which are valuable in and of themselves [<xref ref-type="bibr" rid="pcbi.1006650.ref010">10</xref>], BEAST also allows addressing many kinds of micro- and macroevolutionary questions, such as determining the age and location of the origin of species and cultures, rates of mutation and migration, and rate of spread of epidemics.</p>
</sec>
</sec>
<sec id="sec003">
<title>New BEAST functionality</title>
<p>At the core of BEAST is its MCMC sampling mechanism. This mechanism has been improved for better performance, which is especially useful for analyses with a large number of taxa but little data, such as a geography-only analysis. The calculation of Felsenstein’s likelihood, i.e., the probability of sequence data given a tree or network and model parameters, which typically takes up the bulk of computing time, has been made more efficient for the case where there is a proportion of invariable sites.</p>
<p>BEAUti has been improved so as to make it easier and more intuitive to set up an analysis. For example, when many tip or clade calibrations are required, these can now be read from a NEXUS file, which tends to be easier to manage than editing calibrations one by one in a GUI. BEAUti now also allows specification of custom tree priors, such as multiple monophyletic constraints encoded as a multifurcating tree in Newick format, as well as switching top-level analyses from MCMC to nested sampling, for example.</p>
<p>While the core of BEAST 2 provides basic functionality for Bayesian phylogenetic analyses, it is mostly a platform for building packages on. Package management has matured to include a command line as well as graphical user interface that can deal with different package repositories. Different versions of packages can be installed at the same time. This is as practical as it is important for reproducibility, because an analysis specification file (the BEAST XML file) generated using an older package version can still be run using that older version without the usual necessity of uninstalling the latest package release. Packages are linked by the GUI to websites, making it easy to find information such as tutorials and user documentation. Packages can also be automatically updated to ensure the latest bug fixes and new features are available.</p>
<p>Finally, BEAST 2 and its tools have been improved and extended to facilitate the implementation of several new packages, which have also been made faster as well as more efficient in their memory usage. The new packages contain most of the new features. In particular, (i) the time trees were extended to generalized phylogenetic structures, (ii) new models for the existing and new structures were developed, (iii) tools for model selection were developed, and (iv) tools for simulating under such models were implemented. We outline these advances in the rest of this paper.</p>
</sec>
<sec id="sec004">
<title>Beyond time trees: Extended phylogenetic structures</title>
<p>BEAST software packages have always dealt exclusively with phylogenetic trees that have an explicit time dimension. The developers of BEAST (and some other Bayesian phylogenetics packages) have championed the notion that time is a fundamental dimension to connect independent sources of evidence about evolution and ancestry; in other words, all evolutionary hypotheses should have the time dimension as an explicit part of their parameterisation. The attraction of doing so is manifold, and has been the primary means by which different quantitative theories from phylo- and population genetics have been melded together into increasingly sophisticated hierarchical phylogenetic models that are now starting to be more regularly employed.</p>
<p>The ancestral structures estimated by BEAST all have a time dimension, but they are not all the classic binary rooted time trees with samples at the tips. Generalizations of a binary rooted time tree structure (<xref ref-type="fig" rid="pcbi.1006650.g001">Fig 1a</xref>) are essential in certain cases, for example:</p>
<list list-type="bullet">
<list-item>
<p><bold>population and transmission trees</bold>: branches represent not one lineage, but entire populations (or species) [<xref ref-type="bibr" rid="pcbi.1006650.ref007">7</xref>, <xref ref-type="bibr" rid="pcbi.1006650.ref011">11</xref>], and branching events represent population splits (or speciation or transmission events) [<xref ref-type="bibr" rid="pcbi.1006650.ref012">12</xref>] (<xref ref-type="fig" rid="pcbi.1006650.g001">Fig 1b</xref>),</p>
</list-item>
<list-item>
<p><bold>sampled ancestors</bold>: fossils may be direct ancestors of other fossils or extant species [<xref ref-type="bibr" rid="pcbi.1006650.ref013">13</xref>] (<xref ref-type="fig" rid="pcbi.1006650.g001">Fig 1d</xref>),</p>
</list-item>
<list-item>
<p><bold>structured populations</bold>: branches are painted according to which population the individual belongs to [<xref ref-type="bibr" rid="pcbi.1006650.ref005">5</xref>] (<xref ref-type="fig" rid="pcbi.1006650.g001">Fig 1c</xref>),</p>
</list-item>
<list-item>
<p><bold>clonal frame ancestral recombination graph</bold>: some gene regions have alternative parent edges added to a “clonal frame” phylogeny, resulting in a tree-based network [<xref ref-type="bibr" rid="pcbi.1006650.ref014">14</xref>] (<xref ref-type="fig" rid="pcbi.1006650.g001">Fig 1e</xref>),</p>
</list-item>
<list-item>
<p><bold>species networks</bold>: hybridization or admixture after isolation events are included in the species history (so that the species history is a directed network) but gene histories (genealogies) are still represented by binary trees [<xref ref-type="bibr" rid="pcbi.1006650.ref015">15</xref>] (<xref ref-type="fig" rid="pcbi.1006650.g001">Fig 1f</xref>),</p>
</list-item>
<list-item>
<p><bold>polytomies</bold>: one individual gives rise to many lineages at the same time.</p>
</list-item>
</list>
<fig id="pcbi.1006650.g001" position="float">
<object-id pub-id-type="doi">10.1371/journal.pcbi.1006650.g001</object-id>
<label>Fig 1</label>
<caption>
<title>Phylogenetic structures available in BEAST 2.</title>
<p>(a) A tip-dated time tree, with leaf times as boundary conditions but not data (generally a coalescent prior is applied in this setting). (b) A species tree with one or more embedded gene trees. (c) A multi-type time tree has measured types at the leaves and the type changes that paint the ancestral lineages in the tree are sampled as latent variables by MCMC. (d) A sampled ancestor tree, with two types of sampling events: extinct species (red) and extant species (blue). Extinct species can be leaves or, if they are the direct ancestor of another sample, degree-2 sampled ancestor nodes. (e) An ancestral gene conversion graph is composed of a clonal frame (solid time tree) and an extra edge and gene boundaries for each gene conversion event. (f) A species network with one or more embedded gene trees.</p>
</caption>
<graphic mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pcbi.1006650.g001" xlink:type="simple"/>
</fig>
<p>Since the first release of BEAST 2, a range of Metropolis-Hastings proposal distributions has been developed to sample these extended phylogenetic data structures using MCMC. Additionally, we need to assume a phylogenetic (or “tree”) prior or model for each such phylogenetic structure. This expansion of the space of possible hypotheses that can be addressed by BEAST 2 continues at pace. In the next section, we will highlight the generative priors for the first four classes of extended phylogenetic structures as well as recent advances on new models for classic binary rooted time trees. In addition, some of us (TGV, TS) are currently working on including time tree polytomies in BEAST 2, as may be relevant to, for example, super-spreading events in infectious disease.</p>
</sec>
<sec id="sec005">
<title>New models</title>
<p>A Bayesian phylodynamic analysis requires the specification of a model for substitutions, a clock model, and a population dynamic model generating the phylogenetic structure, whether that be a tree, a phylogenetic network or a hierarchical combination of the two. These models induce probability distributions for the proposed states of the MCMC, which samples from the posterior distribution
<disp-formula id="pcbi.1006650.e001"><alternatives><graphic id="pcbi.1006650.e001g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pcbi.1006650.e001" xlink:type="simple"/><mml:math display="block" id="M1"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="right"><mml:mrow><mml:mi>P</mml:mi> <mml:mo>(</mml:mo> <mml:mi>T</mml:mi> <mml:mo>,</mml:mo> <mml:mi>θ</mml:mi> <mml:mo>|</mml:mo> <mml:mi>D</mml:mi> <mml:mo>)</mml:mo> <mml:mo>∝</mml:mo> <mml:mi>P</mml:mi> <mml:mo>(</mml:mo> <mml:mi>D</mml:mi> <mml:mo>|</mml:mo> <mml:mi>T</mml:mi> <mml:mo>,</mml:mo> <mml:mi>θ</mml:mi> <mml:mo>)</mml:mo> <mml:mi>P</mml:mi> <mml:mo>(</mml:mo> <mml:mi>T</mml:mi> <mml:mo>|</mml:mo> <mml:mi>θ</mml:mi> <mml:mo>)</mml:mo> <mml:mi>P</mml:mi> <mml:mo>(</mml:mo> <mml:mi>θ</mml:mi> <mml:mo>)</mml:mo> <mml:mo>.</mml:mo></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives></disp-formula></p>
<p>Here <italic>D</italic> is the sequence data and any other sort of data, <italic>T</italic> is the phylogenetic structure as introduced in the previous section, and <italic>θ</italic> is the collection of the phylodynamic model parameters, as well as parameters for the substitution, site and branch rate sub-models. The strength of BEAST 2 is that developers can contribute new (sub-)models via packages. <xref ref-type="table" rid="pcbi.1006650.t001">Table 1</xref> shows the majority of currently available packages—ordered by their features. An up-to-date list of packages can be seen either from the <italic>Package Manager</italic> embedded in BEAST 2 or using <italic>Package Viewer</italic> (<ext-link ext-link-type="uri" xlink:href="http://compevol.github.io/CBAN/" xlink:type="simple">http://compevol.github.io/CBAN/</ext-link>) online.</p>
<table-wrap id="pcbi.1006650.t001" position="float">
<object-id pub-id-type="doi">10.1371/journal.pcbi.1006650.t001</object-id>
<label>Table 1</label>
<caption>
<title>BEAST 2 packages.</title>
</caption>
<alternatives>
<graphic id="pcbi.1006650.t001g" mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pcbi.1006650.t001" xlink:type="simple"/>
<table border="0" frame="box" rules="all">
<colgroup>
<col align="left" valign="middle"/>
<col align="left" valign="middle"/>
<col align="left" valign="middle"/>
<col align="left" valign="middle"/>
</colgroup>
<thead>
<tr>
<th align="center" style="border-top:thick;border-bottom:thick">Package</th>
<th align="center" style="border-top:thick;border-bottom:thick">Subspecification</th>
<th align="center" style="border-top:thick;border-bottom:thick">Special Feature</th>
<th align="center" style="border-top:thick;border-bottom:thick">Reference</th>
</tr>
</thead>
<tbody>
<tr>
<td align="center"><italic>Substitution models</italic>:</td>
<td align="center"/>
<td align="center"/>
<td align="center"/>
</tr>
<tr>
<td align="center">bModelTest</td>
<td align="center">nucleotide subst.<xref ref-type="table-fn" rid="t001fn002"><sup>1</sup></xref> model</td>
<td align="center">model averaging, model comparison</td>
<td align="center">[<xref ref-type="bibr" rid="pcbi.1006650.ref016">16</xref>]</td>
</tr>
<tr>
<td align="center">SSM</td>
<td align="center">nucleotide subst. model</td>
<td align="center">standard named nucleotide models</td>
<td align="center">-</td>
</tr>
<tr>
<td align="center">CodonSubstModels</td>
<td align="center">codon subst. model</td>
<td align="center">M0</td>
<td align="center">[<xref ref-type="bibr" rid="pcbi.1006650.ref017">17</xref>, <xref ref-type="bibr" rid="pcbi.1006650.ref018">18</xref>]</td>
</tr>
<tr>
<td align="center">MM</td>
<td align="center">morphological model</td>
<td align="center">discrete</td>
<td align="center">[<xref ref-type="bibr" rid="pcbi.1006650.ref019">19</xref>]</td>
</tr>
<tr>
<td align="center">BEASTvntr</td>
<td align="center">microsatellite model</td>
<td align="center">variable number of tandem repeat data</td>
<td align="center">[<xref ref-type="bibr" rid="pcbi.1006650.ref020">20</xref>, <xref ref-type="bibr" rid="pcbi.1006650.ref021">21</xref>]</td>
</tr>
<tr>
<td align="center">RBS</td>
<td align="center">subst.<xref ref-type="table-fn" rid="t001fn002"><sup>1</sup></xref> model</td>
<td align="center">model averaging for contiguous site partitions</td>
<td align="center">[<xref ref-type="bibr" rid="pcbi.1006650.ref006">6</xref>]</td>
</tr>
<tr>
<td align="center">PoMo</td>
<td align="center">nucleotide subst. model</td>
<td align="center">mutation-selection<break/>&amp; species tree</td>
<td align="center">[<xref ref-type="bibr" rid="pcbi.1006650.ref022">22</xref>]<break/>[<xref ref-type="bibr" rid="pcbi.1006650.ref011">11</xref>]</td>
</tr>
<tr>
<td align="center"><italic>Site models</italic>:</td>
<td align="center"/>
<td align="center"/>
<td align="center"/>
</tr>
<tr>
<td align="center">MGSM</td>
<td align="center">site model</td>
<td align="center">multi-gamma &amp; relaxed gamma</td>
<td align="center">[<xref ref-type="bibr" rid="pcbi.1006650.ref023">23</xref>]</td>
</tr>
<tr>
<td align="center">substBMA</td>
<td align="center">site model</td>
<td align="center">Dirichlet mixture model for site partitions</td>
<td align="center">[<xref ref-type="bibr" rid="pcbi.1006650.ref008">8</xref>]</td>
</tr>
<tr>
<td align="center"><italic>Clock model</italic>:</td>
<td align="center"/>
<td align="center"/>
<td align="center"/>
</tr>
<tr>
<td align="center">FLC</td>
<td align="center">molecular clock model</td>
<td align="center">strict and relaxed clocks within local clock model</td>
<td align="center">[<xref ref-type="bibr" rid="pcbi.1006650.ref024">24</xref>]</td>
</tr>
<tr>
<td align="center"><italic>Tree models</italic>:</td>
<td align="center"/>
<td align="center"/>
<td align="center"/>
</tr>
<tr>
<td align="center">SA</td>
<td align="center">unstructured population, non-par.<xref ref-type="table-fn" rid="t001fn003"><sup>2</sup></xref></td>
<td align="center">sampled ancestor<xref ref-type="table-fn" rid="t001fn001">*</xref> / fossilized BD<xref ref-type="table-fn" rid="t001fn004"><sup>3</sup></xref></td>
<td align="center">[<xref ref-type="bibr" rid="pcbi.1006650.ref013">13</xref>]</td>
</tr>
<tr>
<td align="center">CA</td>
<td align="center">unstructured population, non-par.</td>
<td align="center">calibration density, sampling rate estimate</td>
<td align="center">[<xref ref-type="bibr" rid="pcbi.1006650.ref025">25</xref>]</td>
</tr>
<tr>
<td align="center" rowspan="2">BDSKY</td>
<td align="center" rowspan="2">unstructured population, non-par.</td>
<td align="center">BD serial skyline<xref ref-type="table-fn" rid="t001fn001">*</xref>, BD serial sampling</td>
<td align="center">[<xref ref-type="bibr" rid="pcbi.1006650.ref009">9</xref>]</td>
</tr>
<tr>
<td align="center">BD incomplete sampling (no <italic>ψ</italic>)</td>
<td align="center">[<xref ref-type="bibr" rid="pcbi.1006650.ref026">26</xref>]</td>
</tr>
<tr>
<td align="center" rowspan="2">phylodynamics</td>
<td align="center" rowspan="2">unstructured population, par.<xref ref-type="table-fn" rid="t001fn003"><sup>2</sup></xref></td>
<td align="center">deterministic closed SIR, stochastic closed SIR</td>
<td align="center">[<xref ref-type="bibr" rid="pcbi.1006650.ref027">27</xref>]</td>
</tr>
<tr>
<td align="center">birth-death SIR</td>
<td align="center">[<xref ref-type="bibr" rid="pcbi.1006650.ref028">28</xref>]</td>
</tr>
<tr>
<td align="center">EpiInf</td>
<td align="center">unstructured population, par.</td>
<td align="center">prevalence estimation, particle filtering</td>
<td align="center">[<xref ref-type="bibr" rid="pcbi.1006650.ref029">29</xref>]</td>
</tr>
<tr>
<td align="center">PhyDyn</td>
<td align="center">unstructured and structured populations, par.</td>
<td align="center">define epidemic model by ODEs<xref ref-type="table-fn" rid="t001fn005"><sup>4</sup></xref></td>
<td align="center">[<xref ref-type="bibr" rid="pcbi.1006650.ref030">30</xref>]</td>
</tr>
<tr>
<td align="center">MultiTypeTree</td>
<td align="center">structured population</td>
<td align="center">structured tree</td>
<td align="center">[<xref ref-type="bibr" rid="pcbi.1006650.ref005">5</xref>]</td>
</tr>
<tr>
<td align="center">BadTrIP</td>
<td align="center">structured population</td>
<td align="center">within-host, transmission inference</td>
<td align="center">[<xref ref-type="bibr" rid="pcbi.1006650.ref012">12</xref>]</td>
</tr>
<tr>
<td align="center">BDMM</td>
<td align="center">structured population</td>
<td align="center">multitype BD<xref ref-type="table-fn" rid="t001fn004"><sup>3</sup></xref> model and sampled ancestors</td>
<td align="center">[<xref ref-type="bibr" rid="pcbi.1006650.ref031">31</xref>]</td>
</tr>
<tr>
<td align="center">BASTA</td>
<td align="center">structured population</td>
<td align="center">approx. structured coalescent</td>
<td align="center">[<xref ref-type="bibr" rid="pcbi.1006650.ref032">32</xref>]</td>
</tr>
<tr>
<td align="center">MASCOT</td>
<td align="center">structured population</td>
<td align="center">approx. structured coalescent and time variant GLMs</td>
<td align="center">[<xref ref-type="bibr" rid="pcbi.1006650.ref033">33</xref>, <xref ref-type="bibr" rid="pcbi.1006650.ref034">34</xref>]</td>
</tr>
<tr>
<td align="center">SCOTTI</td>
<td align="center">structured population</td>
<td align="center">transmission inference</td>
<td align="center">[<xref ref-type="bibr" rid="pcbi.1006650.ref035">35</xref>]</td>
</tr>
<tr>
<td align="center">BREAK AWAY</td>
<td align="center">geographical model</td>
<td align="center">break-away model of phylogeography</td>
<td align="center">[<xref ref-type="bibr" rid="pcbi.1006650.ref036">36</xref>]</td>
</tr>
<tr>
<td align="center">GEO SPRE</td>
<td align="center">geographical model</td>
<td align="center">whole world phylogeography</td>
<td align="center">[<xref ref-type="bibr" rid="pcbi.1006650.ref037">37</xref>]</td>
</tr>
<tr>
<td align="center">SSE</td>
<td align="center">Geographical and structured population</td>
<td align="center">State-dependent birth-death + cladogenetic events</td>
<td align="center">[<xref ref-type="bibr" rid="pcbi.1006650.ref038">38</xref>]</td>
</tr>
<tr>
<td align="center"><italic>Network models</italic>:</td>
<td align="center"/>
<td align="center"/>
<td align="center"/>
</tr>
<tr>
<td align="center">BACTER</td>
<td align="center">network model</td>
<td align="center">clonal frame ancestral recombination graph</td>
<td align="center">[<xref ref-type="bibr" rid="pcbi.1006650.ref014">14</xref>, <xref ref-type="bibr" rid="pcbi.1006650.ref039">39</xref>]</td>
</tr>
<tr>
<td align="center">SpeciesNetwork</td>
<td align="center">network model</td>
<td align="center">species networks</td>
<td align="center">[<xref ref-type="bibr" rid="pcbi.1006650.ref015">15</xref>]</td>
</tr>
<tr>
<td align="center"><italic>Nested models</italic>:</td>
<td align="center"/>
<td align="center"/>
<td align="center"/>
</tr>
<tr>
<td align="center">DENIM</td>
<td align="center">multispecies coalescent</td>
<td align="center">species tree estimation with gene flow</td>
<td align="center">[<xref ref-type="bibr" rid="pcbi.1006650.ref040">40</xref>]</td>
</tr>
<tr>
<td align="center">SNAPP</td>
<td align="center">multispecies coalescent</td>
<td align="center">from independent biallelic markers</td>
<td align="center">[<xref ref-type="bibr" rid="pcbi.1006650.ref007">7</xref>]</td>
</tr>
<tr>
<td align="center">STACEY</td>
<td align="center">multispecies coalescent</td>
<td align="center">species delimitation &amp; species tree estimation</td>
<td align="center">[<xref ref-type="bibr" rid="pcbi.1006650.ref041">41</xref>]</td>
</tr>
<tr>
<td align="center">StarBEAST 2</td>
<td align="center">multispecies coalescent</td>
<td align="center">faster, species tree clocks, FBD-MSC, AIM</td>
<td align="center">[<xref ref-type="bibr" rid="pcbi.1006650.ref042">42</xref>–<xref ref-type="bibr" rid="pcbi.1006650.ref045">45</xref>]</td>
</tr>
<tr>
<td align="center"><italic>Model selection</italic>:</td>
<td align="center"/>
<td align="center"/>
<td align="center"/>
</tr>
<tr>
<td align="center">MODEL SELECTION</td>
<td align="center">model selection</td>
<td align="center">path sampling, stepping stone</td>
<td align="center">[<xref ref-type="bibr" rid="pcbi.1006650.ref046">46</xref>]</td>
</tr>
<tr>
<td align="center">NS</td>
<td align="center">model selection</td>
<td align="center">nested sampling</td>
<td align="center">[<xref ref-type="bibr" rid="pcbi.1006650.ref047">47</xref>]</td>
</tr>
<tr>
<td align="center"><italic>Simulation tools</italic>:</td>
<td align="center"/>
<td align="center"/>
<td align="center"/>
</tr>
<tr>
<td align="center">MASTER</td>
<td align="center">simulation</td>
<td align="center">stochastic population dynamics simulation</td>
<td align="center">[<xref ref-type="bibr" rid="pcbi.1006650.ref048">48</xref>]</td>
</tr>
<tr>
<td align="center">TreeModelAdequacy</td>
<td align="center">model adequacy using simulation</td>
<td align="center">phylodynamic model adequacy using phylogenetic tree test statistics</td>
<td align="center">[<xref ref-type="bibr" rid="pcbi.1006650.ref049">49</xref>]</td>
</tr>
</tbody>
</table>
</alternatives>
<table-wrap-foot>
<fn id="t001fn001">
<p>* birth-death skyline handles sampled ancestors.</p>
</fn>
<fn id="t001fn002">
<p><sup>1</sup> subst. for substitution models;</p>
</fn>
<fn id="t001fn003">
<p><sup>2</sup> par. for parametric and non-par. for nonparametric models;</p>
</fn>
<fn id="t001fn004">
<p><sup>3</sup> BD for birth-death;</p>
</fn>
<fn id="t001fn005">
<p><sup>4</sup> ODEs for ordinary differential equations;</p>
</fn>
<fn id="t001fn006">
<p><sup>5</sup> analy. integ. of pop. for analytical integration of population.</p>
</fn>
</table-wrap-foot>
</table-wrap>
<p>Below, we highlight some of the key new models in BEAST 2.5, that have been developed since our first description of the BEAST 2 software platform.</p>
<sec id="sec006">
<title>Site models</title>
<p>The site model (encompassing the substitution model and the model of rate heterogeneity across sites), together with the clock model, determines the probability <italic>P</italic>(<italic>D</italic>|<italic>T</italic>, <italic>θ</italic>) (the phylogenetic likelihood). Model averaging and model comparison of site models are both provided by the new <monospace>bModelTest</monospace> package [<xref ref-type="bibr" rid="pcbi.1006650.ref016">16</xref>]. This package implements reversible-jump MCMC between time-reversible site models for nucleotides, as well as the estimation of the relative support for (i) equal or unequal base frequencies, (ii) uniform or gamma rate heterogeneity across sites, and (iii) zero or non-zero proportion of invariable sites. By providing model averaging of site models within a single MCMC analysis the uncertainty of the site model is integrated out, so that the phylogenetic analysis does not depend on committing to a specific site model. If the site model is not of direct interest, then the posterior distribution on site models can be ignored (knowing it has been model-averaged); otherwise, if the site model is of interest, then bModelTest provides a posterior distribution over site models, so that a credible set of site models can be constructed, and all pairs of site models can be compared for relative support <italic>a posteriori</italic>.</p>
<p>
<xref ref-type="fig" rid="pcbi.1006650.g002">Fig 2</xref> shows the posterior distribution resulting from a bModelTest analysis of substitution models for 906 nucleotides of cytochrome oxidase II and cytochrome b of 36 mammalian species [<xref ref-type="bibr" rid="pcbi.1006650.ref050">50</xref>] (for details see <ext-link ext-link-type="uri" xlink:href="http://www.doi.org/10.5281/zenodo.1475369" xlink:type="simple">http://www.doi.org/10.5281/zenodo.1475369</ext-link>). Each circle represents a substitution model indicated by a six digit number corresponding to the six rates of reversible substitution models (see <xref ref-type="fig" rid="pcbi.1006650.g002">Fig 2</xref> caption for more details).</p>
<fig id="pcbi.1006650.g002" position="float">
<object-id pub-id-type="doi">10.1371/journal.pcbi.1006650.g002</object-id>
<label>Fig 2</label>
<caption>
<title>bModelTest analysis for 36 mammalian species [<xref ref-type="bibr" rid="pcbi.1006650.ref050">50</xref>].</title>
<p>a) Posterior distribution of substitution models. Each circle represents a substitution model indicated by a six digit number corresponding to the six rates of reversible substitution models. In alphabetical order, these are A→C, A→G, A→T, C→G, C→T, and G→T, which can be shared in groups. The six digit numbers indicate these groupings, for example 121121 indicates the HKY model, which has shared rates for transitions and shared rates for transversions. Here, only models are considered that are reversible and do not share transition and transversion rates (with the exception of the JC69 and F81 models). Other substitution model sets are available. Links between substitution models indicate possible jumps during the MCMC chain from simpler (tail of arrow) to more complex (head of arrow) models and back. There is no single preferred substitution model for this data, as the posterior probability is spread over a number of alternative substitution models. Blue circles indicate the eight models contained in the 95% credible set, models with red circles are outside of this set, and models without circles have negligible support. b) Posterior tree distribution resulting from the bModelTest analysis.</p>
</caption>
<graphic mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pcbi.1006650.g002" xlink:type="simple"/>
</fig>
<p>Other substitution and site models added are the polymorphism-aware model (PoMo) [<xref ref-type="bibr" rid="pcbi.1006650.ref011">11</xref>, <xref ref-type="bibr" rid="pcbi.1006650.ref022">22</xref>] (which can account for within-species variation and GC-biased gene conversion), pseudo Dollo [<xref ref-type="bibr" rid="pcbi.1006650.ref051">51</xref>], codon models [<xref ref-type="bibr" rid="pcbi.1006650.ref017">17</xref>, <xref ref-type="bibr" rid="pcbi.1006650.ref052">52</xref>], standard named nucleotide models (<monospace>SSM</monospace> package), standard empirical amino acid models (<monospace>OBAMA</monospace> package), morphological models (<monospace>MM</monospace> package) [<xref ref-type="bibr" rid="pcbi.1006650.ref019">19</xref>] and microsatellite models (<monospace>BEASTvntr</monospace> package) [<xref ref-type="bibr" rid="pcbi.1006650.ref021">21</xref>].</p>
</sec>
<sec id="sec007">
<title>Molecular clock models</title>
<p>The core BEAST 2 package already provides the relaxed [<xref ref-type="bibr" rid="pcbi.1006650.ref053">53</xref>] and random local [<xref ref-type="bibr" rid="pcbi.1006650.ref054">54</xref>] clock models to model substitution rate heterogeneity along a phylogeny. The <monospace>FLC</monospace> [<xref ref-type="bibr" rid="pcbi.1006650.ref024">24</xref>] package provides a framework that integrates the flexibility of the relaxed clock model into the local clock model. Specifically, the FLC model allows a local clock to be either strict (i.e. as in the original local clock model definition) or relaxed. In practice, this means closely related lineages can be modelled with a single constant rate substitution model (i.e. strict clock model) while other lineages with significant rate variation can be described more accurately with a relaxed clock model. As in the original formulation of the local clock model, the user needs to define the location of the local clock <italic>a priori</italic>.</p>
</sec>
<sec id="sec008">
<title>Population dynamic models for trees</title>
<p>Population dynamic models provide the probability density of the phylogeny given the parameters, <italic>P</italic>(<italic>T</italic>|<italic>θ</italic>). Population dynamic models giving rise to phylogenies are also called phylodynamic models.</p>
<sec id="sec009">
<title>Tree models for unstructured populations</title>
<p>There are two common approaches for modelling the phylogenetic tree, or the genealogy, in phylogenetic inference. The first assumes a classic population dynamic model, namely the birth-death model [<xref ref-type="bibr" rid="pcbi.1006650.ref055">55</xref>, <xref ref-type="bibr" rid="pcbi.1006650.ref056">56</xref>], to model the growth of a tree. In a population dynamic birth-death model, through time, each individual gives rise to one additional offspring with rate λ and dies with rate <italic>μ</italic>. As we only analyse a fraction of individuals arising in this process, it is necessary to model the sampling process for tips of a birth-death tree. For a variety of simple partially-sampled birth-death trees, the distribution of branch lengths has been derived exactly [<xref ref-type="bibr" rid="pcbi.1006650.ref057">57</xref>].</p>
<p>Alternatively, a mathematical model for trees known as the coalescent [<xref ref-type="bibr" rid="pcbi.1006650.ref058">58</xref>, <xref ref-type="bibr" rid="pcbi.1006650.ref059">59</xref>] can be used to parameterize the tree in terms of the effective size of the background population, and changes in this effective population size through time. One can interpret the effective population size and its changes as birth-death parameters when making some coalescent approximations [<xref ref-type="bibr" rid="pcbi.1006650.ref030">30</xref>]. Partially-sampled birth-death models do not make the approximations that coalescent models do, but they depend on a model of the sampling process, and simple sampling models may not always be an adequate description of real data sets. It is an ongoing debate and topic of research to investigate the consequences of coalescent approximations and sampling model assumptions.</p>
<p>Coalescent approaches have been embedded within BEAST since its genesis [<xref ref-type="bibr" rid="pcbi.1006650.ref060">60</xref>, <xref ref-type="bibr" rid="pcbi.1006650.ref061">61</xref>]. Thus, we will not further discuss the basic coalescent approach here. In what follows, we will introduce the basic birth-death models which underwent major development in recent years. Then, we discuss the more sophisticated birth-death and coalescent approaches side by side.</p>
<p>In birth-death models, it is assumed that the first individual appears at some time <italic>t</italic><sub>0</sub> before the present. Through time, each individual gives rise to one additional offspring with rate λ and dies with rate <italic>μ</italic>. An individual is sampled (e.g. the pathogen of an infected individual is sequenced, or ancient DNA for an individual is sequenced; or a fossil is observed) with rate <italic>ψ</italic>. Upon sampling, we assume that the individual representing the sample is removed from the population with probability <italic>r</italic>. In the case of infectious diseases, <italic>r</italic> is the probability of being cured or treated, such that the individual is not infectious any more upon sampling. In the case of species, we typically assume <italic>r</italic> = 0 as the species continues to exist upon sampling of a fossil. At the end of the process, each extant individual is sampled with probability <italic>ρ</italic>. The probability of a tree (<xref ref-type="fig" rid="pcbi.1006650.g001">Fig 1d</xref>), given parameters <italic>t</italic><sub>0</sub>, λ, <italic>μ</italic>, <italic>ψ</italic>, <italic>r</italic>, <italic>ρ</italic> has been derived in [<xref ref-type="bibr" rid="pcbi.1006650.ref057">57</xref>] for <italic>r</italic> = 0, and generalized for <italic>r</italic> ∈ [0, 1] in [<xref ref-type="bibr" rid="pcbi.1006650.ref062">62</xref>]. A value <italic>r</italic> &lt; 1 necessitates using an MCMC algorithm capable of producing trees with sampled ancestors. Such an algorithm is provided in BEAST 2 via the <monospace>SA</monospace> (sampled ancestor) package [<xref ref-type="bibr" rid="pcbi.1006650.ref013">13</xref>].</p>
<p>This basic model has been extended to account for changes of parameters through time within the <monospace>bdsky</monospace> package [<xref ref-type="bibr" rid="pcbi.1006650.ref009">9</xref>]. In <monospace>bdsky</monospace>, time is divided up into one or more intervals, inside of which parameters are held constant but between which parameters may be completely different (i.e. the change of parameters occurs in a non-parametric way).</p>
<p>In epidemiological investigations the birth-death model can be reparameterised by setting the rate of becoming noninfectious, <italic>δ</italic> = <italic>μ</italic> + <italic>ψr</italic> (the total rate at which lineages are removed), the effective reproductive number, <italic>R</italic><sub><italic>e</italic></sub> = λ/<italic>δ</italic>, and the sampling proportion <italic>p</italic> = <italic>ψ</italic>/<italic>δ</italic> (the proportion of removed lineages that are sampled). <xref ref-type="fig" rid="pcbi.1006650.g003">Fig 3</xref> shows the posterior estimates from a bdsky analysis of the 2013–2016 West African Ebola epidemic. Estimates are based on the coding regions of 811 sequences sampled through October 24, 2015, representing more than 2.5% of known cases. There is evidence that hospital-based transmission and unsafe burials contributed infections to the epidemic [<xref ref-type="bibr" rid="pcbi.1006650.ref063">63</xref>], thus the <monospace>SA</monospace> (sampled ancestor) package was used to account for some percentage of patients continuing to transmit the virus after being sampled (by allowing <italic>r</italic> to be less than 1). <italic>R</italic><sub><italic>e</italic></sub> was allowed to change over 20 time intervals, equally-spaced between the origin of the epidemic (<italic>t</italic><sub>0</sub>) and the time of the most recent sample, while the sampling proportion was estimated for every month from March 2014 onwards (when an Ebola virus disease outbreak was declared and the first samples collected). The estimated origin time of the epidemic coincides with the onset of symptoms in the suspected index case on December 26, 2013 [<xref ref-type="bibr" rid="pcbi.1006650.ref064">64</xref>]. Estimates of <italic>R</italic><sub><italic>e</italic></sub> are consistent with WHO estimates [<xref ref-type="bibr" rid="pcbi.1006650.ref065">65</xref>], based on surveillance data alone, but with greater uncertainty. 
For the majority of the period between mid-May and October 2014 <italic>R</italic><sub><italic>e</italic></sub> is estimated to be above 1, consistent with the observation that September 2014 was the turning point of the epidemic and that case incidence stopped growing in October [<xref ref-type="bibr" rid="pcbi.1006650.ref065">65</xref>]. After peak incidence was reached during the last week of September 2014, <italic>R</italic><sub><italic>e</italic></sub> estimates drop below 1 during October and November 2014 and then fluctuate around 1 during 2015 as transmissions persisted in some areas, due to a combination of unwillingness to seek medical care, unsafe burials and imperfect quarantine measures [<xref ref-type="bibr" rid="pcbi.1006650.ref064">64</xref>]. <italic>R</italic><sub><italic>e</italic></sub> estimates before May 2014 and after August 2015 have a large amount of uncertainty attached to them, due to the small number of sequences sampled during these time periods. Trends in sampling proportion estimates follow empirical estimates based on the number of confirmed cases; however, the sampling proportion is overestimated during the period of intense transmission, which suggests the existence of transmission chains not represented in the sequence dataset. In the final two months of the study period the sampling proportion is underestimated, which may indicate ongoing cryptic transmission during this period, but may also be indicative of a model bias resulting from the remaining transmission chains at this time being highly isolated from each other, which is not taken into account by the model.</p>
<fig id="pcbi.1006650.g003" position="float">
<object-id pub-id-type="doi">10.1371/journal.pcbi.1006650.g003</object-id>
<label>Fig 3</label>
<caption>
<title>Birth-death skyline (bdsky) analysis of the 2013–2016 West African Ebola virus disease epidemic.</title>
<p>(a) The maximum clade credibility tree of the 811 sequences used in the analysis. (b) The median posterior estimate of the effective reproductive number (<italic>R</italic><sub><italic>e</italic></sub>) over time is shown in orange, with the 95% highest posterior density (HPD) interval in orange shading. The red dotted line indicates the epidemic threshold (<italic>R</italic><sub><italic>e</italic></sub> = 1). If <italic>R</italic><sub><italic>e</italic></sub> is below this threshold the epidemic has reached a turning point and is no longer spreading. The posterior distribution of the origin time of the epidemic (<italic>t</italic><sub>0</sub>) is shown in green. The number of laboratory-confirmed cases per week is shown in blue. Red arrows indicate weeks with fewer than 10 confirmed cases. The dotted line at A indicates the onset of symptoms in the suspected index case (see text for details). The dotted lines at B and C indicate the dates at which the WHO declared an Ebola virus disease outbreak in Guinea and a Public Health Emergency of International Concern (PHEIC), respectively. The dotted line at D indicates the first time any of the three countries with intense transmission (Liberia) was declared Ebola free following 42 days without any new infections being reported (new cases were subsequently detected in Liberia in June 2015). (c) The median posterior estimate of the monthly sampling proportion is shown in purple, with the 95% HPD interval in purple shading. The red dashed line indicates the number of sampled sequences in the dataset, divided by the number of laboratory-confirmed cases, for each month in the analysis. This serves as an empirical estimate of the true sampling proportion. The posterior distributions and medians (dashed lines) of the infected period and the mean clock rate (truncated at the 95% HPD limits) are shown in panels (d) and (e).</p>
</caption>
<graphic mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pcbi.1006650.g003" xlink:type="simple"/>
</fig>
<p>Popular models in epidemiology, such as the SIR model [<xref ref-type="bibr" rid="pcbi.1006650.ref066">66</xref>], or in macroevolution, such as the diversity-dependent model [<xref ref-type="bibr" rid="pcbi.1006650.ref067">67</xref>], assume that parameters change as a function of the number of susceptible individuals or non-occupied niches, for example. Thus, they are called parametric birth-death models. Such parametric rate changes can be assumed when using the <monospace>EpiInf</monospace> package [<xref ref-type="bibr" rid="pcbi.1006650.ref029">29</xref>]. This latter package additionally samples the trajectory of infectious and susceptible individuals through time and allows for the inclusion of case count data in addition to sequences. In a faster, but approximate way, the <monospace>phylodynamics</monospace> package [<xref ref-type="bibr" rid="pcbi.1006650.ref028">28</xref>] performs inference under the SIR model using genetic sequences.</p>
<p>Parametric birth-death-based population dynamic models are computationally expensive because parameters are a function of the number of co-occurring individuals: typically we do not know this number and thus have to sample it via MCMC. An alternative is to approximate the population dynamics using the coalescent, which essentially means that we assume that our sample is small within a large population, and that we condition on the sampling times instead of them being part of the data, as in the birth-death model. The <monospace>phylodynamics</monospace> package provides an approach to estimate the trees and parameters assuming either a deterministically or a stochastically changing population size under an SIR-type coalescent framework [<xref ref-type="bibr" rid="pcbi.1006650.ref027">27</xref>].</p>
<p>The analysis of genetic data and fossils for reconstructing a species phylogeny can be achieved using the birth-death model when setting <italic>r</italic> = 0. This setting is also referred to as the fossilized birth-death (FBD) process [<xref ref-type="bibr" rid="pcbi.1006650.ref068">68</xref>–<xref ref-type="bibr" rid="pcbi.1006650.ref070">70</xref>]. These approaches generalize the total-evidence dating method [<xref ref-type="bibr" rid="pcbi.1006650.ref071">71</xref>, <xref ref-type="bibr" rid="pcbi.1006650.ref072">72</xref>] by allowing for sampled ancestor fossils (instead of assuming all fossils are tips in the tree) and modelling of the fossil sampling process. These FBD approaches are an alternative to dating phylogenies by node-calibration approaches. Some constructions of the latter result in complex marginal priors for calibrated nodes [<xref ref-type="bibr" rid="pcbi.1006650.ref073">73</xref>], and it is not straightforward to specify a prior distribution for each calibration node. Furthermore, node-calibration approaches do not coherently use all comparative data within a joint inference framework, since the decision of which node to calibrate with which fossil is made before phylogenetic inference. This incoherency is overcome by total-evidence approaches where all data is analyzed together and node ages and tree topology are estimated jointly. On the other hand, the FBD models use each fossil age as an observation, and can be very sensitive to a biased fossil or extant species sampling [<xref ref-type="bibr" rid="pcbi.1006650.ref069">69</xref>, <xref ref-type="bibr" rid="pcbi.1006650.ref074">74</xref>]. This is particularly problematic when only the oldest fossils of clades are included in the analysis, as is commonly done in node dating approaches. 
In such cases, the <monospace>CA</monospace> (CladeAge) [<xref ref-type="bibr" rid="pcbi.1006650.ref025">25</xref>] package allows unbiased age estimation; however, it requires that sampling parameters are known <italic>a priori</italic>, while the FBD approach estimates these parameters alongside the tree. On the other hand, this requirement of the CladeAge approach means that different sampling parameters can be specified for different clades, whereas all (coexisting) species are assumed to share the same sampling parameters in the FBD model.</p>
</sec>
<sec id="sec010">
<title>Tree models for structured populations</title>
<p>Methods for studying population structure and reconstructing migration history have seen considerable progress in recent years, and have been particularly bolstered by the modularity and extensibility of BEAST 2. These features represent a remarkable opportunity for end users, who can now use, test and compare different models and approaches without the need to switch platforms and formats. It also encourages method development, as the availability of packages in a single, modular platform aids future development through easy integration of ideas and code.</p>
<p>In analogy with the situation for unstructured populations, the two approaches for structured populations are (i) multi-state birth-death models [<xref ref-type="bibr" rid="pcbi.1006650.ref009">9</xref>], implemented in the bdmm [<xref ref-type="bibr" rid="pcbi.1006650.ref031">31</xref>] package, and (ii) structured coalescent approaches, with an exact implementation available within MultiTypeTree [<xref ref-type="bibr" rid="pcbi.1006650.ref005">5</xref>]. The birth-death and coalescent approaches from above are essentially generalized to allow for more than one population by assuming migration rates between, and variable birth rates across, populations.</p>
<p>The bdmm package allows for changes in dynamics through time by using a skyline, analogous to the unstructured birth-death models. Furthermore, it can quantify its parameters, such as migration rates, without MCMC sampling of the states in ancestral lineages. In other words, for <italic>T</italic> being a phylogenetic tree with its tips being assigned states, bdmm uses equations for <italic>P</italic>(<italic>T</italic>|<italic>θ</italic>) under the multi-state birth-death model. The bdmm functionality was recently extended for macroevolutionary trees through the SSE package [<xref ref-type="bibr" rid="pcbi.1006650.ref038">38</xref>]. This package implements a family of (birth-death) models of state-dependent speciation and extinction ranging back to the original BiSSE model [<xref ref-type="bibr" rid="pcbi.1006650.ref075">75</xref>] where all tips are sampled at one point in time. The “state” a species or population is in can represent the state of one of its traits, but it can also be seen as its geographical distribution. When inputs are geographical ranges, state transition parameters can be interpreted as migration rates.</p>
<p>For the structured coalescent, the MultiTypeTree package samples the ancestral states of all lineages (<xref ref-type="fig" rid="pcbi.1006650.g001">Fig 1c</xref>), using MCMC, which can become very slow (i.e. MultiTypeTree considers <italic>P</italic>(<italic>T</italic>|<italic>θ</italic>) with <italic>T</italic> being a phylogeny where all lineages at all times have states assigned). Furthermore, the package needs to assume constant population sizes through time for the different demes. These limitations have been overcome by tracking ancestral states probabilistically using different approximations [<xref ref-type="bibr" rid="pcbi.1006650.ref030">30</xref>, <xref ref-type="bibr" rid="pcbi.1006650.ref076">76</xref>], avoiding the need to sample ancestral states using MCMC. The approximation originally proposed by [<xref ref-type="bibr" rid="pcbi.1006650.ref030">30</xref>] tracks state probabilities assuming that the state of each lineage evolves completely independently of other lineages in the phylogeny. Thus, an approximate equation for <italic>P</italic>(<italic>T</italic>|<italic>θ</italic>) under the structured coalescent is employed, where <italic>T</italic> is a phylogenetic tree, with its tips being assigned states. BASTA [<xref ref-type="bibr" rid="pcbi.1006650.ref032">32</xref>] implements a highly optimized version of the approach of [<xref ref-type="bibr" rid="pcbi.1006650.ref030">30</xref>] in BEAST 2.5, allowing one to rapidly analyse scenarios with many different sub-populations.</p>
<p>MASCOT [<xref ref-type="bibr" rid="pcbi.1006650.ref033">33</xref>] implements an improved approximation, derived in [<xref ref-type="bibr" rid="pcbi.1006650.ref076">76</xref>], that is more closely related to the exact structured coalescent, in that lineage state probabilities reflect the likelihood of each lineage coalescing with other lineages based on their probable location. Simulations using MASCOT revealed no biases in the estimates of parameters and node locations [<xref ref-type="bibr" rid="pcbi.1006650.ref076">76</xref>]. MASCOT additionally allows estimates of migration rates and effective population sizes across different sub-populations and time to be informed from predictor data (such as clinical, demographic, or behavioural variables) using a generalized linear model (GLM) approach [<xref ref-type="bibr" rid="pcbi.1006650.ref034">34</xref>].</p>
<p>The PhyDyn package [<xref ref-type="bibr" rid="pcbi.1006650.ref077">77</xref>] supports a highly flexible mark-up language for defining demographic or epidemiological processes as a system of ordinary differential equations. PhyDyn implements three approximations of the structured coalescent and extends previous work [<xref ref-type="bibr" rid="pcbi.1006650.ref030">30</xref>] to improve accuracy and reduce computational cost. The package calculates migration and coalescent rates from population trajectories and uses the structured coalescent approximations to calculate the states of lineages through time. A suitable application for this approach is the estimation of parameters from complex infectious disease models with multiple compartments, and it provides a means of taking advantage of categorical metadata which is not related to geography, such as clinical, demographic, or behavioural variables in phylodynamic studies of infectious disease dynamics.</p>
<p>These coalescent frameworks in BEAST 2.5 extend earlier developments on the coalescent. Among the most popular earlier models of this class for studying migration, spread and structure were the structured coalescent-based methods of Migrate-n [<xref ref-type="bibr" rid="pcbi.1006650.ref078">78</xref>]. Migrate-n targets the same structured coalescent distribution as MultiTypeTree, but differs with respect to the exact implementation. In particular, since it is not embedded within BEAST, it cannot be coupled with e.g. relaxed clock models.</p>
<p>The very popular discrete trait model and continuous phylogeographic methods from Lemey and colleagues [<xref ref-type="bibr" rid="pcbi.1006650.ref079">79</xref>, <xref ref-type="bibr" rid="pcbi.1006650.ref080">80</xref>] assume that the whole tree was generated under an unstructured model, and that the trait evolved—just like a nucleotide—on that tree. This approach is extremely computationally efficient and allows the study of a large number of samples with many distinct trait values. However, these models make strong assumptions about the distribution of sampled trait values which can bias inference results [<xref ref-type="bibr" rid="pcbi.1006650.ref032">32</xref>]. This issue can be overcome by the newer but computationally more demanding methods above. The Lemey et al. models are available in BEAST 2 through the <monospace>beast-classic</monospace> package (except for the generalized linear model feature introduced in [<xref ref-type="bibr" rid="pcbi.1006650.ref081">81</xref>]).</p>
<p>Another class of models of population structure deals with the fact that each host in an outbreak contains a separate within-host pathogen population during colonisation. In this context, transmission between hosts is a migration event into a new deme that is consequently colonised. The common aim of such models is to reconstruct the series of transmission events between hosts that led to the establishment of the considered outbreak. BEAST 2.5 offers two different models of such dynamics; SCOTTI [<xref ref-type="bibr" rid="pcbi.1006650.ref035">35</xref>] models transmission in a structured coalescent setting, and assumes that there is no recombination, that transmission inocula are small, and that each sample consists of an individual haplotype (however, multiple samples from the same host are allowed). BadTrIP [<xref ref-type="bibr" rid="pcbi.1006650.ref012">12</xref>] instead models transmission with a multispecies coalescent (MSC) paradigm, allowing recombination, large transmission inocula, and within-sample pathogen genetic diversity information from read-based allele counts, while accounting for sequencing error. BadTrIP can efficiently utilize information from genetic variation within samples to reconstruct more detailed transmission histories than SCOTTI, but it is also more computationally demanding [<xref ref-type="bibr" rid="pcbi.1006650.ref012">12</xref>].</p>
</sec>
<sec id="sec011">
<title>Multispecies coalescent models</title>
<p>The multispecies coalescent (MSC) model describes the evolution of genes within species [<xref ref-type="bibr" rid="pcbi.1006650.ref082">82</xref>]. Broadly, it assumes that the sampled alleles for a given gene have evolved according to a common coalescent process within each species, typically thought of as occurring backwards in time. For each branch in the species tree, this process begins at the tipward end of the branch, and apart from the root is truncated by the speciation event at the rootward end. Thus the MSC models trees within trees, and the probability density <italic>P</italic>(<italic>T</italic>|<italic>θ</italic>) becomes more complex, as described below.</p>
<p>An emergent property of the MSC known as incomplete lineage sorting (ILS) occurs when two or more lineages do not coalesce in their immediate ancestral population (<xref ref-type="fig" rid="pcbi.1006650.g004">Fig 4</xref>), which can lead to gene trees with discordant topologies among themselves and with the species tree. The probability of ILS increases as branch lengths are shortened in time, and/or when the effective population size <italic>N</italic><sub><italic>e</italic></sub> is increased. Species trees with four or more ingroup species can have a region of their parameter space (the “anomaly zone” [<xref ref-type="bibr" rid="pcbi.1006650.ref083">83</xref>]) where most gene trees have a topology different to the one of the species tree.</p>
<fig id="pcbi.1006650.g004" position="float">
<object-id pub-id-type="doi">10.1371/journal.pcbi.1006650.g004</object-id>
<label>Fig 4</label>
<caption>
<title>The multispecies coalescent (MSC) model with three species and a single gene tree.</title>
<p>A separate coalescent process applies to each of the five branches in the tree; the branches for the extant species A (red), B (green) and C (blue), the ancestral branch of A and B (yellow), and the root branch (grey). Several individuals have been sampled per species. In this example the ancestral lineage of individual <italic>b</italic><sub>4</sub> does not coalesce in species B or ancestral species 4. In ancestral species 5, it coalesces with the ancestral lineage of species C. This leads to incomplete lineage sorting and enables gene tree discordance—in this example <italic>b</italic><sub>4</sub> is a sister taxon to individuals from species C, rather than to individuals from its own species, or sister species A. If <italic>b</italic><sub>4</sub> was the representative individual for its species, then this gene would exhibit gene tree discordance. Other individuals which show concordance at this locus are expected to show discordance at other unlinked loci when populations are large or speciation times are recent.</p>
</caption>
<graphic mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pcbi.1006650.g004" xlink:type="simple"/>
</fig>
<p>Discordance between gene trees and species tree in their topologies and times can lead to incorrect species tree estimates from concatenated gene sequences—this has been shown to occur with both maximum likelihood and Bayesian methods like those implemented in BEAST. More specifically, in the anomaly zone, gene tree topological discordance can result in incorrect estimates of the species tree topology [<xref ref-type="bibr" rid="pcbi.1006650.ref084">84</xref>, <xref ref-type="bibr" rid="pcbi.1006650.ref085">85</xref>], and systematic bias in branch length estimates [<xref ref-type="bibr" rid="pcbi.1006650.ref086">86</xref>]. Even in the case of just two species where gene tree discordance is impossible, speciation times estimated using concatenation will be wrong because the expected time to coalescence is 2<italic>N</italic><sub><italic>e</italic></sub> generations older than the speciation time [<xref ref-type="bibr" rid="pcbi.1006650.ref087">87</xref>]. The concatenation estimates of speciation times are therefore expected to be 2<italic>N</italic><sub><italic>e</italic></sub> generations older than the truth.</p>
<p>Unlike concatenation, multilocus MSC methods can accurately and jointly estimate the topology and times of the species tree and gene trees directly from multiple sequence alignments (MSAs). The first BEAST multilocus MSC implementation was *BEAST, which was introduced in BEAST 1.5.1 [<xref ref-type="bibr" rid="pcbi.1006650.ref088">88</xref>]. Let <italic>P</italic>(<italic>T</italic>, <italic>G</italic>, <italic>θ</italic>|<italic>D</italic>) be the joint posterior probability density for a species tree (<italic>T</italic>), a set of gene trees (<italic>G</italic> = {<italic>g</italic><sub>1</sub>, <italic>g</italic><sub>2</sub>, …, <italic>g</italic><sub><italic>L</italic></sub>}) and additional evolutionary parameters (<italic>θ</italic>), given a corresponding set of multiple sequence alignments <italic>D</italic> = {<italic>D</italic><sub>1</sub>, <italic>D</italic><sub>2</sub>, …, <italic>D</italic><sub><italic>L</italic></sub>}. Thus, we now enrich our posterior probability from above, <italic>P</italic>(<italic>T</italic>, <italic>θ</italic>|<italic>D</italic>), by additionally sampling gene trees <italic>G</italic>, using <italic>P</italic>(<italic>T</italic>, <italic>G</italic>, <italic>θ</italic>|<italic>D</italic>). In the MCMC, we calculate the product of phylogenetic likelihoods <italic>P</italic>(<italic>D</italic><sub><italic>i</italic></sub>|<italic>g</italic><sub><italic>i</italic></sub>, <italic>θ</italic>), the coalescent probability density <italic>P</italic>(<italic>g</italic><sub><italic>i</italic></sub>|<italic>T</italic>, <italic>θ</italic>) for each gene tree <italic>g</italic><sub><italic>i</italic></sub>, and the prior probability of the species tree given macroevolutionary parameters <italic>P</italic>(<italic>T</italic>|<italic>θ</italic>):
<disp-formula id="pcbi.1006650.e002"><alternatives><graphic id="pcbi.1006650.e002g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pcbi.1006650.e002" xlink:type="simple"/><mml:math display="block" id="M2"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="right"><mml:mrow><mml:mi>P</mml:mi> <mml:mrow><mml:mo>(</mml:mo> <mml:mi>T</mml:mi> <mml:mo>,</mml:mo> <mml:mi>G</mml:mi> <mml:mo>,</mml:mo> <mml:mi>θ</mml:mi> <mml:mo>|</mml:mo> <mml:mi>D</mml:mi> <mml:mo>)</mml:mo></mml:mrow> <mml:mo>∝</mml:mo> <mml:mo>(</mml:mo> <mml:munder><mml:mo>∏</mml:mo> <mml:mi>i</mml:mi></mml:munder> <mml:mrow><mml:mi>P</mml:mi> <mml:mrow><mml:mo>(</mml:mo> <mml:msub><mml:mi>D</mml:mi> <mml:mi>i</mml:mi></mml:msub> <mml:mo>|</mml:mo> <mml:msub><mml:mi>g</mml:mi> <mml:mi>i</mml:mi></mml:msub> <mml:mo>,</mml:mo> <mml:mi>θ</mml:mi> <mml:mo>)</mml:mo></mml:mrow> <mml:mi>P</mml:mi> <mml:mrow><mml:mo>(</mml:mo> <mml:msub><mml:mi>g</mml:mi> <mml:mi>i</mml:mi></mml:msub> <mml:mo>|</mml:mo> <mml:mi>T</mml:mi> <mml:mo>,</mml:mo> <mml:mi>θ</mml:mi> <mml:mo>)</mml:mo></mml:mrow></mml:mrow> <mml:mo>)</mml:mo> <mml:mi>P</mml:mi> <mml:mrow><mml:mo>(</mml:mo> <mml:mi>T</mml:mi> <mml:mo>|</mml:mo> <mml:mi>θ</mml:mi> <mml:mo>)</mml:mo></mml:mrow> <mml:mi>P</mml:mi> <mml:mrow><mml:mo>(</mml:mo> <mml:mi>θ</mml:mi> <mml:mo>)</mml:mo></mml:mrow> <mml:mo>.</mml:mo></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives> <label>(1)</label></disp-formula></p>
<p>StarBEAST 2 [<xref ref-type="bibr" rid="pcbi.1006650.ref043">43</xref>], built on *BEAST [<xref ref-type="bibr" rid="pcbi.1006650.ref088">88</xref>], introduced species tree relaxed molecular clocks, where a separate substitution rate is estimated for each branch of the species tree. The substitution rates across each gene tree, used to calculate gene tree likelihoods, are then derived from the per-species rates and the per-gene rates [<xref ref-type="bibr" rid="pcbi.1006650.ref043">43</xref>]. This clock model enables accurate inference of substitution rate variation across the species tree from multiple loci.</p>
<p>Recently, some of us have developed an integrative model of molecular and morphological evolution which combines the FBD and MSC models to infer species trees from neontological and paleontological data, called the FBD-MSC for short. In this model, morphological data evolve along the species tree like the FBD model, but the MSC is used to model molecular evolution. The FBD-MSC was implemented in StarBEAST 2 v14. Using simulation, it was shown that differences in estimated ages between concatenation and the FBD-MSC are likely due to systematic biases introduced by concatenation [<xref ref-type="bibr" rid="pcbi.1006650.ref044">44</xref>].</p>
<p>Although the MSC deals successfully with a ubiquitous source of discordance, it has limitations. It relies on an assumption that there is no recombination within loci and free recombination between loci. The MSC also ignores the possibility of hybridization. Furthermore, in the MSC, speciation is assumed to be immediate, with an instant where (going back in time) coalescence suddenly becomes possible. In practice, speciation is usually expected to be gradual, and sometimes gene exchange occurs between non-sister species. Newly developed approaches relaxing such strict tree constraints are described in the next section on explicit models of reticulate evolution.</p>
<p>Another assumption of the MSC is that individuals can reliably be assigned to species or populations, whereas in practice, this is often not the case, especially with shallow phylogenies. DISSECT [<xref ref-type="bibr" rid="pcbi.1006650.ref089">89</xref>], extending the MSC, was first developed for BEAST 1.8.1, and it makes no assumption about how individuals are grouped into species, by inferring species assignment and delimitation simultaneously with the joint inference of the species and gene trees. It does so through an approximation to the Dirac delta function, where the birth-death prior includes an additional probability ‘spike’ of very short duration, <italic>ϵ</italic>, just before the present. This model is called the birth-death-collapse model. When the most recent common ancestor (MRCA) of multiple individuals is present inside the spike, those individuals are often interpreted as belonging to a single species [<xref ref-type="bibr" rid="pcbi.1006650.ref090">90</xref>, <xref ref-type="bibr" rid="pcbi.1006650.ref091">91</xref>].</p>
<p>Improving the computational performance of MSC methods is an ongoing challenge. Increasing the number of individual specimens in an analysis will degrade computational performance. Most seriously, the relationship between the number of loci used with *BEAST and the time taken to collect enough independent samples from the posterior distribution follows a power law. The result is that whenever the number of loci used in a study is doubled, the time taken to run *BEAST increases seven-fold [<xref ref-type="bibr" rid="pcbi.1006650.ref042">42</xref>].</p>
<p>STACEY (the successor of DISSECT) [<xref ref-type="bibr" rid="pcbi.1006650.ref041">41</xref>] introduced a number of new classes of MCMC operators that simultaneously modify the species and gene trees in a coordinated fashion. Both StarBEAST 2 and STACEY offer improved MCMC mixing over their predecessors. On a data set where *BEAST was not able to converge when used with any more than 50 loci, STACEY was successfully run with 500 loci [<xref ref-type="bibr" rid="pcbi.1006650.ref041">41</xref>].</p>
<p>Likewise StarBEAST 2 has implemented coordinated operators belonging to one of the classes introduced by Jones [<xref ref-type="bibr" rid="pcbi.1006650.ref041">41</xref>]. Both StarBEAST 2 and STACEY also implement analytical integration of population sizes, which reduces the number of parameters which must be estimated using MCMC. The combination of new operators, analytical integration and additional optimizations to data structures enables StarBEAST 2 to be run with double the number of loci in roughly the same time as *BEAST.</p>
<p>Other approaches have addressed the computational burden associated with the MSC by taking a different modeling path. In particular, it is possible to greatly reduce the number of parameters associated with the gene trees in the MSC by integrating over all possible gene trees at each locus and at each MCMC step. This way, the parameter space does not increase as new loci are added to the analysis, and computational demand increases typically only linearly with the number of loci. In order to simplify gene tree integration, these models consider individual sites as loci, treating each SNP, or base, as unlinked from the others. While this modeling assumption can represent a coarse approximation, it has the advantage of allowing recombination within genes, which can otherwise bias gene tree (and therefore species tree) inference.</p>
<p>One of the first gene tree-integrating approaches was SNAPP [<xref ref-type="bibr" rid="pcbi.1006650.ref007">7</xref>], which infers species trees directly from a matrix of biallelic markers (without linkage between markers), and is available as a package for BEAST 2. SNAPP integrates over all possible gene trees for each marker at each MCMC step, enabling much wider data matrices of thousands of markers to be used. The posterior probability density, where <italic>S</italic> denotes the species tree, becomes:
<disp-formula id="pcbi.1006650.e003"><alternatives><graphic id="pcbi.1006650.e003g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pcbi.1006650.e003" xlink:type="simple"/><mml:math display="block" id="M3"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="right"><mml:mrow><mml:mi>P</mml:mi> <mml:mrow><mml:mo>(</mml:mo> <mml:mi>S</mml:mi> <mml:mo>,</mml:mo> <mml:mi>θ</mml:mi> <mml:mo>|</mml:mo> <mml:mi>D</mml:mi> <mml:mo>)</mml:mo></mml:mrow> <mml:mo>∝</mml:mo> <mml:mo>(</mml:mo> <mml:munder><mml:mo>∏</mml:mo> <mml:mi>i</mml:mi></mml:munder> <mml:mrow><mml:mi>P</mml:mi> <mml:mo>(</mml:mo> <mml:msub><mml:mi>D</mml:mi> <mml:mi>i</mml:mi></mml:msub> <mml:mo>|</mml:mo> <mml:mi>S</mml:mi> <mml:mo>,</mml:mo> <mml:mi>θ</mml:mi> <mml:mo>)</mml:mo></mml:mrow> <mml:mo>)</mml:mo> <mml:mi>P</mml:mi> <mml:mrow><mml:mo>(</mml:mo> <mml:mi>S</mml:mi> <mml:mo>|</mml:mo> <mml:mi>θ</mml:mi> <mml:mo>)</mml:mo></mml:mrow> <mml:mi>P</mml:mi> <mml:mrow><mml:mo>(</mml:mo> <mml:mi>θ</mml:mi> <mml:mo>)</mml:mo></mml:mrow> <mml:mo>.</mml:mo></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives> <label>(2)</label></disp-formula></p>
<p>Another similar approach is PoMo [<xref ref-type="bibr" rid="pcbi.1006650.ref011">11</xref>]. PoMo models each species in the species tree as a small population (in particular, a Moran model [<xref ref-type="bibr" rid="pcbi.1006650.ref092">92</xref>]), affected by new mutations (introducing new low-frequency alleles in a population) and genetic drift (changing allele frequencies within populations). Unlike SNAPP, PoMo uses nucleotide data, allowing more than two alleles at each SNP, but still allowing at most 2 alleles at any one time in any species/population. For each species and locus, PoMo reads 4 numbers, corresponding to the allele counts of the 4 nucleotides at the considered species and locus. PoMo is generally faster than SNAPP or MSC methods [<xref ref-type="bibr" rid="pcbi.1006650.ref011">11</xref>], and in its BEAST 2 implementation it can account for sequencing errors, as for allele counts derived from reads mapped to a reference genome.</p>
</sec>
</sec>
<sec id="sec012">
<title>Reticulate evolution</title>
<p>Describing evolutionary history using tree structures is generally a simplification. Genomes are subject to recombination, organisms are subject to horizontal gene transfer and species undergo hybridization followed by introgression. With a small number of exceptions (e.g. [<xref ref-type="bibr" rid="pcbi.1006650.ref093">93</xref>], [<xref ref-type="bibr" rid="pcbi.1006650.ref094">94</xref>]), computational phylogenetics has so far addressed these processes only partially, by restricting gene tree reconstructions to relatively short alignments that are assumed to be free from intra-locus recombination, or by excluding taxa from phylogenetic analyses that were found to be involved in gene flow by other approaches [<xref ref-type="bibr" rid="pcbi.1006650.ref095">95</xref>].</p>
<p>However, while these approaches to some extent avoid bias resulting from recombination, they at the same time ignore it as a potentially very useful source of information that is increasingly provided by whole-genome sequencing. For example, it has been shown that making use of this large-scale genomic structure can lead directly to powerful insights into ancestral population dynamics [<xref ref-type="bibr" rid="pcbi.1006650.ref096">96</xref>, <xref ref-type="bibr" rid="pcbi.1006650.ref097">97</xref>]. Similarly, with the increasing sophistication of species history reconstruction methods brought about through the availability of MSC methods, the omission of important processes such as hybridization and horizontal gene transfer from these models is becoming obvious. In response to this demand, BEAST 2 package authors have contributed and/or implemented a number of algorithms which perform phylogenetic/phylodynamic inference under models which directly account for non-tree-like evolution.</p>
<sec id="sec013">
<title>Gene conversion</title>
<p>The package Bacter [<xref ref-type="bibr" rid="pcbi.1006650.ref014">14</xref>] provides a complete, carefully validated, reimplementation of the ClonalOrigin model [<xref ref-type="bibr" rid="pcbi.1006650.ref039">39</xref>] which approximately describes networks produced by homologous gene conversion in bacteria. This is done by approximating the recombination graph using a tree-based network [<xref ref-type="bibr" rid="pcbi.1006650.ref098">98</xref>], in which the underlying tree is the “clonal frame” produced by the bacterial reproduction process and the additional edges represent homologous gene conversion events. In contrast to the original implementation, Bacter allows for joint estimation of both the clonal frame and the reticulations contributed by conversion events. Additionally, Bacter provides a heuristic algorithm for summarizing the posterior distribution over these trees in a fashion similar to the MCC tree approach used by BEAST for binary trees.</p>
</sec>
<sec id="sec014">
<title>Hybridization and horizontal gene transfer</title>
<p>For multispecies phylogenetic analyses, a model called the Multispecies Network Coalescent (MSNC) has been developed [<xref ref-type="bibr" rid="pcbi.1006650.ref099">99</xref>, <xref ref-type="bibr" rid="pcbi.1006650.ref100">100</xref>]. This model generalizes the MSC by replacing the species tree (which supports only speciation nodes) with a species network (supporting speciation and reticulation nodes). Reticulation nodes and edges in the network can represent multiple biological processes including hybrid species, introgression or secondary contact. Gene trees, embedded within the species network, are still used to model the evolution of individual loci. This means the MSC’s assumption of no intra-locus recombination still applies.</p>
<p>SpeciesNetwork, a fully Bayesian implementation of the MSNC where the species network and gene trees are estimated directly from MSAs, has been developed and is available as a package in BEAST 2.5 [<xref ref-type="bibr" rid="pcbi.1006650.ref015">15</xref>]. Unlike for the MSC, there may be more than one possible embedding of a gene tree of given topology and times within a species network of given topology and times. The probability density of a possible embedding thus depends on the inheritance probability <italic>γ</italic> at each reticulation node.</p>
<p>In SpeciesNetwork, the gene tree embeddings, Ψ, and inheritance probabilities, <italic>γ</italic> ∈ Γ, are jointly estimated alongside the species network, gene trees and other parameters. The posterior probability density for the model is similar to *BEAST and StarBEAST 2, but <italic>T</italic> represents a species network rather than a tree, and the additional jointly estimated parameters are included:
<disp-formula id="pcbi.1006650.e004"><alternatives><graphic id="pcbi.1006650.e004g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pcbi.1006650.e004" xlink:type="simple"/><mml:math display="block" id="M4"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="right"><mml:mrow><mml:mi>P</mml:mi> <mml:mrow><mml:mo>(</mml:mo> <mml:mi>T</mml:mi> <mml:mo>,</mml:mo> <mml:mi>G</mml:mi> <mml:mo>,</mml:mo> <mml:mo>Ψ</mml:mo> <mml:mo>,</mml:mo> <mml:mo>Γ</mml:mo> <mml:mo>,</mml:mo> <mml:mi>θ</mml:mi> <mml:mo>|</mml:mo> <mml:mi>D</mml:mi> <mml:mo>)</mml:mo></mml:mrow> <mml:mo>∝</mml:mo> <mml:mo>(</mml:mo> <mml:munder><mml:mo>∏</mml:mo> <mml:mi>i</mml:mi></mml:munder> <mml:mrow><mml:mi>P</mml:mi> <mml:mrow><mml:mo>(</mml:mo> <mml:msub><mml:mi>D</mml:mi> <mml:mi>i</mml:mi></mml:msub> <mml:mo>|</mml:mo> <mml:msub><mml:mi>g</mml:mi> <mml:mi>i</mml:mi></mml:msub> <mml:mo>,</mml:mo> <mml:mi>θ</mml:mi> <mml:mo>)</mml:mo></mml:mrow> <mml:mi>P</mml:mi> <mml:mrow><mml:mo>(</mml:mo> <mml:msub><mml:mi>g</mml:mi> <mml:mi>i</mml:mi></mml:msub> <mml:mo>|</mml:mo> <mml:msub><mml:mo>Ψ</mml:mo> <mml:mi>i</mml:mi></mml:msub> <mml:mo>,</mml:mo> <mml:mi>T</mml:mi> <mml:mo>,</mml:mo> <mml:mi>θ</mml:mi> <mml:mo>)</mml:mo></mml:mrow> <mml:mi>P</mml:mi> <mml:mrow><mml:mo>(</mml:mo> <mml:msub><mml:mo>Ψ</mml:mo> <mml:mi>i</mml:mi></mml:msub> <mml:mo>|</mml:mo> <mml:mo>Γ</mml:mo> <mml:mo>,</mml:mo> <mml:mi>T</mml:mi> <mml:mo>)</mml:mo></mml:mrow></mml:mrow> <mml:mo>)</mml:mo> <mml:mi>P</mml:mi> <mml:mrow><mml:mo>(</mml:mo> <mml:mi>T</mml:mi> <mml:mo>|</mml:mo> <mml:mi>θ</mml:mi> <mml:mo>)</mml:mo></mml:mrow> <mml:mi>P</mml:mi> <mml:mrow><mml:mo>(</mml:mo> <mml:mo>Γ</mml:mo> <mml:mo>)</mml:mo></mml:mrow> <mml:mi>P</mml:mi> <mml:mrow><mml:mo>(</mml:mo> <mml:mi>θ</mml:mi> <mml:mo>)</mml:mo></mml:mrow> <mml:mo>.</mml:mo></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives> <label>(3)</label></disp-formula></p>
</sec>
<sec id="sec015">
<title>Isolation with migration</title>
<p>Sitting between the MSC and the MSNC are models where there is a species tree (not network) but the exchange of genes is allowed between the branches of the species tree. This exchange of genes is typically termed gene flow. Gene flow may occur between sister species, known as isolation-with-migration (IM) [<xref ref-type="bibr" rid="pcbi.1006650.ref101">101</xref>] and between non-sister species (paraphyly) [<xref ref-type="bibr" rid="pcbi.1006650.ref102">102</xref>]. It has been shown that ignoring gene flow can result in poor estimates of species tree topologies and node times [<xref ref-type="bibr" rid="pcbi.1006650.ref102">102</xref>].</p>
<p>One solution in the BEAST 2 framework is the DENIM package [<xref ref-type="bibr" rid="pcbi.1006650.ref040">40</xref>], which is able to infer species trees more accurately than MSC-based models such as STACEY when a small amount of gene flow is present. It uses an approximation which breaks down if there is too much gene flow. DENIM is also able to identify which loci are subject to gene flow.</p>
<p>Another solution is AIM [<xref ref-type="bibr" rid="pcbi.1006650.ref045">45</xref>], which has been part of StarBEAST 2 since v15. AIM implements an IM model that allows the estimation of species trees, rates of gene flow and effective population sizes from genetic sequence data of independently evolving loci. Inferring the species tree topology alongside the other parameters of interest is possible due to the ability to integrate over migration histories [<xref ref-type="bibr" rid="pcbi.1006650.ref076">76</xref>]. For every set of effective population sizes of extinct and extant species and rates of gene flow between these species, AIM can calculate the probability of a gene tree given a species tree without inferring the migration events. This allows changing the species tree topology and node order while still computing the probability of gene trees under these new settings. MCMC can thus be used to explore the different combinations of species trees, rates of gene flow, effective population sizes and gene trees jointly.</p>
<p>
<xref ref-type="fig" rid="pcbi.1006650.g005">Fig 5</xref> shows the species tree and migration events inferred with AIM from a set of 100 nuclear gene sequence alignments for five species of Princess cichlid fishes (<italic>Neolamprologus savoryi</italic>-complex [<xref ref-type="bibr" rid="pcbi.1006650.ref103">103</xref>]) from the East African Lake Tanganyika and the outgroup species <italic>Metriaclima zebra</italic> from Lake Malawi. Princess cichlids are well known to hybridize in captivity when placed in the same aquarium [<xref ref-type="bibr" rid="pcbi.1006650.ref103">103</xref>], and hybridization in their natural habitat has been supported by observed discordance of mitochondrial and nuclear among-species relationships [<xref ref-type="bibr" rid="pcbi.1006650.ref104">104</xref>]. Whole-genome sequence data for the six species were generated by [<xref ref-type="bibr" rid="pcbi.1006650.ref105">105</xref>] and [<xref ref-type="bibr" rid="pcbi.1006650.ref106">106</xref>] and were previously used [<xref ref-type="bibr" rid="pcbi.1006650.ref106">106</xref>] to generate 426 time-calibrated phylogenies from individual regions of the genomes; a comparison of these phylogenies then supported three past hybridization events in Princess cichlids: between <italic>Neolamprologus brichardi</italic> and <italic>N</italic>. <italic>pulcher</italic>, between <italic>N</italic>. <italic>marunguensis</italic> and the common ancestor of <italic>N</italic>. <italic>pulcher</italic> and <italic>N</italic>. <italic>olivaceous</italic>, and between <italic>N</italic>. <italic>marunguensis</italic> and <italic>N</italic>. <italic>gracilis</italic> [<xref ref-type="bibr" rid="pcbi.1006650.ref106">106</xref>].
For the analysis shown in <xref ref-type="fig" rid="pcbi.1006650.g005">Fig 5</xref>, we reused this genomic data of [<xref ref-type="bibr" rid="pcbi.1006650.ref105">105</xref>] and [<xref ref-type="bibr" rid="pcbi.1006650.ref106">106</xref>] to generate alignments for 100 one-to-one orthologous genes following a previously published protocol [<xref ref-type="bibr" rid="pcbi.1006650.ref107">107</xref>], and estimated the species tree jointly with the support for gene flow under the AIM model. We fixed the height of the species tree to be 9.2 Mya [<xref ref-type="bibr" rid="pcbi.1006650.ref095">95</xref>] and inferred the clock rate and transition/transversion ratio for each locus jointly with all other parameters. The backwards-in-time rate of gene flow between any two species (except the outgroup) was assumed to be inversely proportional to the time these two species co-existed. For each possible direction of gene flow, we inferred the support for this rate being non-zero [<xref ref-type="bibr" rid="pcbi.1006650.ref079">79</xref>] and the rate scaler itself. The rate scaler was assumed to be exponentially distributed around 0.05. While not exactly equal, this corresponds in scale to about 5% of lineages having originated from a different species.</p>
<fig id="pcbi.1006650.g005" position="float">
<object-id pub-id-type="doi">10.1371/journal.pcbi.1006650.g005</object-id>
<label>Fig 5</label>
<caption>
<title>AIM analysis of 100 nuclear gene alignments for the five Princess cichlid species.</title>
<p>Species are <italic>Neolamprologus marunguensis</italic>, <italic>N</italic>. <italic>gracilis</italic>, <italic>N</italic>. <italic>brichardi</italic>, <italic>N</italic>. <italic>olivaceous</italic>, <italic>N</italic>. <italic>pulcher</italic>, as well as the outgroup <italic>Metriaclima zebra</italic>. a) to d) show the best-supported tree topologies. Arrows show directions of gene flow that are supported with a Bayes Factor of more than 10. Trees a) and c) only differ in the timing of the speciation events; however, AIM differentiates between differently ranked topologies, since these have to be characterized by using different parameters.</p>
</caption>
<graphic mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pcbi.1006650.g005" xlink:type="simple"/>
</fig>
</sec>
</sec>
</sec>
<sec id="sec016">
<title>Model selection and model adequacy</title>
<p>The model selection package has been extended with a number of existing methods, and now contains path sampling, stepping-stone, Akaike information criterion for MCMC (a.k.a. AICM), conditional predictive ordinates [<xref ref-type="bibr" rid="pcbi.1006650.ref108">108</xref>] and generalized stepping-stone [<xref ref-type="bibr" rid="pcbi.1006650.ref109">109</xref>].</p>
<p>The NS package implements nested sampling [<xref ref-type="bibr" rid="pcbi.1006650.ref047">47</xref>] for phylogenetics, which can also be used for model selection. Nested sampling is a general purpose Bayesian method [<xref ref-type="bibr" rid="pcbi.1006650.ref110">110</xref>] for estimating the marginal likelihood, which conveniently also provides an estimate of the uncertainty of the marginal likelihood estimate. Such uncertainty estimates are not easily available for other methods. Furthermore, nested sampling can be used to provide a posterior sample, and, for some cases where standard MCMC can get stuck in a mode of a multi-modal posterior, nested sampling can produce consistent posterior samples [<xref ref-type="bibr" rid="pcbi.1006650.ref047">47</xref>]. The marginal likelihood estimates produced by nested sampling can be used to compare models, so provide a basis for model selection.</p>
<p>While model selection compares different models, in model adequacy studies, we assess if a model is a good fit by itself. The key idea of model adequacy assessments is to perform direct simulation of data from generative models (i.e. any of the models discussed above). More precisely, simulations are used to assess the absolute model fit in a posterior predictive framework. First, data is simulated using parameter values sampled from the posterior distribution. Such simulations are known as posterior predictive simulations [<xref ref-type="bibr" rid="pcbi.1006650.ref111">111</xref>–<xref ref-type="bibr" rid="pcbi.1006650.ref113">113</xref>]. A test statistic is calculated for the empirical data and for the simulated data. The model is considered to adequately describe the data if the test statistics for the empirical data fall within the range of those from the posterior predictive simulations, for example using a posterior predictive p-value (analogous to the frequentist <italic>p</italic>-value). For example, a phylodynamic model can be used to estimate the reproductive number, the origin of the outbreak, and epidemic trajectories (e.g. [<xref ref-type="bibr" rid="pcbi.1006650.ref027">27</xref>–<xref ref-type="bibr" rid="pcbi.1006650.ref029">29</xref>]). The package TreeModelAdequacy (TMA; [<xref ref-type="bibr" rid="pcbi.1006650.ref049">49</xref>]) can sample the posterior distribution of these parameters to generate trees using MASTER [<xref ref-type="bibr" rid="pcbi.1006650.ref004">4</xref>] and it calculates a number of test statistics. In <xref ref-type="fig" rid="pcbi.1006650.g006">Fig 6</xref> we assess the adequacy of stochastic and deterministic phylodynamic models by comparing the root-height of trees generated using posterior predictive simulations for a data set of the 2009 H1N1 influenza pandemic.</p>
<fig id="pcbi.1006650.g006" position="float">
<object-id pub-id-type="doi">10.1371/journal.pcbi.1006650.g006</object-id>
<label>Fig 6</label>
<caption>
<title>Posterior predictive distributions for two phylodynamic models.</title>
<p>The left column shows the trajectories of the reproductive number over time for a set of 100 publicly available genomes from the 2009 H1N1 influenza pandemic in North America using stochastic (birth-death SIR; [<xref ref-type="bibr" rid="pcbi.1006650.ref028">28</xref>]) and deterministic (deterministic coalescent SIR [<xref ref-type="bibr" rid="pcbi.1006650.ref027">27</xref>]) models. Each blue line is a trajectory sampled from the posterior distribution. The models make different inferences of when the reproductive number falls below 1 (vertical dotted line; the horizontal dashed line is for R = 1), indicating that the pandemic is past its infectious peak. The right column shows the posterior predictive distributions of the root height for both models (grey histograms) and the value for the empirical data (orange vertical lines). Trees simulated from the stochastic model are more consistent with the empirical tree than those from the deterministic model, suggesting that stochasticity may play an important role in the early stages of the pandemic (samples were collected up to June 2009).</p>
</caption>
<graphic mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pcbi.1006650.g006" xlink:type="simple"/>
</fig>
</sec>
<sec id="sec017">
<title>New simulation tools</title>
<p>Many of the models that are implemented in BEAST are generative models that present simplistic, yet mathematically precise, biological hypotheses about the way in which genetic sequences and phylogenetic trees are produced. The focus of BEAST is predominantly learning about biologically meaningful processes via inference of model parameters or model selection. However, models can differ greatly in their assumptions about these processes and the data they generate. Obviously, one must have a clear picture of what generative models imply about data, and if some predicted data features (under a model) are never seen in nature, appropriateness of the model must be questioned. In the previous section, we discussed how to assess model adequacy using simulations.</p>
<p>Furthermore, direct simulation also forms the basis for many inference algorithm validation strategies. Often the best test for correctness of implementation involves judging whether the parameters inferred from data simulated under the model match those used during the simulation. This kind of test can be done qualitatively, or may form the basis for a quantitative validation study by organizing a well-calibrated analysis in which parameters for the data simulation stage are drawn from the same probability distributions used as priors in the inference stage.</p>
<p>BEAST 2.5 provides a number of tools for simulating genetic sequence data and phylogenetic trees. Sequence data simulation is provided as a core feature, and is possible for any of the substitution and clock models supported by BEAST itself or as third-party packages. Phylogenetic tree simulation under specific phylodynamic models (e.g. unstructured/structured coalescent, FBD models, etc.) is provided by the packages that implement those models. General simulation of trees and networks under arbitrary birth-death and coalescent models is provided by MASTER [<xref ref-type="bibr" rid="pcbi.1006650.ref004">4</xref>], which allows models to be specified using a readable chemical reaction notation and for a wide variety of sampling schemes to be simulated.</p>
<p>BEAST methods have been applied extensively in cultural evolution (e.g., [<xref ref-type="bibr" rid="pcbi.1006650.ref036">36</xref>, <xref ref-type="bibr" rid="pcbi.1006650.ref114">114</xref>, <xref ref-type="bibr" rid="pcbi.1006650.ref115">115</xref>]) using the observation that linguistic data can be represented by binary sequence data, and these can be treated similarly to genetic sequence data. The LanguageSequenceGen package [<xref ref-type="bibr" rid="pcbi.1006650.ref048">48</xref>] can be used to simulate language data under common linguistic models of evolution, with language-specific features like borrowing and bursts of evolution shared among different words.</p>
</sec>
<sec id="sec018">
<title>Validation, testing and quality management</title>
<p>One challenge of developing a software project involving a large distributed team of varying backgrounds is maintaining a high level of quality and a uniformity of validation and testing protocols. As this project has developed organically, most of the efforts in this direction have thus far been informal. We encourage all BEAST package developers to develop open-source solutions, employ unit tests, use established verification techniques and, where appropriate, to submit new methodology for peer-review in the primary literature, preferably using open access solutions. This culture is well-embedded, and many packages conform to these basic principles. However, there is potentially a need going forward for a more formal process to assess packages for correctness and quality.</p>
<p>Within the core developer group, we have worked over many years to develop a broad range of tools and approaches for testing and verification of correctness (e.g. see sections 4.1 and 4.2 in [<xref ref-type="bibr" rid="pcbi.1006650.ref005">5</xref>] for a typical example). Some of us are currently working on providing a set of formal guidelines and testing tools to aid developers of third-party packages. The core developers plan to put much more effort into this area in the near future. In the meantime, we recommend that each package be evaluated independently by users, based on the published documentation.</p>
</sec>
<sec id="sec019">
<title>Availability and future directions</title>
<p>BEAST is available under the LGPL licence from <ext-link ext-link-type="uri" xlink:href="https://github.com/CompEvol/BEAST2" xlink:type="simple">https://github.com/CompEvol/BEAST2</ext-link> and is based on Java, so runs on any platform that supports Java. More information, including downloads, tutorials, news updates, frequently asked questions, etc. can be found on <ext-link ext-link-type="uri" xlink:href="http://beast2.org/" xlink:type="simple">http://beast2.org/</ext-link>. Additionally, tutorials for many of the described packages can be found as part of the <ext-link ext-link-type="uri" xlink:href="http://taming-the-beast.org/" xlink:type="simple">http://taming-the-beast.org/</ext-link> platform [<xref ref-type="bibr" rid="pcbi.1006650.ref116">116</xref>]. At Google groups, there is a forum (<ext-link ext-link-type="uri" xlink:href="https://groups.google.com/forum/#!forum/beast-users" xlink:type="simple">https://groups.google.com/forum/#!forum/beast-users</ext-link>) for users to discuss questions.</p>
<p>BEAST 1 is still being developed with a focus on epidemiology of infectious disease, and given its common pedigree it is not surprising that there is considerable overlap in functionality of BEAST 1 and 2. With this in mind, the project X-BEAST (pronounced cross-beast) (<ext-link ext-link-type="uri" xlink:href="https://github.com/rbouckaert/xbeast" xlink:type="simple">https://github.com/rbouckaert/xbeast</ext-link>) is being developed, which aims at making the two versions of BEAST interoperable, so models from both versions can be used in the same analysis. This non-trivial software engineering problem is something we hope will yield fruit in the near future.</p>
</sec>
<sec id="sec020" sec-type="conclusions">
<title>Discussion and conclusion</title>
<p>Since the first release of BEAST 2 there has been a large expansion of core features, an increase in the number of developers, and a large increase in the number of models and the number of packages available. There has also been the publication of a book [<xref ref-type="bibr" rid="pcbi.1006650.ref002">2</xref>] and the introduction of a regular series of week-long in-depth Taming the BEAST workshops [<xref ref-type="bibr" rid="pcbi.1006650.ref116">116</xref>]. The BEAST 2 community has rapidly grown over the past 5 years and the software has grown (with respect to other similar software packages) in a number of distinct directions: (i) hierarchical multi-species coalescent models for species tree estimation, (ii) fossilized birth-death models for macroevolution and total-evidence analyses, (iii) multi-state birth-death and structured coalescent epidemiological models for understanding rapidly evolving infectious diseases, and (iv) new model averaging and model comparison methods including nested sampling. BEAST 2 now occupies a unique niche in the landscape of Bayesian phylogenetic inference software, but still shares a very similar modelling philosophy with both BEAST 1.10 [<xref ref-type="bibr" rid="pcbi.1006650.ref117">117</xref>] and RevBayes [<xref ref-type="bibr" rid="pcbi.1006650.ref118">118</xref>]. Multiple platforms provide a valuable opportunity to validate complex new models by comparing independent implementations, and to test different approaches to modelling and inference. On the other hand, a lack of interoperability means that combining models from two different platforms is currently not possible. So one aim for the future may be to work harder on interoperability between these different platforms. To do so will require a common language for model specification. This is currently the biggest hurdle and an obvious target for future work.</p>
</sec>
</body>
<back>
<ack>
<p>We would like to acknowledge all additional contributors to BEAST 2 and the Taming the BEAST workshops including Veronika Bošková, David Bryant, Arjun Dhawan, Tracy Heath, Simon Ho, Stéphane Hué, Carsten Magnus, Patricio Maturana, Vladimir Minin, Venelin Mitov, Jūlija Pečerska, Oliver Pybus, Jérémie Sciré, Christiaan Swanepoel, Erik Volz, Rachel Warnock, David Welch, Jing Yang, Rong Zhang.</p>
</ack>
<ref-list>
<title>References</title>
<ref id="pcbi.1006650.ref001">
<label>1</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Bouckaert</surname> <given-names>R</given-names></name>, <name name-style="western"><surname>Heled</surname> <given-names>J</given-names></name>, <name name-style="western"><surname>Kühnert</surname> <given-names>D</given-names></name>, <name name-style="western"><surname>Vaughan</surname> <given-names>T</given-names></name>, <name name-style="western"><surname>Wu</surname> <given-names>CH</given-names></name>, <name name-style="western"><surname>Xie</surname> <given-names>D</given-names></name>, <etal>et al</etal>. <article-title>BEAST 2: a software platform for Bayesian evolutionary analysis</article-title>. <source>PLoS computational biology</source>. <year>2014</year>;<volume>10</volume>(<issue>4</issue>):<fpage>e1003537</fpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1371/journal.pcbi.1003537" xlink:type="simple">10.1371/journal.pcbi.1003537</ext-link></comment> <object-id pub-id-type="pmid">24722319</object-id></mixed-citation>
</ref>
<ref id="pcbi.1006650.ref002">
<label>2</label>
<mixed-citation publication-type="book" xlink:type="simple">
<name name-style="western"><surname>Drummond</surname> <given-names>AJ</given-names></name>, <name name-style="western"><surname>Bouckaert</surname> <given-names>RR</given-names></name>. <source>Bayesian evolutionary analysis with BEAST</source>. <publisher-name>Cambridge University Press</publisher-name>; <year>2015</year>.</mixed-citation>
</ref>
<ref id="pcbi.1006650.ref003">
<label>3</label>
<mixed-citation publication-type="other" xlink:type="simple">Bouckaert R, Heled J. DensiTree 2: Seeing trees through the forest. bioRxiv. 2014; p. 012401.</mixed-citation>
</ref>
<ref id="pcbi.1006650.ref004">
<label>4</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Vaughan</surname> <given-names>TG</given-names></name>, <name name-style="western"><surname>Drummond</surname> <given-names>AJ</given-names></name>. <article-title>A stochastic simulator of birth–death master equations with application to phylodynamics</article-title>. <source>Molecular biology and evolution</source>. <year>2013</year>;<volume>30</volume>(<issue>6</issue>):<fpage>1480</fpage>–<lpage>1493</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1093/molbev/mst057" xlink:type="simple">10.1093/molbev/mst057</ext-link></comment> <object-id pub-id-type="pmid">23505043</object-id></mixed-citation>
</ref>
<ref id="pcbi.1006650.ref005">
<label>5</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Vaughan</surname> <given-names>TG</given-names></name>, <name name-style="western"><surname>Kühnert</surname> <given-names>D</given-names></name>, <name name-style="western"><surname>Popinga</surname> <given-names>A</given-names></name>, <name name-style="western"><surname>Welch</surname> <given-names>D</given-names></name>, <name name-style="western"><surname>Drummond</surname> <given-names>AJ</given-names></name>. <article-title>Efficient Bayesian inference under the structured coalescent</article-title>. <source>Bioinformatics</source>. <year>2014</year>;<volume>30</volume>(<issue>16</issue>):<fpage>2272</fpage>–<lpage>2279</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1093/bioinformatics/btu201" xlink:type="simple">10.1093/bioinformatics/btu201</ext-link></comment> <object-id pub-id-type="pmid">24753484</object-id></mixed-citation>
</ref>
<ref id="pcbi.1006650.ref006">
<label>6</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Bouckaert</surname> <given-names>R</given-names></name>, <name name-style="western"><surname>Alvarado-Mora</surname> <given-names>MV</given-names></name>, <name name-style="western"><surname>Pinho</surname> <given-names>JR</given-names></name>, <etal>et al</etal>. <article-title>Evolutionary rates and HBV: issues of rate estimation with Bayesian molecular methods</article-title>. <source>Antivir Ther</source>. <year>2013</year>;<volume>18</volume>(<issue>3 Pt B</issue>):<fpage>497</fpage>–<lpage>503</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.3851/IMP2656" xlink:type="simple">10.3851/IMP2656</ext-link></comment> <object-id pub-id-type="pmid">23792904</object-id></mixed-citation>
</ref>
<ref id="pcbi.1006650.ref007">
<label>7</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Bryant</surname> <given-names>D</given-names></name>, <name name-style="western"><surname>Bouckaert</surname> <given-names>R</given-names></name>, <name name-style="western"><surname>Felsenstein</surname> <given-names>J</given-names></name>, <name name-style="western"><surname>Rosenberg</surname> <given-names>NA</given-names></name>, <name name-style="western"><surname>RoyChoudhury</surname> <given-names>A</given-names></name>. <article-title>Inferring species trees directly from biallelic genetic markers: bypassing gene trees in a full coalescent analysis</article-title>. <source>Molecular biology and evolution</source>. <year>2012</year>;<volume>29</volume>(<issue>8</issue>):<fpage>1917</fpage>–<lpage>1932</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1093/molbev/mss086" xlink:type="simple">10.1093/molbev/mss086</ext-link></comment> <object-id pub-id-type="pmid">22422763</object-id></mixed-citation>
</ref>
<ref id="pcbi.1006650.ref008">
<label>8</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Wu</surname> <given-names>CH</given-names></name>, <name name-style="western"><surname>Suchard</surname> <given-names>MA</given-names></name>, <name name-style="western"><surname>Drummond</surname> <given-names>AJ</given-names></name>. <article-title>Bayesian selection of nucleotide substitution models and their site assignments</article-title>. <source>Molecular biology and evolution</source>. <year>2012</year>;<volume>30</volume>(<issue>3</issue>):<fpage>669</fpage>–<lpage>688</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1093/molbev/mss258" xlink:type="simple">10.1093/molbev/mss258</ext-link></comment> <object-id pub-id-type="pmid">23233462</object-id></mixed-citation>
</ref>
<ref id="pcbi.1006650.ref009">
<label>9</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Stadler</surname> <given-names>T</given-names></name>, <name name-style="western"><surname>Kühnert</surname> <given-names>D</given-names></name>, <name name-style="western"><surname>Bonhoeffer</surname> <given-names>S</given-names></name>, <name name-style="western"><surname>Drummond</surname> <given-names>AJ</given-names></name>. <article-title>Birth–death skyline plot reveals temporal changes of epidemic spread in HIV and hepatitis C virus (HCV)</article-title>. <source>Proceedings of the National Academy of Sciences</source>. <year>2013</year>;<volume>110</volume>(<issue>1</issue>):<fpage>228</fpage>–<lpage>233</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1073/pnas.1207965110" xlink:type="simple">10.1073/pnas.1207965110</ext-link></comment></mixed-citation>
</ref>
<ref id="pcbi.1006650.ref010">
<label>10</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Hinchliff</surname> <given-names>CE</given-names></name>, <name name-style="western"><surname>Smith</surname> <given-names>SA</given-names></name>, <name name-style="western"><surname>Allman</surname> <given-names>JF</given-names></name>, <name name-style="western"><surname>Burleigh</surname> <given-names>JG</given-names></name>, <name name-style="western"><surname>Chaudhary</surname> <given-names>R</given-names></name>, <name name-style="western"><surname>Coghill</surname> <given-names>LM</given-names></name>, <etal>et al</etal>. <article-title>Synthesis of phylogeny and taxonomy into a comprehensive tree of life</article-title>. <source>Proc Natl Acad Sci U S A</source>. <year>2015</year>;<volume>112</volume>(<issue>41</issue>):<fpage>12764</fpage>–<lpage>9</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1073/pnas.1423041112" xlink:type="simple">10.1073/pnas.1423041112</ext-link></comment> <object-id pub-id-type="pmid">26385966</object-id></mixed-citation>
</ref>
<ref id="pcbi.1006650.ref011">
<label>11</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>De Maio</surname> <given-names>N</given-names></name>, <name name-style="western"><surname>Schrempf</surname> <given-names>D</given-names></name>, <name name-style="western"><surname>Kosiol</surname> <given-names>C</given-names></name>. <article-title>PoMo: an allele frequency-based approach for species tree estimation</article-title>. <source>Systematic biology</source>. <year>2015</year>;<volume>64</volume>(<issue>6</issue>):<fpage>1018</fpage>–<lpage>1031</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1093/sysbio/syv048" xlink:type="simple">10.1093/sysbio/syv048</ext-link></comment> <object-id pub-id-type="pmid">26209413</object-id></mixed-citation>
</ref>
<ref id="pcbi.1006650.ref012">
<label>12</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>De Maio</surname> <given-names>N</given-names></name>, <name name-style="western"><surname>Worby</surname> <given-names>CJ</given-names></name>, <name name-style="western"><surname>Wilson</surname> <given-names>DJ</given-names></name>, <name name-style="western"><surname>Stoesser</surname> <given-names>N</given-names></name>. <article-title>Bayesian reconstruction of transmission within outbreaks using genomic variants</article-title>. <source>PLoS computational biology</source>. <year>2018</year>;<volume>14</volume>(<issue>4</issue>):<fpage>e1006117</fpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1371/journal.pcbi.1006117" xlink:type="simple">10.1371/journal.pcbi.1006117</ext-link></comment> <object-id pub-id-type="pmid">29668677</object-id></mixed-citation>
</ref>
<ref id="pcbi.1006650.ref013">
<label>13</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Gavryushkina</surname> <given-names>A</given-names></name>, <name name-style="western"><surname>Welch</surname> <given-names>D</given-names></name>, <name name-style="western"><surname>Stadler</surname> <given-names>T</given-names></name>, <name name-style="western"><surname>Drummond</surname> <given-names>AJ</given-names></name>. <article-title>Bayesian inference of sampled ancestor trees for epidemiology and fossil calibration</article-title>. <source>PLoS computational biology</source>. <year>2014</year>;<volume>10</volume>(<issue>12</issue>):<fpage>e1003919</fpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1371/journal.pcbi.1003919" xlink:type="simple">10.1371/journal.pcbi.1003919</ext-link></comment> <object-id pub-id-type="pmid">25474353</object-id></mixed-citation>
</ref>
<ref id="pcbi.1006650.ref014">
<label>14</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Vaughan</surname> <given-names>TG</given-names></name>, <name name-style="western"><surname>Welch</surname> <given-names>D</given-names></name>, <name name-style="western"><surname>Drummond</surname> <given-names>AJ</given-names></name>, <name name-style="western"><surname>Biggs</surname> <given-names>PJ</given-names></name>, <name name-style="western"><surname>George</surname> <given-names>T</given-names></name>, <name name-style="western"><surname>French</surname> <given-names>NP</given-names></name>. <article-title>Inferring ancestral recombination graphs from bacterial genomic data</article-title>. <source>Genetics</source>. <year>2017</year>;<volume>205</volume>(<issue>2</issue>):<fpage>857</fpage>–<lpage>870</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1534/genetics.116.193425" xlink:type="simple">10.1534/genetics.116.193425</ext-link></comment> <object-id pub-id-type="pmid">28007885</object-id></mixed-citation>
</ref>
<ref id="pcbi.1006650.ref015">
<label>15</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Zhang</surname> <given-names>C</given-names></name>, <name name-style="western"><surname>Ogilvie</surname> <given-names>HA</given-names></name>, <name name-style="western"><surname>Drummond</surname> <given-names>AJ</given-names></name>, <name name-style="western"><surname>Stadler</surname> <given-names>T</given-names></name>. <article-title>Bayesian inference of species networks from multilocus sequence data</article-title>. <source>Molecular biology and evolution</source>. <year>2017</year>; p. msx307.</mixed-citation>
</ref>
<ref id="pcbi.1006650.ref016">
<label>16</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Bouckaert</surname> <given-names>RR</given-names></name>, <name name-style="western"><surname>Drummond</surname> <given-names>AJ</given-names></name>. <article-title>bModelTest: Bayesian phylogenetic site model averaging and model comparison</article-title>. <source>BMC evolutionary biology</source>. <year>2017</year>;<volume>17</volume>(<issue>1</issue>):<fpage>42</fpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1186/s12862-017-0890-6" xlink:type="simple">10.1186/s12862-017-0890-6</ext-link></comment> <object-id pub-id-type="pmid">28166715</object-id></mixed-citation>
</ref>
<ref id="pcbi.1006650.ref017">
<label>17</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Goldman</surname> <given-names>N</given-names></name>, <name name-style="western"><surname>Yang</surname> <given-names>Z</given-names></name>. <article-title>A codon-based model of nucleotide substitution for protein-coding DNA sequences</article-title>. <source>Molecular biology and evolution</source>. <year>1994</year>;<volume>11</volume>(<issue>5</issue>):<fpage>725</fpage>–<lpage>736</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1093/oxfordjournals.molbev.a040153" xlink:type="simple">10.1093/oxfordjournals.molbev.a040153</ext-link></comment> <object-id pub-id-type="pmid">7968486</object-id></mixed-citation>
</ref>
<ref id="pcbi.1006650.ref018">
<label>18</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Yang</surname> <given-names>Z</given-names></name>, <name name-style="western"><surname>Nielsen</surname> <given-names>R</given-names></name>, <name name-style="western"><surname>Goldman</surname> <given-names>N</given-names></name>, <name name-style="western"><surname>Pedersen</surname> <given-names>AMK</given-names></name>. <article-title>Codon-substitution models for heterogeneous selection pressure at amino acid sites</article-title>. <source>Genetics</source>. <year>2000</year>;<volume>155</volume>(<issue>1</issue>):<fpage>431</fpage>–<lpage>449</lpage>. <object-id pub-id-type="pmid">10790415</object-id></mixed-citation>
</ref>
<ref id="pcbi.1006650.ref019">
<label>19</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Lewis</surname> <given-names>PO</given-names></name>. <article-title>A likelihood approach to estimating phylogeny from discrete morphological character data</article-title>. <source>Systematic biology</source>. <year>2001</year>;<volume>50</volume>(<issue>6</issue>):<fpage>913</fpage>–<lpage>925</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1080/106351501753462876" xlink:type="simple">10.1080/106351501753462876</ext-link></comment> <object-id pub-id-type="pmid">12116640</object-id></mixed-citation>
</ref>
<ref id="pcbi.1006650.ref020">
<label>20</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Sainudiin</surname> <given-names>R</given-names></name>, <name name-style="western"><surname>Durrett</surname> <given-names>RT</given-names></name>, <name name-style="western"><surname>Aquadro</surname> <given-names>CF</given-names></name>, <name name-style="western"><surname>Nielsen</surname> <given-names>R</given-names></name>. <article-title>Microsatellite mutation models: insights from a comparison of humans and chimpanzees</article-title>. <source>Genetics</source>. <year>2004</year>;<volume>168</volume>(<issue>1</issue>):<fpage>383</fpage>–<lpage>395</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1534/genetics.103.022665" xlink:type="simple">10.1534/genetics.103.022665</ext-link></comment> <object-id pub-id-type="pmid">15454551</object-id></mixed-citation>
</ref>
<ref id="pcbi.1006650.ref021">
<label>21</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Wu</surname> <given-names>CH</given-names></name>, <name name-style="western"><surname>Drummond</surname> <given-names>AJ</given-names></name>. <article-title>Joint inference of microsatellite mutation models, population history and genealogies using transdimensional Markov Chain Monte Carlo</article-title>. <source>Genetics</source>. <year>2011</year>;<volume>188</volume>(<issue>1</issue>):<fpage>151</fpage>–<lpage>164</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1534/genetics.110.125260" xlink:type="simple">10.1534/genetics.110.125260</ext-link></comment> <object-id pub-id-type="pmid">21385725</object-id></mixed-citation>
</ref>
<ref id="pcbi.1006650.ref022">
<label>22</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>De Maio</surname> <given-names>N</given-names></name>, <name name-style="western"><surname>Schlötterer</surname> <given-names>C</given-names></name>, <name name-style="western"><surname>Kosiol</surname> <given-names>C</given-names></name>. <article-title>Linking great apes genome evolution across time scales using polymorphism-aware phylogenetic models</article-title>. <source>Molecular biology and evolution</source>. <year>2013</year>;<volume>30</volume>(<issue>10</issue>):<fpage>2249</fpage>–<lpage>2262</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1093/molbev/mst131" xlink:type="simple">10.1093/molbev/mst131</ext-link></comment> <object-id pub-id-type="pmid">23906727</object-id></mixed-citation>
</ref>
<ref id="pcbi.1006650.ref023">
<label>23</label>
<mixed-citation publication-type="other" xlink:type="simple">Bouckaert R, Lockhart P. Capturing heterotachy through multi-gamma site models. bioRxiv. 2015; p. 018101.</mixed-citation>
</ref>
<ref id="pcbi.1006650.ref024">
<label>24</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Fourment</surname> <given-names>M</given-names></name>, <name name-style="western"><surname>Darling</surname> <given-names>AE</given-names></name>. <article-title>Local and relaxed clocks: the best of both worlds</article-title>. <source>PeerJ</source>. <year>2018</year>;<volume>6</volume>:<fpage>e5140</fpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.7717/peerj.5140" xlink:type="simple">10.7717/peerj.5140</ext-link></comment> <object-id pub-id-type="pmid">30002973</object-id></mixed-citation>
</ref>
<ref id="pcbi.1006650.ref025">
<label>25</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Matschiner</surname> <given-names>M</given-names></name>, <name name-style="western"><surname>Musilová</surname> <given-names>Z</given-names></name>, <name name-style="western"><surname>Barth</surname> <given-names>JM</given-names></name>, <name name-style="western"><surname>Starostová</surname> <given-names>Z</given-names></name>, <name name-style="western"><surname>Salzburger</surname> <given-names>W</given-names></name>, <name name-style="western"><surname>Steel</surname> <given-names>M</given-names></name>, <etal>et al</etal>. <article-title>Bayesian phylogenetic estimation of clade ages supports trans-Atlantic dispersal of cichlid fishes</article-title>. <source>Systematic biology</source>. <year>2017</year>;<volume>66</volume>(<issue>1</issue>):<fpage>3</fpage>–<lpage>22</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1093/sysbio/syw076" xlink:type="simple">10.1093/sysbio/syw076</ext-link></comment> <object-id pub-id-type="pmid">28173588</object-id></mixed-citation>
</ref>
<ref id="pcbi.1006650.ref026">
<label>26</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Stadler</surname> <given-names>T</given-names></name>. <article-title>On incomplete sampling under birth–death models and connections to the sampling-based coalescent</article-title>. <source>Journal of theoretical biology</source>. <year>2009</year>;<volume>261</volume>(<issue>1</issue>):<fpage>58</fpage>–<lpage>66</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1016/j.jtbi.2009.07.018" xlink:type="simple">10.1016/j.jtbi.2009.07.018</ext-link></comment> <object-id pub-id-type="pmid">19631666</object-id></mixed-citation>
</ref>
<ref id="pcbi.1006650.ref027">
<label>27</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Popinga</surname> <given-names>A</given-names></name>, <name name-style="western"><surname>Vaughan</surname> <given-names>T</given-names></name>, <name name-style="western"><surname>Stadler</surname> <given-names>T</given-names></name>, <name name-style="western"><surname>Drummond</surname> <given-names>AJ</given-names></name>. <article-title>Inferring epidemiological dynamics with Bayesian coalescent inference: the merits of deterministic and stochastic models</article-title>. <source>Genetics</source>. <year>2014</year>; p. genetics–114. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1534/genetics.114.172791" xlink:type="simple">10.1534/genetics.114.172791</ext-link></comment> <object-id pub-id-type="pmid">25527289</object-id></mixed-citation>
</ref>
<ref id="pcbi.1006650.ref028">
<label>28</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Kühnert</surname> <given-names>D</given-names></name>, <name name-style="western"><surname>Stadler</surname> <given-names>T</given-names></name>, <name name-style="western"><surname>Vaughan</surname> <given-names>TG</given-names></name>, <name name-style="western"><surname>Drummond</surname> <given-names>AJ</given-names></name>. <article-title>Simultaneous reconstruction of evolutionary history and epidemiological dynamics from viral sequences with the birth–death SIR model</article-title>. <source>Journal of the Royal Society Interface</source>. <year>2014</year>;<volume>11</volume>(<issue>94</issue>):<fpage>20131106</fpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1098/rsif.2013.1106" xlink:type="simple">10.1098/rsif.2013.1106</ext-link></comment></mixed-citation>
</ref>
<ref id="pcbi.1006650.ref029">
<label>29</label>
<mixed-citation publication-type="other" xlink:type="simple">Vaughan TG, Leventhal GE, Rasmussen DA, Drummond AJ, Welch D, Stadler T. Directly estimating epidemic curves from genomic data. bioRxiv. 2017; p. 142570.</mixed-citation>
</ref>
<ref id="pcbi.1006650.ref030">
<label>30</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Volz</surname> <given-names>EM</given-names></name>. <article-title>Complex population dynamics and the coalescent under neutrality</article-title>. <source>Genetics</source>. <year>2012</year>;<volume>190</volume>(<issue>1</issue>):<fpage>187</fpage>–<lpage>201</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1534/genetics.111.134627" xlink:type="simple">10.1534/genetics.111.134627</ext-link></comment></mixed-citation>
</ref>
<ref id="pcbi.1006650.ref031">
<label>31</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Kühnert</surname> <given-names>D</given-names></name>, <name name-style="western"><surname>Stadler</surname> <given-names>T</given-names></name>, <name name-style="western"><surname>Vaughan</surname> <given-names>TG</given-names></name>, <name name-style="western"><surname>Drummond</surname> <given-names>AJ</given-names></name>. <article-title>Phylodynamics with migration: a computational framework to quantify population structure from genomic data</article-title>. <source>Molecular biology and evolution</source>. <year>2016</year>;<volume>33</volume>(<issue>8</issue>):<fpage>2102</fpage>–<lpage>2116</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1093/molbev/msw064" xlink:type="simple">10.1093/molbev/msw064</ext-link></comment> <object-id pub-id-type="pmid">27189573</object-id></mixed-citation>
</ref>
<ref id="pcbi.1006650.ref032">
<label>32</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>De Maio</surname> <given-names>N</given-names></name>, <name name-style="western"><surname>Wu</surname> <given-names>CH</given-names></name>, <name name-style="western"><surname>O’Reilly</surname> <given-names>KM</given-names></name>, <name name-style="western"><surname>Wilson</surname> <given-names>D</given-names></name>. <article-title>New routes to phylogeography: a Bayesian structured coalescent approximation</article-title>. <source>PLoS genetics</source>. <year>2015</year>;<volume>11</volume>(<issue>8</issue>):<fpage>e1005421</fpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1371/journal.pgen.1005421" xlink:type="simple">10.1371/journal.pgen.1005421</ext-link></comment> <object-id pub-id-type="pmid">26267488</object-id></mixed-citation>
</ref>
<ref id="pcbi.1006650.ref033">
<label>33</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Müller</surname> <given-names>NF</given-names></name>, <name name-style="western"><surname>Rasmussen</surname> <given-names>D</given-names></name>, <name name-style="western"><surname>Stadler</surname> <given-names>T</given-names></name>. <article-title>MASCOT: parameter and state inference under the marginal structured coalescent approximation</article-title>. <source>Bioinformatics</source>. <year>2018</year>; p. bty406. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1093/bioinformatics/bty406" xlink:type="simple">10.1093/bioinformatics/bty406</ext-link></comment></mixed-citation>
</ref>
<ref id="pcbi.1006650.ref034">
<label>34</label>
<mixed-citation publication-type="other" xlink:type="simple">Müller NF, Dudas G, Stadler T. Inferring time-dependent migration and coalescence patterns from genetic sequence and predictor data in structured populations. bioRxiv. 2018; p. 342329.</mixed-citation>
</ref>
<ref id="pcbi.1006650.ref035">
<label>35</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>De Maio</surname> <given-names>N</given-names></name>, <name name-style="western"><surname>Wu</surname> <given-names>CH</given-names></name>, <name name-style="western"><surname>Wilson</surname> <given-names>DJ</given-names></name>. <article-title>SCOTTI: efficient reconstruction of transmission within outbreaks with the structured coalescent</article-title>. <source>PLoS computational biology</source>. <year>2016</year>;<volume>12</volume>(<issue>9</issue>):<fpage>e1005130</fpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1371/journal.pcbi.1005130" xlink:type="simple">10.1371/journal.pcbi.1005130</ext-link></comment> <object-id pub-id-type="pmid">27681228</object-id></mixed-citation>
</ref>
<ref id="pcbi.1006650.ref036">
<label>36</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Bouckaert</surname> <given-names>RR</given-names></name>, <name name-style="western"><surname>Bowern</surname> <given-names>C</given-names></name>, <name name-style="western"><surname>Atkinson</surname> <given-names>QD</given-names></name>. <article-title>The origin and expansion of Pama–Nyungan languages across Australia</article-title>. <source>Nature ecology &amp; evolution</source>. <year>2018</year>; p. <fpage>1</fpage>.</mixed-citation>
</ref>
<ref id="pcbi.1006650.ref037">
<label>37</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Bouckaert</surname> <given-names>R</given-names></name>. <article-title>Phylogeography by diffusion on a sphere: whole world phylogeography</article-title>. <source>PeerJ</source>. <year>2016</year>;<volume>4</volume>:<fpage>e2406</fpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.7717/peerj.2406" xlink:type="simple">10.7717/peerj.2406</ext-link></comment> <object-id pub-id-type="pmid">27651992</object-id></mixed-citation>
</ref>
<ref id="pcbi.1006650.ref038">
<label>38</label>
<mixed-citation publication-type="other" xlink:type="simple">Mendes FK, Bouckaert R, Drummond AJ. SSE, v.1.0.0. Zenodo. 2018.</mixed-citation>
</ref>
<ref id="pcbi.1006650.ref039">
<label>39</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Didelot</surname> <given-names>X</given-names></name>, <name name-style="western"><surname>Lawson</surname> <given-names>D</given-names></name>, <name name-style="western"><surname>Darling</surname> <given-names>A</given-names></name>, <name name-style="western"><surname>Falush</surname> <given-names>D</given-names></name>. <article-title>Inference of homologous recombination in bacteria using whole genome sequences</article-title>. <source>Genetics</source>. <year>2010</year>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1534/genetics.110.120121" xlink:type="simple">10.1534/genetics.110.120121</ext-link></comment></mixed-citation>
</ref>
<ref id="pcbi.1006650.ref040">
<label>40</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Jones</surname> <given-names>GR</given-names></name>. <article-title>Divergence Estimation in the Presence of Incomplete Lineage Sorting and Migration</article-title>. <source>Systematic Biology</source>. <year>2018</year>; p. syy041 <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1093/sysbio/syy041" xlink:type="simple">10.1093/sysbio/syy041</ext-link></comment></mixed-citation>
</ref>
<ref id="pcbi.1006650.ref041">
<label>41</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Jones</surname> <given-names>G</given-names></name>. <article-title>Algorithmic improvements to species delimitation and phylogeny estimation under the multispecies coalescent</article-title>. <source>Journal of mathematical biology</source>. <year>2017</year>;<volume>74</volume>(<issue>1-2</issue>):<fpage>447</fpage>–<lpage>467</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1007/s00285-016-1034-0" xlink:type="simple">10.1007/s00285-016-1034-0</ext-link></comment> <object-id pub-id-type="pmid">27287395</object-id></mixed-citation>
</ref>
<ref id="pcbi.1006650.ref042">
<label>42</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Ogilvie</surname> <given-names>HA</given-names></name>, <name name-style="western"><surname>Heled</surname> <given-names>J</given-names></name>, <name name-style="western"><surname>Xie</surname> <given-names>D</given-names></name>, <name name-style="western"><surname>Drummond</surname> <given-names>AJ</given-names></name>. <article-title>Computational performance and statistical accuracy of *BEAST and comparisons with other methods</article-title>. <source>Systematic biology</source>. <year>2016</year>;<volume>65</volume>(<issue>3</issue>):<fpage>381</fpage>–<lpage>396</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1093/sysbio/syv118" xlink:type="simple">10.1093/sysbio/syv118</ext-link></comment> <object-id pub-id-type="pmid">26821913</object-id></mixed-citation>
</ref>
<ref id="pcbi.1006650.ref043">
<label>43</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Ogilvie</surname> <given-names>HA</given-names></name>, <name name-style="western"><surname>Bouckaert</surname> <given-names>RR</given-names></name>, <name name-style="western"><surname>Drummond</surname> <given-names>AJ</given-names></name>. <article-title>StarBEAST2 brings faster species tree inference and accurate estimates of substitution rates</article-title>. <source>Molecular biology and evolution</source>. <year>2017</year>;<volume>34</volume>(<issue>8</issue>):<fpage>2101</fpage>–<lpage>2114</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1093/molbev/msx126" xlink:type="simple">10.1093/molbev/msx126</ext-link></comment> <object-id pub-id-type="pmid">28431121</object-id></mixed-citation>
</ref>
<ref id="pcbi.1006650.ref044">
<label>44</label>
<mixed-citation publication-type="other" xlink:type="simple">Ogilvie HA, Vaughan TG, Matzke NJ, Slater GJ, Stadler T, Welch D, et al. Inferring Species Trees Using Integrative Models of Species Evolution. bioRxiv. 2018.</mixed-citation>
</ref>
<ref id="pcbi.1006650.ref045">
<label>45</label>
<mixed-citation publication-type="other" xlink:type="simple">Müller NF, Ogilvie H, Zhang C, Drummond A, Stadler T. Inference of species histories in the presence of gene flow. bioRxiv. 2018; p. 348391.</mixed-citation>
</ref>
<ref id="pcbi.1006650.ref046">
<label>46</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Xie</surname> <given-names>W</given-names></name>, <name name-style="western"><surname>Lewis</surname> <given-names>PO</given-names></name>, <name name-style="western"><surname>Fan</surname> <given-names>Y</given-names></name>, <name name-style="western"><surname>Kuo</surname> <given-names>L</given-names></name>, <name name-style="western"><surname>Chen</surname> <given-names>MH</given-names></name>. <article-title>Improving marginal likelihood estimation for Bayesian phylogenetic model selection</article-title>. <source>Systematic biology</source>. <year>2010</year>;<volume>60</volume>(<issue>2</issue>):<fpage>150</fpage>–<lpage>160</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1093/sysbio/syq085" xlink:type="simple">10.1093/sysbio/syq085</ext-link></comment> <object-id pub-id-type="pmid">21187451</object-id></mixed-citation>
</ref>
<ref id="pcbi.1006650.ref047">
<label>47</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Maturana Russel</surname> <given-names>P</given-names></name>, <name name-style="western"><surname>Brewer</surname> <given-names>BJ</given-names></name>, <name name-style="western"><surname>Klaere</surname> <given-names>S</given-names></name>, <name name-style="western"><surname>Bouckaert</surname> <given-names>RR</given-names></name>. <article-title>Model selection and parameter inference in phylogenetics using Nested Sampling</article-title>. <source>Syst Biol</source>. <year>2018</year>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1093/sysbio/syy050" xlink:type="simple">10.1093/sysbio/syy050</ext-link></comment></mixed-citation>
</ref>
<ref id="pcbi.1006650.ref048">
<label>48</label>
<mixed-citation publication-type="other" xlink:type="simple">Bradley S. Synthetic Language Generation and Model Validation in BEAST2. arXiv preprint arXiv:1607.07931. 2016.</mixed-citation>
</ref>
<ref id="pcbi.1006650.ref049">
<label>49</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Duchene</surname> <given-names>S</given-names></name>, <name name-style="western"><surname>Bouckaert</surname> <given-names>R</given-names></name>, <name name-style="western"><surname>Duchene</surname> <given-names>DA</given-names></name>, <name name-style="western"><surname>Stadler</surname> <given-names>T</given-names></name>, <name name-style="western"><surname>Drummond</surname> <given-names>AJ</given-names></name>. <article-title>Phylodynamic model adequacy using posterior predictive simulations</article-title>. <source>Systematic Biology</source>. In press.</mixed-citation>
</ref>
<ref id="pcbi.1006650.ref050">
<label>50</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Yang</surname> <given-names>Z</given-names></name>, <name name-style="western"><surname>Yoder</surname> <given-names>AD</given-names></name>. <article-title>Comparison of likelihood and Bayesian methods for estimating divergence times using multiple gene loci and calibration points, with application to a radiation of cute-looking mouse lemur species</article-title>. <source>Systematic biology</source>. <year>2003</year>;<volume>52</volume>(<issue>5</issue>):<fpage>705</fpage>–<lpage>716</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1080/10635150390235557" xlink:type="simple">10.1080/10635150390235557</ext-link></comment> <object-id pub-id-type="pmid">14530137</object-id></mixed-citation>
</ref>
<ref id="pcbi.1006650.ref051">
<label>51</label>
<mixed-citation publication-type="other" xlink:type="simple">Bouckaert R, Robbeets M. Pseudo Dollo models for the evolution of binary characters along a tree. bioRxiv. 2017; p. 207571.</mixed-citation>
</ref>
<ref id="pcbi.1006650.ref052">
<label>52</label>
<mixed-citation publication-type="book" xlink:type="simple">
<name name-style="western"><surname>Yang</surname> <given-names>Z</given-names></name>. <source>Computational molecular evolution</source>. <publisher-name>Oxford University Press</publisher-name>; <year>2006</year>.</mixed-citation>
</ref>
<ref id="pcbi.1006650.ref053">
<label>53</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Drummond</surname> <given-names>AJ</given-names></name>, <name name-style="western"><surname>Ho</surname> <given-names>SY</given-names></name>, <name name-style="western"><surname>Phillips</surname> <given-names>MJ</given-names></name>, <name name-style="western"><surname>Rambaut</surname> <given-names>A</given-names></name>. <article-title>Relaxed phylogenetics and dating with confidence</article-title>. <source>PLoS biology</source>. <year>2006</year>;<volume>4</volume>(<issue>5</issue>):<fpage>e88</fpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1371/journal.pbio.0040088" xlink:type="simple">10.1371/journal.pbio.0040088</ext-link></comment> <object-id pub-id-type="pmid">16683862</object-id></mixed-citation>
</ref>
<ref id="pcbi.1006650.ref054">
<label>54</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Drummond</surname> <given-names>AJ</given-names></name>, <name name-style="western"><surname>Suchard</surname> <given-names>MA</given-names></name>. <article-title>Bayesian random local clocks, or one rate to rule them all</article-title>. <source>BMC biology</source>. <year>2010</year>;<volume>8</volume>(<issue>1</issue>):<fpage>114</fpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1186/1741-7007-8-114" xlink:type="simple">10.1186/1741-7007-8-114</ext-link></comment> <object-id pub-id-type="pmid">20807414</object-id></mixed-citation>
</ref>
<ref id="pcbi.1006650.ref055">
<label>55</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Yule</surname> <given-names>GU</given-names></name>. <article-title>A mathematical theory of evolution, based on the conclusions of Dr. JC Willis, FRS</article-title>. <source>Philosophical Transactions of the Royal Society of London Series B</source>. <year>1925</year>;<volume>213</volume>:<fpage>21</fpage>–<lpage>87</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1098/rstb.1925.0002" xlink:type="simple">10.1098/rstb.1925.0002</ext-link></comment></mixed-citation>
</ref>
<ref id="pcbi.1006650.ref056">
<label>56</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Kendall</surname> <given-names>DG</given-names></name>. <article-title>Stochastic processes and population growth</article-title>. <source>Journal of the Royal Statistical Society Series B (Methodological)</source>. <year>1949</year>;<volume>11</volume>(<issue>2</issue>):<fpage>230</fpage>–<lpage>282</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1111/j.2517-6161.1949.tb00032.x" xlink:type="simple">10.1111/j.2517-6161.1949.tb00032.x</ext-link></comment></mixed-citation>
</ref>
<ref id="pcbi.1006650.ref057">
<label>57</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Stadler</surname> <given-names>T</given-names></name>. <article-title>Sampling-through-time in birth-death trees</article-title>. <source>Journal of Theoretical Biology</source>. <year>2010</year>;<volume>267</volume>(<issue>3</issue>):<fpage>396</fpage>–<lpage>404</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1016/j.jtbi.2010.09.010" xlink:type="simple">10.1016/j.jtbi.2010.09.010</ext-link></comment> <object-id pub-id-type="pmid">20851708</object-id></mixed-citation>
</ref>
<ref id="pcbi.1006650.ref058">
<label>58</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Kingman</surname> <given-names>JFC</given-names></name>. <article-title>The coalescent</article-title>. <source>Stochastic Processes and their Applications</source>. <year>1982</year>;<volume>13</volume>(<issue>3</issue>):<fpage>235</fpage>–<lpage>248</lpage>. <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1016/0304-4149(82)90011-4" xlink:type="simple">https://doi.org/10.1016/0304-4149(82)90011-4</ext-link>.</mixed-citation>
</ref>
<ref id="pcbi.1006650.ref059">
<label>59</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Griffiths</surname> <given-names>RC</given-names></name>, <name name-style="western"><surname>Tavaré</surname> <given-names>S</given-names></name>. <article-title>Sampling theory for neutral alleles in a varying environment</article-title>. <source>Philosophical Transactions of the Royal Society B: Biological Sciences</source>. <year>1994</year>;<volume>344</volume>(<issue>1310</issue>):<fpage>403</fpage>–<lpage>410</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1098/rstb.1994.0079" xlink:type="simple">10.1098/rstb.1994.0079</ext-link></comment></mixed-citation>
</ref>
<ref id="pcbi.1006650.ref060">
<label>60</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Drummond</surname> <given-names>A</given-names></name>, <name name-style="western"><surname>Nicholls</surname> <given-names>G</given-names></name>, <name name-style="western"><surname>Rodrigo</surname> <given-names>A</given-names></name>, <name name-style="western"><surname>Solomon</surname> <given-names>W</given-names></name>. <article-title>Estimating Mutation Parameters, Population History and Genealogy Simultaneously From Temporally Spaced Sequence Data</article-title>. <source>Genetics</source>. <year>2002</year>;<volume>161</volume>:<fpage>1307</fpage>–<lpage>1320</lpage>. <object-id pub-id-type="pmid">12136032</object-id></mixed-citation>
</ref>
<ref id="pcbi.1006650.ref061">
<label>61</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Drummond</surname> <given-names>AJ</given-names></name>, <name name-style="western"><surname>Rambaut</surname> <given-names>A</given-names></name>. <article-title>BEAST: Bayesian evolutionary analysis by sampling trees</article-title>. <source>BMC evolutionary biology</source>. <year>2007</year>;<volume>7</volume>(<issue>1</issue>):<fpage>214</fpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1186/1471-2148-7-214" xlink:type="simple">10.1186/1471-2148-7-214</ext-link></comment> <object-id pub-id-type="pmid">17996036</object-id></mixed-citation>
</ref>
<ref id="pcbi.1006650.ref062">
<label>62</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Stadler</surname> <given-names>T</given-names></name>, <name name-style="western"><surname>Kouyos</surname> <given-names>RD</given-names></name>, <name name-style="western"><surname>von Wyl</surname> <given-names>V</given-names></name>, <name name-style="western"><surname>Yerly</surname> <given-names>S</given-names></name>, <name name-style="western"><surname>Böni</surname> <given-names>J</given-names></name>, <name name-style="western"><surname>Bürgisser</surname> <given-names>P</given-names></name>, <etal>et al</etal>. <article-title>Estimating the basic reproductive number from viral sequence data</article-title>. <source>Mol Biol Evol</source>. <year>2012</year>;<volume>29</volume>:<fpage>347</fpage>–<lpage>357</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1093/molbev/msr217" xlink:type="simple">10.1093/molbev/msr217</ext-link></comment> <object-id pub-id-type="pmid">21890480</object-id></mixed-citation>
</ref>
<ref id="pcbi.1006650.ref063">
<label>63</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Whitty</surname> <given-names>CJM</given-names></name>, <name name-style="western"><surname>Farrar</surname> <given-names>J</given-names></name>, <name name-style="western"><surname>Ferguson</surname> <given-names>N</given-names></name>, <name name-style="western"><surname>Edmunds</surname> <given-names>WJ</given-names></name>, <name name-style="western"><surname>Piot</surname> <given-names>P</given-names></name>, <name name-style="western"><surname>Leach</surname> <given-names>M</given-names></name>, <etal>et al</etal>. <article-title>Infectious disease: Tough choices to reduce Ebola transmission</article-title>. <source>Nature</source>. <year>2014</year>;<volume>515</volume>(<issue>7526</issue>):<fpage>192</fpage>–<lpage>194</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1038/515192a" xlink:type="simple">10.1038/515192a</ext-link></comment> <object-id pub-id-type="pmid">25391946</object-id></mixed-citation>
</ref>
<ref id="pcbi.1006650.ref064">
<label>64</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<collab>WHO Ebola Response Team</collab>. <article-title>After Ebola in West Africa — Unpredictable Risks, Preventable Epidemics</article-title>. <source>New England Journal of Medicine</source>. <year>2016</year>;<volume>375</volume>(<issue>6</issue>):<fpage>587</fpage>–<lpage>596</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1056/NEJMsr1513109" xlink:type="simple">10.1056/NEJMsr1513109</ext-link></comment> <object-id pub-id-type="pmid">27509108</object-id></mixed-citation>
</ref>
<ref id="pcbi.1006650.ref065">
<label>65</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<collab>WHO Ebola Response Team</collab>. <article-title>West African Ebola Epidemic after One Year — Slowing but Not Yet under Control</article-title>. <source>New England Journal of Medicine</source>. <year>2015</year>;<volume>372</volume>(<issue>6</issue>):<fpage>584</fpage>–<lpage>587</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1056/NEJMc1414992" xlink:type="simple">10.1056/NEJMc1414992</ext-link></comment> <object-id pub-id-type="pmid">25539446</object-id></mixed-citation>
</ref>
<ref id="pcbi.1006650.ref066">
<label>66</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Kermack</surname> <given-names>W</given-names></name>, <name name-style="western"><surname>McKendrick</surname> <given-names>A</given-names></name>. <article-title>A contribution to the mathematical theory of epidemics</article-title>. <source>Proc Roy Soc A</source>. <year>1927</year>;<volume>115</volume>(<issue>772</issue>):<fpage>700</fpage>–<lpage>721</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1098/rspa.1927.0118" xlink:type="simple">10.1098/rspa.1927.0118</ext-link></comment></mixed-citation>
</ref>
<ref id="pcbi.1006650.ref067">
<label>67</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Nee</surname> <given-names>S</given-names></name>, <name name-style="western"><surname>Mooers</surname> <given-names>AO</given-names></name>, <name name-style="western"><surname>Harvey</surname> <given-names>PH</given-names></name>. <article-title>Tempo and mode of evolution revealed from molecular phylogenies</article-title>. <source>Proceedings of the National Academy of Sciences</source>. <year>1992</year>;<volume>89</volume>(<issue>17</issue>):<fpage>8322</fpage>–<lpage>8326</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1073/pnas.89.17.8322" xlink:type="simple">10.1073/pnas.89.17.8322</ext-link></comment></mixed-citation>
</ref>
<ref id="pcbi.1006650.ref068">
<label>68</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Heath</surname> <given-names>TA</given-names></name>, <name name-style="western"><surname>Huelsenbeck</surname> <given-names>JP</given-names></name>, <name name-style="western"><surname>Stadler</surname> <given-names>T</given-names></name>. <article-title>The fossilized birth–death process for coherent calibration of divergence-time estimates</article-title>. <source>Proceedings of the National Academy of Sciences</source>. <year>2014</year>;<volume>111</volume>(<issue>29</issue>):<fpage>E2957</fpage>–<lpage>E2966</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1073/pnas.1319091111" xlink:type="simple">10.1073/pnas.1319091111</ext-link></comment></mixed-citation>
</ref>
<ref id="pcbi.1006650.ref069">
<label>69</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Zhang</surname> <given-names>C</given-names></name>, <name name-style="western"><surname>Stadler</surname> <given-names>T</given-names></name>, <name name-style="western"><surname>Klopfstein</surname> <given-names>S</given-names></name>, <name name-style="western"><surname>Heath</surname> <given-names>TA</given-names></name>, <name name-style="western"><surname>Ronquist</surname> <given-names>F</given-names></name>. <article-title>Total-evidence dating under the fossilized birth–death process</article-title>. <source>Systematic biology</source>. <year>2015</year>;<volume>65</volume>(<issue>2</issue>):<fpage>228</fpage>–<lpage>249</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1093/sysbio/syv080" xlink:type="simple">10.1093/sysbio/syv080</ext-link></comment> <object-id pub-id-type="pmid">26493827</object-id></mixed-citation>
</ref>
<ref id="pcbi.1006650.ref070">
<label>70</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Gavryushkina</surname> <given-names>A</given-names></name>, <name name-style="western"><surname>Heath</surname> <given-names>TA</given-names></name>, <name name-style="western"><surname>Ksepka</surname> <given-names>DT</given-names></name>, <name name-style="western"><surname>Stadler</surname> <given-names>T</given-names></name>, <name name-style="western"><surname>Welch</surname> <given-names>D</given-names></name>, <name name-style="western"><surname>Drummond</surname> <given-names>AJ</given-names></name>. <article-title>Bayesian total-evidence dating reveals the recent crown radiation of penguins</article-title>. <source>Systematic biology</source>. <year>2017</year>;<volume>66</volume>(<issue>1</issue>):<fpage>57</fpage>–<lpage>73</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1093/sysbio/syw060" xlink:type="simple">10.1093/sysbio/syw060</ext-link></comment> <object-id pub-id-type="pmid">28173531</object-id></mixed-citation>
</ref>
<ref id="pcbi.1006650.ref071">
<label>71</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Pyron</surname> <given-names>RA</given-names></name>. <article-title>Divergence Time Estimation Using Fossils as Terminal Taxa and the Origins of Lissamphibia</article-title>. <source>Systematic Biology</source>. <year>2011</year>;<volume>60</volume>:<fpage>466</fpage>–<lpage>481</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1093/sysbio/syr047" xlink:type="simple">10.1093/sysbio/syr047</ext-link></comment> <object-id pub-id-type="pmid">21540408</object-id></mixed-citation>
</ref>
<ref id="pcbi.1006650.ref072">
<label>72</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Ronquist</surname> <given-names>F</given-names></name>, <name name-style="western"><surname>Klopfstein</surname> <given-names>S</given-names></name>, <name name-style="western"><surname>Vilhelmsen</surname> <given-names>L</given-names></name>, <name name-style="western"><surname>Schulmeister</surname> <given-names>S</given-names></name>, <name name-style="western"><surname>Murray</surname> <given-names>DL</given-names></name>, <name name-style="western"><surname>Rasnitsyn</surname> <given-names>AP</given-names></name>. <article-title>A total-evidence approach to dating with fossils, applied to the early radiation of the Hymenoptera</article-title>. <source>Systematic Biology</source>. <year>2012</year>;<volume>61</volume>(<issue>6</issue>):<fpage>973</fpage>–<lpage>999</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1093/sysbio/sys058" xlink:type="simple">10.1093/sysbio/sys058</ext-link></comment> <object-id pub-id-type="pmid">22723471</object-id></mixed-citation>
</ref>
<ref id="pcbi.1006650.ref073">
<label>73</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Heled</surname> <given-names>J</given-names></name>, <name name-style="western"><surname>Drummond</surname> <given-names>AJ</given-names></name>. <article-title>Calibrated tree priors for relaxed phylogenetics and divergence time estimation</article-title>. <source>Systematic Biology</source>. <year>2011</year>;<volume>61</volume>(<issue>1</issue>):<fpage>138</fpage>–<lpage>149</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1093/sysbio/syr087" xlink:type="simple">10.1093/sysbio/syr087</ext-link></comment> <object-id pub-id-type="pmid">21856631</object-id></mixed-citation>
</ref>
<ref id="pcbi.1006650.ref074">
<label>74</label>
<mixed-citation publication-type="other" xlink:type="simple">Matzke NJ, Wright A. Ground truthing tip-dating methods using fossil Canidae reveals major differences in performance. bioRxiv. 2016; p. 049643.</mixed-citation>
</ref>
<ref id="pcbi.1006650.ref075">
<label>75</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Maddison</surname> <given-names>WP</given-names></name>, <name name-style="western"><surname>Midford</surname> <given-names>PE</given-names></name>, <name name-style="western"><surname>Otto</surname> <given-names>SP</given-names></name>. <article-title>Estimating a binary character’s effect on speciation and extinction</article-title>. <source>Systematic biology</source>. <year>2007</year>;<volume>56</volume>(<issue>5</issue>):<fpage>701</fpage>–<lpage>710</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1080/10635150701607033" xlink:type="simple">10.1080/10635150701607033</ext-link></comment> <object-id pub-id-type="pmid">17849325</object-id></mixed-citation>
</ref>
<ref id="pcbi.1006650.ref076">
<label>76</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Müller</surname> <given-names>NF</given-names></name>, <name name-style="western"><surname>Rasmussen</surname> <given-names>DA</given-names></name>, <name name-style="western"><surname>Stadler</surname> <given-names>T</given-names></name>. <article-title>The Structured Coalescent and Its Approximations</article-title>. <source>Molecular biology and evolution</source>. <year>2017</year>;<volume>34</volume>(<issue>11</issue>):<fpage>2970</fpage>–<lpage>2981</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1093/molbev/msx186" xlink:type="simple">10.1093/molbev/msx186</ext-link></comment> <object-id pub-id-type="pmid">28666382</object-id></mixed-citation>
</ref>
<ref id="pcbi.1006650.ref077">
<label>77</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Volz</surname> <given-names>E</given-names></name>, <name name-style="western"><surname>Siveroni</surname> <given-names>I</given-names></name>. <article-title>Bayesian phylodynamic inference with complex models</article-title>. <source>PLOS Computational Biology</source>. <year>2018</year>;<volume>14</volume>(<issue>11</issue>):<fpage>e1006546</fpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1371/journal.pcbi.1006546" xlink:type="simple">10.1371/journal.pcbi.1006546</ext-link></comment> <object-id pub-id-type="pmid">30422979</object-id></mixed-citation>
</ref>
<ref id="pcbi.1006650.ref078">
<label>78</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Beerli</surname> <given-names>P</given-names></name>, <name name-style="western"><surname>Felsenstein</surname> <given-names>J</given-names></name>. <article-title>Maximum likelihood estimation of a migration matrix and effective population sizes in n subpopulations by using a coalescent approach</article-title>. <source>Proceedings of the National Academy of Sciences</source>. <year>2001</year>;<volume>98</volume>(<issue>8</issue>):<fpage>4563</fpage>–<lpage>4568</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1073/pnas.081068098" xlink:type="simple">10.1073/pnas.081068098</ext-link></comment></mixed-citation>
</ref>
<ref id="pcbi.1006650.ref079">
<label>79</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Lemey</surname> <given-names>P</given-names></name>, <name name-style="western"><surname>Rambaut</surname> <given-names>A</given-names></name>, <name name-style="western"><surname>Drummond</surname> <given-names>AJ</given-names></name>, <name name-style="western"><surname>Suchard</surname> <given-names>MA</given-names></name>. <article-title>Bayesian phylogeography finds its roots</article-title>. <source>PLoS computational biology</source>. <year>2009</year>;<volume>5</volume>(<issue>9</issue>):<fpage>e1000520</fpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1371/journal.pcbi.1000520" xlink:type="simple">10.1371/journal.pcbi.1000520</ext-link></comment> <object-id pub-id-type="pmid">19779555</object-id></mixed-citation>
</ref>
<ref id="pcbi.1006650.ref080">
<label>80</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Lemey</surname> <given-names>P</given-names></name>, <name name-style="western"><surname>Rambaut</surname> <given-names>A</given-names></name>, <name name-style="western"><surname>Welch</surname> <given-names>JJ</given-names></name>, <name name-style="western"><surname>Suchard</surname> <given-names>MA</given-names></name>. <article-title>Phylogeography takes a relaxed random walk in continuous space and time</article-title>. <source>Molecular biology and evolution</source>. <year>2010</year>;<volume>27</volume>(<issue>8</issue>):<fpage>1877</fpage>–<lpage>1885</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1093/molbev/msq067" xlink:type="simple">10.1093/molbev/msq067</ext-link></comment> <object-id pub-id-type="pmid">20203288</object-id></mixed-citation>
</ref>
<ref id="pcbi.1006650.ref081">
<label>81</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Lemey</surname> <given-names>P</given-names></name>, <name name-style="western"><surname>Rambaut</surname> <given-names>A</given-names></name>, <name name-style="western"><surname>Bedford</surname> <given-names>T</given-names></name>, <name name-style="western"><surname>Faria</surname> <given-names>N</given-names></name>, <name name-style="western"><surname>Bielejec</surname> <given-names>F</given-names></name>, <name name-style="western"><surname>Baele</surname> <given-names>G</given-names></name>, <etal>et al</etal>. <article-title>Unifying viral genetics and human transportation data to predict the global transmission dynamics of human influenza H3N2</article-title>. <source>PLoS pathogens</source>. <year>2014</year>;<volume>10</volume>(<issue>2</issue>):<fpage>e1003932</fpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1371/journal.ppat.1003932" xlink:type="simple">10.1371/journal.ppat.1003932</ext-link></comment> <object-id pub-id-type="pmid">24586153</object-id></mixed-citation>
</ref>
<ref id="pcbi.1006650.ref082">
<label>82</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Degnan</surname> <given-names>JH</given-names></name>, <name name-style="western"><surname>Rosenberg</surname> <given-names>NA</given-names></name>. <article-title>Gene tree discordance, phylogenetic inference and the multispecies coalescent</article-title>. <source>Trends in Ecology &amp; Evolution</source>. <year>2009</year>;<volume>24</volume>(<issue>6</issue>):<fpage>332</fpage>–<lpage>340</lpage>. <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1016/j.tree.2009.01.009" xlink:type="simple">https://doi.org/10.1016/j.tree.2009.01.009</ext-link>.</mixed-citation>
</ref>
<ref id="pcbi.1006650.ref083">
<label>83</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Degnan</surname> <given-names>JH</given-names></name>, <name name-style="western"><surname>Rosenberg</surname> <given-names>NA</given-names></name>. <article-title>Discordance of Species Trees with Their Most Likely Gene Trees</article-title>. <source>PLOS Genetics</source>. <year>2006</year>;<volume>2</volume>(<issue>5</issue>):<fpage>e68</fpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1371/journal.pgen.0020068" xlink:type="simple">10.1371/journal.pgen.0020068</ext-link></comment></mixed-citation>
</ref>
<ref id="pcbi.1006650.ref084">
<label>84</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Roch</surname> <given-names>S</given-names></name>, <name name-style="western"><surname>Steel</surname> <given-names>M</given-names></name>. <article-title>Likelihood-based tree reconstruction on a concatenation of aligned sequence data sets can be statistically inconsistent</article-title>. <source>Theoretical Population Biology</source>. <year>2015</year>;<volume>100</volume>:<fpage>56</fpage>–<lpage>62</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1016/j.tpb.2014.12.005" xlink:type="simple">10.1016/j.tpb.2014.12.005</ext-link></comment></mixed-citation>
</ref>
<ref id="pcbi.1006650.ref085">
<label>85</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Mendes</surname> <given-names>FK</given-names></name>, <name name-style="western"><surname>Hahn</surname> <given-names>MW</given-names></name>. <article-title>Why Concatenation Fails Near the Anomaly Zone</article-title>. <source>Systematic Biology</source>. <year>2018</year>;<volume>67</volume>(<issue>1</issue>):<fpage>158</fpage>–<lpage>169</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1093/sysbio/syx063" xlink:type="simple">10.1093/sysbio/syx063</ext-link></comment> <object-id pub-id-type="pmid">28973673</object-id></mixed-citation>
</ref>
<ref id="pcbi.1006650.ref086">
<label>86</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Mendes</surname> <given-names>FK</given-names></name>, <name name-style="western"><surname>Hahn</surname> <given-names>MW</given-names></name>. <article-title>Gene Tree Discordance Causes Apparent Substitution Rate Variation</article-title>. <source>Systematic Biology</source>. <year>2016</year>;<volume>65</volume>(<issue>4</issue>):<fpage>711</fpage>–<lpage>721</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1093/sysbio/syw018" xlink:type="simple">10.1093/sysbio/syw018</ext-link></comment> <object-id pub-id-type="pmid">26927960</object-id></mixed-citation>
</ref>
<ref id="pcbi.1006650.ref087">
<label>87</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Nichols</surname> <given-names>R</given-names></name>. <article-title>Gene trees and species trees are not the same</article-title>. <source>Trends in Ecology &amp; Evolution</source>. <year>2001</year>;<volume>16</volume>(<issue>7</issue>):<fpage>358</fpage>–<lpage>364</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1016/S0169-5347(01)02203-0" xlink:type="simple">10.1016/S0169-5347(01)02203-0</ext-link></comment></mixed-citation>
</ref>
<ref id="pcbi.1006650.ref088">
<label>88</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Heled</surname> <given-names>J</given-names></name>, <name name-style="western"><surname>Drummond</surname> <given-names>AJ</given-names></name>. <article-title>Bayesian Inference of Species Trees from Multilocus Data</article-title>. <source>Molecular Biology and Evolution</source>. <year>2010</year>;<volume>27</volume>(<issue>3</issue>):<fpage>570</fpage>–<lpage>580</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1093/molbev/msp274" xlink:type="simple">10.1093/molbev/msp274</ext-link></comment> <object-id pub-id-type="pmid">19906793</object-id></mixed-citation>
</ref>
<ref id="pcbi.1006650.ref089">
<label>89</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Jones</surname> <given-names>G</given-names></name>, <name name-style="western"><surname>Aydin</surname> <given-names>Z</given-names></name>, <name name-style="western"><surname>Oxelman</surname> <given-names>B</given-names></name>. <article-title>DISSECT: an assignment-free Bayesian discovery method for species delimitation under the multispecies coalescent</article-title>. <source>Bioinformatics</source>. <year>2015</year>;<volume>31</volume>(<issue>7</issue>):<fpage>991</fpage>–<lpage>998</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1093/bioinformatics/btu770" xlink:type="simple">10.1093/bioinformatics/btu770</ext-link></comment> <object-id pub-id-type="pmid">25422051</object-id></mixed-citation>
</ref>
<ref id="pcbi.1006650.ref090">
<label>90</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Vitecek</surname> <given-names>S</given-names></name>, <name name-style="western"><surname>Kučinić</surname> <given-names>M</given-names></name>, <name name-style="western"><surname>Previšić</surname> <given-names>A</given-names></name>, <name name-style="western"><surname>Živić</surname> <given-names>I</given-names></name>, <name name-style="western"><surname>Stojanović</surname> <given-names>K</given-names></name>, <name name-style="western"><surname>Keresztes</surname> <given-names>L</given-names></name>, <etal>et al</etal>. <article-title>Integrative taxonomy by molecular species delimitation: multi-locus data corroborate a new species of Balkan Drusinae micro-endemics</article-title>. <source>BMC Evolutionary Biology</source>. <year>2017</year>;<volume>17</volume>(<issue>1</issue>):<fpage>129</fpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1186/s12862-017-0972-5" xlink:type="simple">10.1186/s12862-017-0972-5</ext-link></comment> <object-id pub-id-type="pmid">28587671</object-id></mixed-citation>
</ref>
<ref id="pcbi.1006650.ref091">
<label>91</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Singh</surname> <given-names>G</given-names></name>, <name name-style="western"><surname>Dal Grande</surname> <given-names>F</given-names></name>, <name name-style="western"><surname>Divakar</surname> <given-names>PK</given-names></name>, <name name-style="western"><surname>Otte</surname> <given-names>J</given-names></name>, <name name-style="western"><surname>Crespo</surname> <given-names>A</given-names></name>, <name name-style="western"><surname>Schmitt</surname> <given-names>I</given-names></name>. <article-title>Fungal–algal association patterns in lichen symbiosis linked to macroclimate</article-title>. <source>New Phytologist</source>. <year>2017</year>;<volume>214</volume>(<issue>1</issue>):<fpage>317</fpage>–<lpage>329</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1111/nph.14366" xlink:type="simple">10.1111/nph.14366</ext-link></comment> <object-id pub-id-type="pmid">27918622</object-id></mixed-citation>
</ref>
<ref id="pcbi.1006650.ref092">
<label>92</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Moran</surname> <given-names>PAP</given-names></name>. <article-title>Random processes in genetics</article-title>. <source>Mathematical Proceedings of the Cambridge Philosophical Society</source>. <year>1958</year>;<volume>54</volume>(<issue>1</issue>):<fpage>60</fpage>–<lpage>71</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1017/S0305004100033193" xlink:type="simple">10.1017/S0305004100033193</ext-link></comment></mixed-citation>
</ref>
<ref id="pcbi.1006650.ref093">
<label>93</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Wang</surname> <given-names>Y</given-names></name>, <name name-style="western"><surname>Rannala</surname> <given-names>B</given-names></name>. <article-title>Bayesian inference of fine-scale recombination rates using population genomic data</article-title>. <source>Philos Trans R Soc Lond B Biol Sci</source>. <year>2008</year>;<volume>363</volume>(<issue>1512</issue>):<fpage>3921</fpage>–<lpage>3930</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1098/rstb.2008.0172" xlink:type="simple">10.1098/rstb.2008.0172</ext-link></comment> <object-id pub-id-type="pmid">18852101</object-id></mixed-citation>
</ref>
<ref id="pcbi.1006650.ref094">
<label>94</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Bloomquist</surname> <given-names>EW</given-names></name>, <name name-style="western"><surname>Suchard</surname> <given-names>MA</given-names></name>. <article-title>Unifying vertical and nonvertical evolution: a stochastic ARG-based framework</article-title>. <source>Syst Biol</source>. <year>2010</year>;<volume>59</volume>(<issue>1</issue>):<fpage>27</fpage>–<lpage>41</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1093/sysbio/syp076" xlink:type="simple">10.1093/sysbio/syp076</ext-link></comment> <object-id pub-id-type="pmid">20525618</object-id></mixed-citation>
</ref>
<ref id="pcbi.1006650.ref095">
<label>95</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Meyer</surname> <given-names>BS</given-names></name>, <name name-style="western"><surname>Matschiner</surname> <given-names>M</given-names></name>, <name name-style="western"><surname>Salzburger</surname> <given-names>W</given-names></name>. <article-title>Disentangling incomplete lineage sorting and introgression to refine species-tree estimates for Lake Tanganyika cichlid fishes</article-title>. <source>Systematic Biology</source>. <year>2017</year>;<volume>66</volume>:<fpage>531</fpage>–<lpage>550</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1093/sysbio/syw069" xlink:type="simple">10.1093/sysbio/syw069</ext-link></comment> <object-id pub-id-type="pmid">27539485</object-id></mixed-citation>
</ref>
<ref id="pcbi.1006650.ref096">
<label>96</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Li</surname> <given-names>H</given-names></name>, <name name-style="western"><surname>Durbin</surname> <given-names>R</given-names></name>. <article-title>Inference of human population history from individual whole-genome sequences</article-title>. <source>Nature</source>. <year>2011</year>;<volume>475</volume>(<issue>7357</issue>):<fpage>493</fpage>–<lpage>496</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1038/nature10231" xlink:type="simple">10.1038/nature10231</ext-link></comment> <object-id pub-id-type="pmid">21753753</object-id></mixed-citation>
</ref>
<ref id="pcbi.1006650.ref097">
<label>97</label>
<mixed-citation publication-type="other" xlink:type="simple">Barroso GV, Puzovic N, Dutheil J. Inference of recombination maps from a single pair of genomes and its application to archaic samples. bioRxiv. 2018.</mixed-citation>
</ref>
<ref id="pcbi.1006650.ref098">
<label>98</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Francis</surname> <given-names>AR</given-names></name>, <name name-style="western"><surname>Steel</surname> <given-names>M</given-names></name>. <article-title>Which Phylogenetic Networks are Merely Trees with Additional Arcs?</article-title> <source>Systematic Biology</source>. <year>2015</year>;<volume>64</volume>(<issue>5</issue>):<fpage>768</fpage>–<lpage>777</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1093/sysbio/syv037" xlink:type="simple">10.1093/sysbio/syv037</ext-link></comment> <object-id pub-id-type="pmid">26070685</object-id></mixed-citation>
</ref>
<ref id="pcbi.1006650.ref099">
<label>99</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Yu</surname> <given-names>Y</given-names></name>, <name name-style="western"><surname>Degnan</surname> <given-names>JH</given-names></name>, <name name-style="western"><surname>Nakhleh</surname> <given-names>L</given-names></name>. <article-title>The Probability of a Gene Tree Topology within a Phylogenetic Network with Applications to Hybridization Detection</article-title>. <source>PLOS Genetics</source>. <year>2012</year>;<volume>8</volume>(<issue>4</issue>):<fpage>1</fpage>–<lpage>10</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1371/journal.pgen.1002660" xlink:type="simple">10.1371/journal.pgen.1002660</ext-link></comment></mixed-citation>
</ref>
<ref id="pcbi.1006650.ref100">
<label>100</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Wen</surname> <given-names>D</given-names></name>, <name name-style="western"><surname>Yu</surname> <given-names>Y</given-names></name>, <name name-style="western"><surname>Nakhleh</surname> <given-names>L</given-names></name>. <article-title>Bayesian Inference of Reticulate Phylogenies under the Multispecies Network Coalescent</article-title>. <source>PLOS Genetics</source>. <year>2016</year>;<volume>12</volume>(<issue>5</issue>):<fpage>1</fpage>–<lpage>17</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1371/journal.pgen.1006006" xlink:type="simple">10.1371/journal.pgen.1006006</ext-link></comment></mixed-citation>
</ref>
<ref id="pcbi.1006650.ref101">
<label>101</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Nielsen</surname> <given-names>R</given-names></name>, <name name-style="western"><surname>Wakeley</surname> <given-names>J</given-names></name>. <article-title>Distinguishing migration from isolation: a Markov chain Monte Carlo approach</article-title>. <source>Genetics</source>. <year>2001</year>;<volume>158</volume>(<issue>2</issue>):<fpage>885</fpage>–<lpage>896</lpage>. <object-id pub-id-type="pmid">11404349</object-id></mixed-citation>
</ref>
<ref id="pcbi.1006650.ref102">
<label>102</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Leaché</surname> <given-names>AD</given-names></name>, <name name-style="western"><surname>Harris</surname> <given-names>RB</given-names></name>, <name name-style="western"><surname>Rannala</surname> <given-names>B</given-names></name>, <name name-style="western"><surname>Yang</surname> <given-names>Z</given-names></name>. <article-title>The influence of gene flow on species tree estimation: a simulation study</article-title>. <source>Syst Biol</source>. <year>2014</year>;<volume>63</volume>(<issue>1</issue>):<fpage>17</fpage>–<lpage>30</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1093/sysbio/syt049" xlink:type="simple">10.1093/sysbio/syt049</ext-link></comment> <object-id pub-id-type="pmid">23945075</object-id></mixed-citation>
</ref>
<ref id="pcbi.1006650.ref103">
<label>103</label>
<mixed-citation publication-type="book" xlink:type="simple">
<name name-style="western"><surname>Konings</surname> <given-names>A</given-names></name>. <source>Tanganyika Cichlids in Their Natural Habitat</source>. <publisher-name>Cichlid Press</publisher-name>, <publisher-loc>El Paso, TX</publisher-loc>; <year>2015</year>.</mixed-citation>
</ref>
<ref id="pcbi.1006650.ref104">
<label>104</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Salzburger</surname> <given-names>W</given-names></name>, <name name-style="western"><surname>Baric</surname> <given-names>S</given-names></name>, <name name-style="western"><surname>Sturmbauer</surname> <given-names>C</given-names></name>. <article-title>Speciation via introgressive hybridization in East African cichlids?</article-title> <source>Molecular Ecology</source>. <year>2002</year>;<volume>11</volume>:<fpage>619</fpage>–<lpage>625</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1046/j.0962-1083.2001.01438.x" xlink:type="simple">10.1046/j.0962-1083.2001.01438.x</ext-link></comment> <object-id pub-id-type="pmid">11918795</object-id></mixed-citation>
</ref>
<ref id="pcbi.1006650.ref105">
<label>105</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Brawand</surname> <given-names>D</given-names></name>, <name name-style="western"><surname>Wagner</surname> <given-names>CE</given-names></name>, <name name-style="western"><surname>Li</surname> <given-names>YI</given-names></name>, <name name-style="western"><surname>Malinsky</surname> <given-names>M</given-names></name>, <name name-style="western"><surname>Keller</surname> <given-names>I</given-names></name>, <name name-style="western"><surname>Fan</surname> <given-names>S</given-names></name>, <etal>et al</etal>. <article-title>The genomic substrate for adaptive radiation in African cichlid fish</article-title>. <source>Nature</source>. <year>2014</year>;<volume>513</volume>:<fpage>375</fpage>–<lpage>381</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1038/nature13726" xlink:type="simple">10.1038/nature13726</ext-link></comment> <object-id pub-id-type="pmid">25186727</object-id></mixed-citation>
</ref>
<ref id="pcbi.1006650.ref106">
<label>106</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Gante</surname> <given-names>HF</given-names></name>, <name name-style="western"><surname>Matschiner</surname> <given-names>M</given-names></name>, <name name-style="western"><surname>Malmstrøm</surname> <given-names>M</given-names></name>, <name name-style="western"><surname>Jakobsen</surname> <given-names>KS</given-names></name>, <name name-style="western"><surname>Jentoft</surname> <given-names>S</given-names></name>, <name name-style="western"><surname>Salzburger</surname> <given-names>W</given-names></name>. <article-title>Genomics of speciation and introgression in Princess cichlid fishes from Lake Tanganyika</article-title>. <source>Molecular Ecology</source>. <year>2016</year>;<volume>25</volume>(<issue>24</issue>):<fpage>6143</fpage>–<lpage>6161</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1111/mec.13767" xlink:type="simple">10.1111/mec.13767</ext-link></comment> <object-id pub-id-type="pmid">27452499</object-id></mixed-citation>
</ref>
<ref id="pcbi.1006650.ref107">
<label>107</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Malmstrøm</surname> <given-names>M</given-names></name>, <name name-style="western"><surname>Matschiner</surname> <given-names>M</given-names></name>, <name name-style="western"><surname>Tørresen</surname> <given-names>OK</given-names></name>, <name name-style="western"><surname>Star</surname> <given-names>B</given-names></name>, <name name-style="western"><surname>Snipen</surname> <given-names>LG</given-names></name>, <name name-style="western"><surname>Hansen</surname> <given-names>TF</given-names></name>, <etal>et al</etal>. <article-title>Evolution of the immune system influences speciation rates in teleost fishes</article-title>. <source>Nat Genet</source>. <year>2016</year>;<volume>48</volume>(<issue>10</issue>):<fpage>1204</fpage>–<lpage>1210</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1038/ng.3645" xlink:type="simple">10.1038/ng.3645</ext-link></comment> <object-id pub-id-type="pmid">27548311</object-id></mixed-citation>
</ref>
<ref id="pcbi.1006650.ref108">
<label>108</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Lewis</surname> <given-names>PO</given-names></name>, <name name-style="western"><surname>Xie</surname> <given-names>W</given-names></name>, <name name-style="western"><surname>Chen</surname> <given-names>MH</given-names></name>, <name name-style="western"><surname>Fan</surname> <given-names>Y</given-names></name>, <name name-style="western"><surname>Kuo</surname> <given-names>L</given-names></name>. <article-title>Posterior predictive Bayesian phylogenetic model selection</article-title>. <source>Systematic Biology</source>. <year>2013</year>;<volume>63</volume>(<issue>3</issue>):<fpage>309</fpage>–<lpage>321</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1093/sysbio/syt068" xlink:type="simple">10.1093/sysbio/syt068</ext-link></comment> <object-id pub-id-type="pmid">24193892</object-id></mixed-citation>
</ref>
<ref id="pcbi.1006650.ref109">
<label>109</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Fan</surname> <given-names>Y</given-names></name>, <name name-style="western"><surname>Wu</surname> <given-names>R</given-names></name>, <name name-style="western"><surname>Chen</surname> <given-names>MH</given-names></name>, <name name-style="western"><surname>Kuo</surname> <given-names>L</given-names></name>, <name name-style="western"><surname>Lewis</surname> <given-names>PO</given-names></name>. <article-title>Choosing among partition models in Bayesian phylogenetics</article-title>. <source>Molecular Biology and Evolution</source>. <year>2010</year>;<volume>28</volume>(<issue>1</issue>):<fpage>523</fpage>–<lpage>532</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1093/molbev/msq224" xlink:type="simple">10.1093/molbev/msq224</ext-link></comment> <object-id pub-id-type="pmid">20801907</object-id></mixed-citation>
</ref>
<ref id="pcbi.1006650.ref110">
<label>110</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Skilling</surname> <given-names>J</given-names></name>. <article-title>Nested sampling for general Bayesian computation</article-title>. <source>Bayesian Analysis</source>. <year>2006</year>;<volume>1</volume>(<issue>4</issue>):<fpage>833</fpage>–<lpage>859</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1214/06-BA127" xlink:type="simple">10.1214/06-BA127</ext-link></comment></mixed-citation>
</ref>
<ref id="pcbi.1006650.ref111">
<label>111</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Bollback</surname> <given-names>JP</given-names></name>. <article-title>Bayesian model adequacy and choice in phylogenetics</article-title>. <source>Molecular Biology and Evolution</source>. <year>2002</year>;<volume>19</volume>(<issue>7</issue>):<fpage>1171</fpage>–<lpage>1180</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1093/oxfordjournals.molbev.a004175" xlink:type="simple">10.1093/oxfordjournals.molbev.a004175</ext-link></comment> <object-id pub-id-type="pmid">12082136</object-id></mixed-citation>
</ref>
<ref id="pcbi.1006650.ref112">
<label>112</label>
<mixed-citation publication-type="book" xlink:type="simple">
<name name-style="western"><surname>Gelman</surname> <given-names>A</given-names></name>, <name name-style="western"><surname>Stern</surname> <given-names>HS</given-names></name>, <name name-style="western"><surname>Carlin</surname> <given-names>JB</given-names></name>, <name name-style="western"><surname>Dunson</surname> <given-names>DB</given-names></name>, <name name-style="western"><surname>Vehtari</surname> <given-names>A</given-names></name>, <name name-style="western"><surname>Rubin</surname> <given-names>DB</given-names></name>. <source>Bayesian data analysis</source>. <publisher-name>Chapman and Hall/CRC</publisher-name>; <year>2013</year>.</mixed-citation>
</ref>
<ref id="pcbi.1006650.ref113">
<label>113</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Höhna</surname> <given-names>S</given-names></name>, <name name-style="western"><surname>Coghill</surname> <given-names>LM</given-names></name>, <name name-style="western"><surname>Mount</surname> <given-names>GG</given-names></name>, <name name-style="western"><surname>Thomson</surname> <given-names>RC</given-names></name>, <name name-style="western"><surname>Brown</surname> <given-names>JM</given-names></name>. <article-title>P3: Phylogenetic posterior prediction in RevBayes</article-title>. <source>Molecular Biology and Evolution</source>. <year>2017</year>;<volume>35</volume>(<issue>4</issue>):<fpage>1028</fpage>–<lpage>1034</lpage>.</mixed-citation>
</ref>
<ref id="pcbi.1006650.ref114">
<label>114</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Greenhill</surname> <given-names>SJ</given-names></name>, <name name-style="western"><surname>Blust</surname> <given-names>R</given-names></name>, <name name-style="western"><surname>Gray</surname> <given-names>RD</given-names></name>. <article-title>The Austronesian basic vocabulary database: from bioinformatics to lexomics</article-title>. <source>Evolutionary Bioinformatics Online</source>. <year>2008</year>;<volume>4</volume>:<fpage>271</fpage>. <object-id pub-id-type="pmid">19204825</object-id></mixed-citation>
</ref>
<ref id="pcbi.1006650.ref115">
<label>115</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Bouckaert</surname> <given-names>R</given-names></name>, <name name-style="western"><surname>Lemey</surname> <given-names>P</given-names></name>, <name name-style="western"><surname>Dunn</surname> <given-names>M</given-names></name>, <name name-style="western"><surname>Greenhill</surname> <given-names>SJ</given-names></name>, <name name-style="western"><surname>Alekseyenko</surname> <given-names>AV</given-names></name>, <name name-style="western"><surname>Drummond</surname> <given-names>AJ</given-names></name>, <etal>et al</etal>. <article-title>Mapping the origins and expansion of the Indo-European language family</article-title>. <source>Science</source>. <year>2012</year>;<volume>337</volume>(<issue>6097</issue>):<fpage>957</fpage>–<lpage>960</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1126/science.1219669" xlink:type="simple">10.1126/science.1219669</ext-link></comment> <object-id pub-id-type="pmid">22923579</object-id></mixed-citation>
</ref>
<ref id="pcbi.1006650.ref116">
<label>116</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Barido-Sottani</surname> <given-names>J</given-names></name>, <name name-style="western"><surname>Bošková</surname> <given-names>V</given-names></name>, <name name-style="western"><surname>du Plessis</surname> <given-names>L</given-names></name>, <name name-style="western"><surname>Kühnert</surname> <given-names>D</given-names></name>, <name name-style="western"><surname>Magnus</surname> <given-names>C</given-names></name>, <name name-style="western"><surname>Mitov</surname> <given-names>V</given-names></name>, <etal>et al</etal>. <article-title>Taming the BEAST—A Community Teaching Material Resource for BEAST 2</article-title>. <source>Systematic Biology</source>. <year>2017</year>;<volume>67</volume>(<issue>1</issue>):<fpage>170</fpage>–<lpage>174</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1093/sysbio/syx060" xlink:type="simple">10.1093/sysbio/syx060</ext-link></comment></mixed-citation>
</ref>
<ref id="pcbi.1006650.ref117">
<label>117</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Suchard</surname> <given-names>MA</given-names></name>, <name name-style="western"><surname>Lemey</surname> <given-names>P</given-names></name>, <name name-style="western"><surname>Baele</surname> <given-names>G</given-names></name>, <name name-style="western"><surname>Ayres</surname> <given-names>DL</given-names></name>, <name name-style="western"><surname>Drummond</surname> <given-names>AJ</given-names></name>, <name name-style="western"><surname>Rambaut</surname> <given-names>A</given-names></name>. <article-title>Bayesian phylogenetic and phylodynamic data integration using BEAST 1.10</article-title>. <source>Virus Evol</source>. <year>2018</year>;<volume>4</volume>(<issue>1</issue>):<fpage>vey016</fpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1093/ve/vey016" xlink:type="simple">10.1093/ve/vey016</ext-link></comment> <object-id pub-id-type="pmid">29942656</object-id></mixed-citation>
</ref>
<ref id="pcbi.1006650.ref118">
<label>118</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Höhna</surname> <given-names>S</given-names></name>, <name name-style="western"><surname>Landis</surname> <given-names>MJ</given-names></name>, <name name-style="western"><surname>Heath</surname> <given-names>TA</given-names></name>, <name name-style="western"><surname>Boussau</surname> <given-names>B</given-names></name>, <name name-style="western"><surname>Lartillot</surname> <given-names>N</given-names></name>, <name name-style="western"><surname>Moore</surname> <given-names>BR</given-names></name>, <etal>et al</etal>. <article-title>RevBayes: Bayesian Phylogenetic Inference Using Graphical Models and an Interactive Model-Specification Language</article-title>. <source>Syst Biol</source>. <year>2016</year>;<volume>65</volume>(<issue>4</issue>):<fpage>726</fpage>–<lpage>736</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1093/sysbio/syw021" xlink:type="simple">10.1093/sysbio/syw021</ext-link></comment> <object-id pub-id-type="pmid">27235697</object-id></mixed-citation>
</ref>
</ref-list>
</back>
</article>