<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article
  PUBLIC "-//NLM//DTD Journal Publishing DTD v3.0 20080202//EN" "http://dtd.nlm.nih.gov/publishing/3.0/journalpublishing3.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="3.0" xml:lang="EN">
<front>
<journal-meta><journal-id journal-id-type="nlm-ta">PLoS ONE</journal-id><journal-id journal-id-type="publisher-id">plos</journal-id><journal-id journal-id-type="pmc">plosone</journal-id><!--===== Grouping journal title elements =====--><journal-title-group><journal-title>PLoS ONE</journal-title></journal-title-group><issn pub-type="epub">1932-6203</issn><publisher>
<publisher-name>Public Library of Science</publisher-name>
<publisher-loc>San Francisco, USA</publisher-loc></publisher></journal-meta>
<article-meta><article-id pub-id-type="publisher-id">08-PONE-RA-06075</article-id><article-id pub-id-type="doi">10.1371/journal.pone.0003527</article-id><article-categories><subj-group subj-group-type="heading"><subject>Research Article</subject></subj-group><subj-group subj-group-type="Discipline"><subject>Genetics and Genomics/Chromosome Biology</subject><subject>Genetics and Genomics/Comparative Genomics</subject><subject>Infectious Diseases/Protozoal Infections</subject></subj-group></article-categories><title-group><article-title>Telomeric Expression Sites Are Highly Conserved in <italic>Trypanosoma brucei</italic></article-title><alt-title alt-title-type="running-head">Architecture of <italic>T. brucei</italic> BESs</alt-title></title-group><contrib-group>
<contrib contrib-type="author" equal-contrib="yes" xlink:type="simple"><name name-style="western"><surname>Hertz-Fowler</surname><given-names>Christiane</given-names></name><xref ref-type="aff" rid="aff1"><sup>1</sup></xref><xref ref-type="corresp" rid="cor1"><sup>*</sup></xref></contrib>
<contrib contrib-type="author" equal-contrib="yes" xlink:type="simple"><name name-style="western"><surname>Figueiredo</surname><given-names>Luisa M.</given-names></name><xref ref-type="aff" rid="aff2"><sup>2</sup></xref></contrib>
<contrib contrib-type="author" xlink:type="simple"><name name-style="western"><surname>Quail</surname><given-names>Michael A.</given-names></name><xref ref-type="aff" rid="aff1"><sup>1</sup></xref></contrib>
<contrib contrib-type="author" xlink:type="simple"><name name-style="western"><surname>Becker</surname><given-names>Marion</given-names></name><xref ref-type="aff" rid="aff3"><sup>3</sup></xref></contrib>
<contrib contrib-type="author" xlink:type="simple"><name name-style="western"><surname>Jackson</surname><given-names>Andrew</given-names></name><xref ref-type="aff" rid="aff1"><sup>1</sup></xref></contrib>
<contrib contrib-type="author" xlink:type="simple"><name name-style="western"><surname>Bason</surname><given-names>Nathalie</given-names></name><xref ref-type="aff" rid="aff1"><sup>1</sup></xref></contrib>
<contrib contrib-type="author" xlink:type="simple"><name name-style="western"><surname>Brooks</surname><given-names>Karen</given-names></name><xref ref-type="aff" rid="aff1"><sup>1</sup></xref></contrib>
<contrib contrib-type="author" xlink:type="simple"><name name-style="western"><surname>Churcher</surname><given-names>Carol</given-names></name><xref ref-type="aff" rid="aff1"><sup>1</sup></xref></contrib>
<contrib contrib-type="author" xlink:type="simple"><name name-style="western"><surname>Fahkro</surname><given-names>Samah</given-names></name><xref ref-type="aff" rid="aff1"><sup>1</sup></xref></contrib>
<contrib contrib-type="author" xlink:type="simple"><name name-style="western"><surname>Goodhead</surname><given-names>Ian</given-names></name><xref ref-type="aff" rid="aff1"><sup>1</sup></xref><xref ref-type="fn" rid="fn1"><sup>¤</sup></xref></contrib>
<contrib contrib-type="author" xlink:type="simple"><name name-style="western"><surname>Heath</surname><given-names>Paul</given-names></name><xref ref-type="aff" rid="aff1"><sup>1</sup></xref></contrib>
<contrib contrib-type="author" xlink:type="simple"><name name-style="western"><surname>Kartvelishvili</surname><given-names>Magdalena</given-names></name><xref ref-type="aff" rid="aff2"><sup>2</sup></xref></contrib>
<contrib contrib-type="author" xlink:type="simple"><name name-style="western"><surname>Mungall</surname><given-names>Karen</given-names></name><xref ref-type="aff" rid="aff1"><sup>1</sup></xref></contrib>
<contrib contrib-type="author" xlink:type="simple"><name name-style="western"><surname>Harris</surname><given-names>David</given-names></name><xref ref-type="aff" rid="aff1"><sup>1</sup></xref></contrib>
<contrib contrib-type="author" xlink:type="simple"><name name-style="western"><surname>Hauser</surname><given-names>Heidi</given-names></name><xref ref-type="aff" rid="aff1"><sup>1</sup></xref></contrib>
<contrib contrib-type="author" xlink:type="simple"><name name-style="western"><surname>Sanders</surname><given-names>Mandy</given-names></name><xref ref-type="aff" rid="aff1"><sup>1</sup></xref></contrib>
<contrib contrib-type="author" xlink:type="simple"><name name-style="western"><surname>Saunders</surname><given-names>David</given-names></name><xref ref-type="aff" rid="aff1"><sup>1</sup></xref></contrib>
<contrib contrib-type="author" xlink:type="simple"><name name-style="western"><surname>Seeger</surname><given-names>Kathy</given-names></name><xref ref-type="aff" rid="aff1"><sup>1</sup></xref></contrib>
<contrib contrib-type="author" xlink:type="simple"><name name-style="western"><surname>Sharp</surname><given-names>Sarah</given-names></name><xref ref-type="aff" rid="aff3"><sup>3</sup></xref></contrib>
<contrib contrib-type="author" xlink:type="simple"><name name-style="western"><surname>Taylor</surname><given-names>Jesse E.</given-names></name><xref ref-type="aff" rid="aff4"><sup>4</sup></xref></contrib>
<contrib contrib-type="author" xlink:type="simple"><name name-style="western"><surname>Walker</surname><given-names>Danielle</given-names></name><xref ref-type="aff" rid="aff1"><sup>1</sup></xref></contrib>
<contrib contrib-type="author" xlink:type="simple"><name name-style="western"><surname>White</surname><given-names>Brian</given-names></name><xref ref-type="aff" rid="aff1"><sup>1</sup></xref></contrib>
<contrib contrib-type="author" xlink:type="simple"><name name-style="western"><surname>Young</surname><given-names>Rosanna</given-names></name><xref ref-type="aff" rid="aff5"><sup>5</sup></xref></contrib>
<contrib contrib-type="author" xlink:type="simple"><name name-style="western"><surname>Cross</surname><given-names>George A. M.</given-names></name><xref ref-type="aff" rid="aff2"><sup>2</sup></xref></contrib>
<contrib contrib-type="author" xlink:type="simple"><name name-style="western"><surname>Rudenko</surname><given-names>Gloria</given-names></name><xref ref-type="aff" rid="aff5"><sup>5</sup></xref></contrib>
<contrib contrib-type="author" xlink:type="simple"><name name-style="western"><surname>Barry</surname><given-names>J. David</given-names></name><xref ref-type="aff" rid="aff6"><sup>6</sup></xref></contrib>
<contrib contrib-type="author" xlink:type="simple"><name name-style="western"><surname>Louis</surname><given-names>Edward J.</given-names></name><xref ref-type="aff" rid="aff3"><sup>3</sup></xref></contrib>
<contrib contrib-type="author" xlink:type="simple"><name name-style="western"><surname>Berriman</surname><given-names>Matthew</given-names></name><xref ref-type="aff" rid="aff1"><sup>1</sup></xref></contrib>
</contrib-group><aff id="aff1"><label>1</label><addr-line>Wellcome Trust Sanger Institute, Wellcome Trust Genome Campus, Hinxton, United Kingdom</addr-line>       </aff><aff id="aff2"><label>2</label><addr-line>The Rockefeller University, New York, New York, United States of America</addr-line>       </aff><aff id="aff3"><label>3</label><addr-line>Institute of Genetics, The University of Nottingham Queen's Medical Centre, Nottingham, United Kingdom</addr-line>       </aff><aff id="aff4"><label>4</label><addr-line>Department of Statistics, University of Oxford, Oxford, United Kingdom</addr-line>       </aff><aff id="aff5"><label>5</label><addr-line>The Peter Medawar Building for Pathogen Research, University of Oxford, Oxford, United Kingdom</addr-line>       </aff><aff id="aff6"><label>6</label><addr-line>Wellcome Centre for Molecular Parasitology, University of Glasgow, Glasgow, United Kingdom</addr-line>       </aff><contrib-group>
<contrib contrib-type="editor" xlink:type="simple"><name name-style="western"><surname>Hall</surname><given-names>Neil</given-names></name>
<role>Editor</role>
<xref ref-type="aff" rid="edit1"/></contrib>
</contrib-group><aff id="edit1">University of Liverpool, United Kingdom</aff><author-notes>
<corresp id="cor1">* E-mail: <email xlink:type="simple">chf@sanger.ac.uk</email></corresp>
<fn fn-type="con"><p>Conceived and designed the experiments: CHF LMF MQ MB APJ GC GR JDB EJL MB. Performed the experiments: CHF LMF MQ MB APJ NB KB CC SF IG PH MK KM DH HH MS DS KS SS DW BW RY. Analyzed the data: CHF LMF MB APJ KB CC KM HH MS JET RY GC GR JDB EJL MB. Contributed reagents/materials/analysis tools: CHF LMF MQ MB APJ JET RY GR EJL MB. Wrote the paper: CHF LMF MB APJ GC GR JDB EJL.</p></fn>
<fn fn-type="current-aff" id="fn1"><label>¤</label><p>Current address: School of Biological Sciences, University of Liverpool, Liverpool, United Kingdom</p></fn>
<fn fn-type="conflict"><p>The authors have declared that no competing interests exist.</p></fn></author-notes><pub-date pub-type="collection"><year>2008</year></pub-date><pub-date pub-type="epub"><day>27</day><month>10</month><year>2008</year></pub-date><volume>3</volume><issue>10</issue><elocation-id>e3527</elocation-id><history>
<date date-type="received"><day>21</day><month>8</month><year>2008</year></date>
<date date-type="accepted"><day>23</day><month>9</month><year>2008</year></date>
</history><!--===== Grouping copyright info into permissions =====--><permissions><copyright-year>2008</copyright-year><copyright-holder>Hertz-Fowler et al</copyright-holder><license><license-p>This is an open-access article distributed under the terms of the Creative Commons Attribution License, which permits unrestricted use, distribution, and reproduction in any medium, provided the original author and source are credited.</license-p></license></permissions><abstract>
<p>Subtelomeric regions are often under-represented in genome sequences of eukaryotes. One of the best known examples of the use of telomere proximity for adaptive purposes are the bloodstream expression sites (BESs) of the African trypanosome <italic>Trypanosoma brucei</italic>. To enhance our understanding of BES structure and function in host adaptation and immune evasion, the BES repertoire from the Lister 427 strain of <italic>T. brucei</italic> were independently tagged and sequenced. BESs are polymorphic in size and structure but reveal a surprisingly conserved architecture in the context of extensive recombination. Very small BESs do exist and many functioning BESs do not contain the full complement of expression site associated genes (<italic>ESAG</italic>s). The consequences of duplicated or missing <italic>ESAG</italic>s, including <italic>ESAG9</italic>, a newly named <italic>ESAG12</italic>, and additional variant surface glycoprotein genes (<italic>VSG</italic>s) were evaluated by functional assays after BESs were tagged with a drug-resistance gene. Phylogenetic analysis of constituent <italic>ESAG</italic> families suggests that BESs are sequence mosaics and that extensive recombination has shaped the evolution of the BES repertoire. This work opens important perspectives in understanding the molecular mechanisms of antigenic variation, a widely used strategy for immune evasion in pathogens, and telomere biology.</p>
</abstract><funding-group><funding-statement>The Wellcome Trust supports the Sanger Institute Pathogen Genomics group. LMF, MK and GAMC are supported in part by Grant Number R01AI021729 from the National Institute of Allergy And Infectious Diseases (NIAID). The funders had no role in study design, data collection and analysis, decision to publish, or preparation of the manuscript.</funding-statement></funding-group><counts><page-count count="12"/></counts></article-meta>
</front>
<body><sec id="s1">
<title>Introduction</title>
<p>Subtelomeres are dynamic and fast-evolving regions of eukaryotic genomes owing to their remarkable plasticity <xref ref-type="bibr" rid="pone.0003527-Mefford1">[1]</xref>–<xref ref-type="bibr" rid="pone.0003527-Fedorova1">[3]</xref>. Recombination between internal repeats and chromosomal arms results in the accumulation of species-specific sequences, commonly mediating adaptation to the environment. Despite their extreme genetic diversity, common aspects of structure and function are shared across telomeres from a diverse range of organisms <xref ref-type="bibr" rid="pone.0003527-Pryde1">[4]</xref>.</p>
<p>The ability to encode contingency functions within their subtelomeric regions has been exploited by the African Trypanosome, subspecies of which cause the debilitating disease Human African Trypanosomiasis and the related disease ‘nagana’ in livestock [reviewed in <xref ref-type="bibr" rid="pone.0003527-Horn1">[2]</xref>. <italic>Trypanosoma brucei</italic> evades the mammalian host's immune response by periodically changing its variant surface glycoprotein (VSG) coat (reviewed in: <xref ref-type="bibr" rid="pone.0003527-Pays1">[5]</xref>), a dense monolayer of 5×10<sup>6</sup> identical VSG dimers. The expressed <italic>VSG</italic> is located in specialised subtelomeric transcription units known as the Bloodstream Expression Sites (BES). The total number of BESs is dependent on the subspecies and strain but is believed to be about 20 for the <italic>T. brucei</italic> Lister 427 strain <xref ref-type="bibr" rid="pone.0003527-Navarro1">[6]</xref> used in the present study. To change the VSG coat, transcription is switched to an alternative <italic>VSG</italic> by recombination of a new <italic>VSG</italic> into the active BES or by transcriptional silencing of one BES with concomitant activation of a second.</p>
<p>Sequencing of a few BESs has revealed a diverse range of 11 polymorphic genes, called Expression Site Associated Genes (<italic>ESAG</italic>s) <xref ref-type="bibr" rid="pone.0003527-Redpath1">[7]</xref>, few of which have been functionally characterised: <italic>ESAG3</italic>, <italic>ESAG5</italic> and <italic>ESAG11</italic> encode membrane-associated or membrane-targeted proteins <xref ref-type="bibr" rid="pone.0003527-Pays2">[8]</xref>; <italic>ESAG4</italic> encodes a putative transmembrane receptor with adenylate cyclase activity <xref ref-type="bibr" rid="pone.0003527-Paindavoine1">[9]</xref>; <italic>ESAG6</italic> and <italic>ESAG7</italic> encode subunits of a heterodimeric receptor that mediates uptake of host transferrin <xref ref-type="bibr" rid="pone.0003527-Ligtenberg1">[10]</xref>, <xref ref-type="bibr" rid="pone.0003527-Salmon1">[11]</xref>; <italic>ESAG8</italic> encodes a putative nuclear DNA-binding protein <xref ref-type="bibr" rid="pone.0003527-Hoek1">[12]</xref>, <xref ref-type="bibr" rid="pone.0003527-Hoek2">[13]</xref>; <italic>ESAG10</italic> encodes a homologue of the <italic>Leishmania</italic> biopterin transporter <xref ref-type="bibr" rid="pone.0003527-Gottesdiener1">[14]</xref> whilst <italic>ESAG9</italic> <xref ref-type="bibr" rid="pone.0003527-Florent1">[15]</xref> has an unknown function. As many <italic>ESAG</italic>s are members of large families and are dispersed in the genome <xref ref-type="bibr" rid="pone.0003527-Carruthers1">[16]</xref>–<xref ref-type="bibr" rid="pone.0003527-Berriman1">[18]</xref>, and as a low level of transcription occurs even from ‘inactive’ BESs, determining the precise function of individual <italic>ESAG</italic>s in active expression sites is challenging.</p>
<p>In an effort to systematically analyse the BES repertoire of a single clone, a library of transformation-associated recombination (TAR) clones was made <xref ref-type="bibr" rid="pone.0003527-Becker1">[19]</xref>. In the present study, sequence analysis revealed that the 19 TAR clones fall into 14 distinct BES groups. Independently, 13 randomly tagged BESs were constructed and analyzed, confirming the structures and re-defining the minimal gene complement of a functional BES for survival in culture.</p>
<p>Patterns of sequence variation between different <italic>ESAG</italic> families were analysed revealing that expression sites are sequence mosaics - related to each other differently depending on the gene family examined - and highlighting the significant role that recombination between gene families has played in forming BES sequences. In characterising a complete BES repertoire these results provide a perspective on nucleotide diversity, but also on the mechanisms regulating their origins and diversity.</p>
</sec><sec id="s2">
<title>Results</title>
<p>Two independent approaches were undertaken. First, BESs were randomly tagged with a G418-resistance gene, and we will refer to these clones as ‘<italic>NEO</italic>-tagged’. Second, TAR-cloned BESs were sequenced, and we will refer to these clones either by their TAR clone number or by the BES to which they have been assigned.</p>
<sec id="s2a">
<title>Tagging BESs</title>
<p><italic>T. brucei</italic> cell lines tagged with two drug-resistance markers were generated to select parasites that had stochastically activated an individually tagged BES from the background of highly similar BESs. The active BES1 was tagged with a Puromycin resistance gene (<italic>PUR</italic>), immediately downstream of the promoter. In the remaining silent BESs, transcription initiates at the BES promoter but is rapidly attenuated. This low level of transcriptional activity allowed the integration of a Neomycin resistance gene (<italic>NEO</italic>) immediately downstream of a second ‘silent’ BES promoter. In this way, we obtained 30 double-tagged clones. Each randomly <italic>NEO</italic>-tagged BES was typed according to its <italic>ESAG6</italic> hypervariable region, the distance between the <italic>ESAG6</italic> gene and the promoter, the number of BES promoters, and the sequence of the expressed <italic>VSG</italic> upon BES activation. Analysis of the 30 <italic>NEO</italic>-tagged clones and comparison to the TAR clones showed that 13 different BESs were tagged: BES1, 2, 3, 4, 5, 7, 8, 12, 13, 14, 15a and 15b (a duplicated BES, see below) and 17 (<xref ref-type="table" rid="pone-0003527-t001">Tables 1</xref> and <xref ref-type="table" rid="pone-0003527-t002">2</xref>). All tagged BES could be activated <italic>in vitro</italic>, except for BES8. Characterisation of these clones confirmed many of the apparently anomalous structures revealed by the TAR sequences (see below). The only two cloned BESs that were not tagged were BES10 and BES11 (<xref ref-type="table" rid="pone-0003527-t001">Tables 1</xref> and <xref ref-type="table" rid="pone-0003527-t002">2</xref>).</p>
<table-wrap id="pone-0003527-t001" position="float"><object-id pub-id-type="doi">10.1371/journal.pone.0003527.t001</object-id><label>Table 1</label><caption>
<title>BES overview.</title>
</caption><!--===== Grouping alternate versions of objects =====--><alternatives><graphic id="pone-0003527-t001-1" mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pone.0003527.t001" xlink:type="simple"/><table><colgroup span="1"><col align="left" span="1"/><col align="center" span="1"/><col align="center" span="1"/><col align="center" span="1"/><col align="center" span="1"/><col align="center" span="1"/><col align="center" span="1"/><col align="center" span="1"/><col align="center" span="1"/><col align="center" span="1"/><col align="center" span="1"/><col align="center" span="1"/></colgroup>
<thead>
<tr>
<td align="left" colspan="1" rowspan="1">BES</td>
<td align="left" colspan="1" rowspan="1">TAR clone sequenced</td>
<td align="left" colspan="3" rowspan="1"><italic>Nomenclature of VSG</italic> genes</td>
<td align="left" colspan="3" rowspan="1">Deviation from conserved architecture</td>
<td align="left" colspan="1" rowspan="1"><italic>Drug-resistance</italic> tagged clone</td>
<td align="left" colspan="1" rowspan="1"><italic>NEO</italic>-tagged clone consistent with sequenced TAR clone</td>
<td align="left" colspan="1" rowspan="1">BES could be activated <italic>in vitro</italic></td>
<td align="left" colspan="1" rowspan="1">Genome localisation: type and size (Mb) of chromosome</td>
</tr>
<tr>
<td align="left" colspan="1" rowspan="1"/>
<td align="left" colspan="1" rowspan="1"/>
<td align="left" colspan="1" rowspan="1"><italic>2008</italic></td>
<td align="left" colspan="1" rowspan="1"><italic>Lab-specific</italic></td>
<td align="left" colspan="1" rowspan="1"><italic>MITat</italic></td>
<td align="left" colspan="1" rowspan="1">Multiple copies of ESAGs?</td>
<td align="left" colspan="1" rowspan="1">Missing ESAGs?</td>
<td align="left" colspan="1" rowspan="1">Other</td>
<td align="left" colspan="1" rowspan="1"/>
<td align="left" colspan="1" rowspan="1"/>
<td align="left" colspan="1" rowspan="1"/>
<td align="left" colspan="1" rowspan="1"/>
</tr>
</thead>
<tbody>
<tr>
<td align="left" colspan="1" rowspan="1">1 (a)</td>
<td align="left" colspan="1" rowspan="1">40</td>
<td align="left" colspan="1" rowspan="1">427-2</td>
<td align="left" colspan="1" rowspan="1">221</td>
<td align="left" colspan="1" rowspan="1">MITat 1.2</td>
<td align="left" colspan="1" rowspan="1">large-scale</td>
<td align="left" colspan="1" rowspan="1">-</td>
<td align="left" colspan="1" rowspan="1">70 bp-repeat array (×2)</td>
<td align="left" colspan="1" rowspan="1">Yes</td>
<td align="left" colspan="1" rowspan="1">-</td>
<td align="left" colspan="1" rowspan="1">Yes</td>
<td align="left" colspan="1" rowspan="1">MBC-3.0</td>
</tr>
<tr>
<td align="left" colspan="1" rowspan="1">2 (a)</td>
<td align="left" colspan="1" rowspan="1">129</td>
<td align="left" colspan="1" rowspan="1">427-9</td>
<td align="left" colspan="1" rowspan="1">VO2</td>
<td align="left" colspan="1" rowspan="1">MITat 1.9</td>
<td align="left" colspan="1" rowspan="1">7 (×2)</td>
<td align="left" colspan="1" rowspan="1">-</td>
<td align="left" colspan="1" rowspan="1">ingi element 3′ of 70-bp repeat</td>
<td align="left" colspan="1" rowspan="1">Yes</td>
<td align="left" colspan="1" rowspan="1">Yes</td>
<td align="left" colspan="1" rowspan="1">Yes</td>
<td align="left" colspan="1" rowspan="1">IC-0.325</td>
</tr>
<tr>
<td align="left" colspan="1" rowspan="1">3</td>
<td align="left" colspan="1" rowspan="1">2, 15</td>
<td align="left" colspan="1" rowspan="1">427-6</td>
<td align="left" colspan="1" rowspan="1">121</td>
<td align="left" colspan="1" rowspan="1">MITat 1.6</td>
<td align="left" colspan="1" rowspan="1">-</td>
<td align="left" colspan="1" rowspan="1">-</td>
<td align="left" colspan="1" rowspan="1"/>
<td align="left" colspan="1" rowspan="1">Yes</td>
<td align="left" colspan="1" rowspan="1">Yes</td>
<td align="left" colspan="1" rowspan="1">Yes</td>
<td align="left" colspan="1" rowspan="1">MBC-2.05</td>
</tr>
<tr>
<td align="left" colspan="1" rowspan="1">4</td>
<td align="left" colspan="1" rowspan="1">3, 28</td>
<td align="left" colspan="1" rowspan="1">427-21</td>
<td align="left" colspan="1" rowspan="1">T3</td>
<td align="left" colspan="1" rowspan="1">MITat 1.21</td>
<td align="left" colspan="1" rowspan="1">7 (×3)</td>
<td align="left" colspan="1" rowspan="1">-</td>
<td align="left" colspan="1" rowspan="1">VSG ψ 3′ of 70-bp repeat</td>
<td align="left" colspan="1" rowspan="1">Yes</td>
<td align="left" colspan="1" rowspan="1">Yes</td>
<td align="left" colspan="1" rowspan="1">Yes</td>
<td align="left" colspan="1" rowspan="1">IC-0.250</td>
</tr>
<tr>
<td align="left" colspan="1" rowspan="1">5</td>
<td align="left" colspan="1" rowspan="1">98</td>
<td align="left" colspan="1" rowspan="1">427-18</td>
<td align="left" colspan="1" rowspan="1">800</td>
<td align="left" colspan="1" rowspan="1">MITat 1.18</td>
<td align="left" colspan="1" rowspan="1">-</td>
<td align="left" colspan="1" rowspan="1">-</td>
<td align="left" colspan="1" rowspan="1"/>
<td align="left" colspan="1" rowspan="1">Yes</td>
<td align="left" colspan="1" rowspan="1">No (c)</td>
<td align="left" colspan="1" rowspan="1">Yes</td>
<td align="left" colspan="1" rowspan="1">MBC-1.95</td>
</tr>
<tr>
<td align="left" colspan="1" rowspan="1">7</td>
<td align="left" colspan="1" rowspan="1">65 (b), 153</td>
<td align="left" colspan="1" rowspan="1">427-3</td>
<td align="left" colspan="1" rowspan="1">224</td>
<td align="left" colspan="1" rowspan="1">MITat 1.3</td>
<td align="left" colspan="1" rowspan="1">6 (×2)</td>
<td align="left" colspan="1" rowspan="1">7</td>
<td align="left" colspan="1" rowspan="1"><italic>ESAG3</italic> ψ 3′ of 70-bp repeat</td>
<td align="left" colspan="1" rowspan="1">Yes</td>
<td align="left" colspan="1" rowspan="1">Yes</td>
<td align="left" colspan="1" rowspan="1">Yes</td>
<td align="left" colspan="1" rowspan="1">MBC &gt;3.1</td>
</tr>
<tr>
<td align="left" colspan="1" rowspan="1">8</td>
<td align="left" colspan="1" rowspan="1">64</td>
<td align="left" colspan="1" rowspan="1">427-14</td>
<td align="left" colspan="1" rowspan="1">-</td>
<td align="left" colspan="1" rowspan="1">MITat 1.14</td>
<td align="left" colspan="1" rowspan="1">-</td>
<td align="left" colspan="1" rowspan="1">1,2,3,4,5,6,8,9,11</td>
<td align="left" colspan="1" rowspan="1">Single <italic>ESAG7</italic> gene</td>
<td align="left" colspan="1" rowspan="1">Yes</td>
<td align="left" colspan="1" rowspan="1">No (c)</td>
<td align="left" colspan="1" rowspan="1">No</td>
<td align="left" colspan="1" rowspan="1">MBC &gt;3.1</td>
</tr>
<tr>
<td align="left" colspan="1" rowspan="1">10</td>
<td align="left" colspan="1" rowspan="1">134</td>
<td align="left" colspan="1" rowspan="1">427-15</td>
<td align="left" colspan="1" rowspan="1">-</td>
<td align="left" colspan="1" rowspan="1">MITat 1.15</td>
<td align="left" colspan="1" rowspan="1">-</td>
<td align="left" colspan="1" rowspan="1">1,2,3,4,8,11</td>
<td align="left" colspan="1" rowspan="1">23 bp trace of 70-bp repeat</td>
<td align="left" colspan="1" rowspan="1">No</td>
<td align="left" colspan="1" rowspan="1">N/A</td>
<td align="left" colspan="1" rowspan="1">N/A</td>
<td align="left" colspan="1" rowspan="1">IC-0.450</td>
</tr>
<tr>
<td align="left" colspan="1" rowspan="1">11</td>
<td align="left" colspan="1" rowspan="1">122</td>
<td align="left" colspan="1" rowspan="1">427-16</td>
<td align="left" colspan="1" rowspan="1">-</td>
<td align="left" colspan="1" rowspan="1">MITat 1.16</td>
<td align="left" colspan="1" rowspan="1">4 (×2)</td>
<td align="left" colspan="1" rowspan="1">1,2,11</td>
<td align="left" colspan="1" rowspan="1">additional <italic>VSG</italic> ψ; copy of <italic>ESAG9</italic></td>
<td align="left" colspan="1" rowspan="1">No</td>
<td align="left" colspan="1" rowspan="1">N/A</td>
<td align="left" colspan="1" rowspan="1">N/A</td>
<td align="left" colspan="1" rowspan="1">IC-0.180</td>
</tr>
<tr>
<td align="left" colspan="1" rowspan="1">12</td>
<td align="left" colspan="1" rowspan="1">29</td>
<td align="left" colspan="1" rowspan="1">427-8</td>
<td align="left" colspan="1" rowspan="1">OD1</td>
<td align="left" colspan="1" rowspan="1">MITat 1.8</td>
<td align="left" colspan="1" rowspan="1">-</td>
<td align="left" colspan="1" rowspan="1">3,4,8</td>
<td align="left" colspan="1" rowspan="1"/>
<td align="left" colspan="1" rowspan="1">Yes</td>
<td align="left" colspan="1" rowspan="1">Yes</td>
<td align="left" colspan="1" rowspan="1">Yes</td>
<td align="left" colspan="1" rowspan="1">MBC-1.7</td>
</tr>
<tr>
<td align="left" colspan="1" rowspan="1">13</td>
<td align="left" colspan="1" rowspan="1">56</td>
<td align="left" colspan="1" rowspan="1">427-17</td>
<td align="left" colspan="1" rowspan="1">JS1</td>
<td align="left" colspan="1" rowspan="1">MITat 1.17</td>
<td align="left" colspan="1" rowspan="1">8 (×2)</td>
<td align="left" colspan="1" rowspan="1">-</td>
<td align="left" colspan="1" rowspan="1"/>
<td align="left" colspan="1" rowspan="1">Yes</td>
<td align="left" colspan="1" rowspan="1">Yes</td>
<td align="left" colspan="1" rowspan="1">Yes</td>
<td align="left" colspan="1" rowspan="1">IC-0.180</td>
</tr>
<tr>
<td align="left" colspan="1" rowspan="1">14</td>
<td align="left" colspan="1" rowspan="1">10</td>
<td align="left" colspan="1" rowspan="1">427-19</td>
<td align="left" colspan="1" rowspan="1">-</td>
<td align="left" colspan="1" rowspan="1">MITat 1.19</td>
<td align="left" colspan="1" rowspan="1">-</td>
<td align="left" colspan="1" rowspan="1">3,4,8</td>
<td align="left" colspan="1" rowspan="1">2 additional <italic>VSG</italic> ψs; 70 bp-repeat array (×2)</td>
<td align="left" colspan="1" rowspan="1">No</td>
<td align="left" colspan="1" rowspan="1">N/A</td>
<td align="left" colspan="1" rowspan="1">N/A</td>
<td align="left" colspan="1" rowspan="1">N/A</td>
</tr>
<tr>
<td align="left" colspan="1" rowspan="1"/>
<td align="left" colspan="1" rowspan="1">117 (not sequenced)</td>
<td align="left" colspan="1" rowspan="1">427-8</td>
<td align="left" colspan="1" rowspan="1">OD1</td>
<td align="left" colspan="1" rowspan="1">MITat 1.8</td>
<td align="left" colspan="1" rowspan="1">N/A</td>
<td align="left" colspan="1" rowspan="1">N/A</td>
<td align="left" colspan="1" rowspan="1">N/A</td>
<td align="left" colspan="1" rowspan="1">Yes</td>
<td align="left" colspan="1" rowspan="1">Yes</td>
<td align="left" colspan="1" rowspan="1">Yes</td>
<td align="left" colspan="1" rowspan="1">MBC &gt;3.1</td>
</tr>
<tr>
<td align="left" colspan="1" rowspan="1">15 (two copies: 15a, 15b)</td>
<td align="left" colspan="1" rowspan="1">126</td>
<td align="left" colspan="1" rowspan="1">427-11</td>
<td align="left" colspan="1" rowspan="1">bR-2</td>
<td align="left" colspan="1" rowspan="1">MITat 1.11</td>
<td align="left" colspan="1" rowspan="1">-</td>
<td align="left" colspan="1" rowspan="1">-</td>
<td align="left" colspan="1" rowspan="1"><italic>ESAG8(×2)</italic>; <italic>VSG</italic> ψ (×2); <italic>ESAG3</italic> ψ (×2); 70 bp-repeat array (×2)</td>
<td align="left" colspan="1" rowspan="1">Yes (15a &amp; 15b)</td>
<td align="left" colspan="1" rowspan="1">Yes</td>
<td align="left" colspan="1" rowspan="1">Yes</td>
<td align="left" colspan="1" rowspan="1">2 MBC: 1.35, 1.7</td>
</tr>
<tr>
<td align="left" colspan="1" rowspan="1">16</td>
<td align="left" colspan="1" rowspan="1">128 (d)</td>
<td align="left" colspan="1" rowspan="1">427-2</td>
<td align="left" colspan="1" rowspan="1">221</td>
<td align="left" colspan="1" rowspan="1">MITat 1.2</td>
<td align="left" colspan="1" rowspan="1">N/A</td>
<td align="left" colspan="1" rowspan="1">N/A</td>
<td align="left" colspan="1" rowspan="1">N/A</td>
<td align="left" colspan="1" rowspan="1">N/A</td>
<td align="left" colspan="1" rowspan="1">N/A</td>
<td align="left" colspan="1" rowspan="1">N/A</td>
<td align="left" colspan="1" rowspan="1">N/A</td>
</tr>
<tr>
<td align="left" colspan="1" rowspan="1">17 (a)</td>
<td align="left" colspan="1" rowspan="1">51 (b), 59</td>
<td align="left" colspan="1" rowspan="1">427-13</td>
<td align="left" colspan="1" rowspan="1">NA1</td>
<td align="left" colspan="1" rowspan="1">MITat 1.13</td>
<td align="left" colspan="1" rowspan="1">-</td>
<td align="left" colspan="1" rowspan="1">-</td>
<td align="left" colspan="1" rowspan="1">-</td>
<td align="left" colspan="1" rowspan="1">Yes</td>
<td align="left" colspan="1" rowspan="1">Yes</td>
<td align="left" colspan="1" rowspan="1">Yes</td>
<td align="left" colspan="1" rowspan="1">IC-0.295</td>
</tr>
</tbody>
</table></alternatives><table-wrap-foot><fn id="nt101"><p>In this paper, we propose a new simple and logical <italic>VSG</italic> nomenclature. The hyphenated name indicates the <italic>T. brucei</italic> strain, followed by a number that identifies each unique <italic>VSG</italic>. For very closely related (probably antigenically indistinguishable) members of a <italic>VSG</italic> family, the number may be followed by a lower-case letter (for example Lister 427-3). When no misunderstanding can occur between strains under discussion in a particular context, the strain information may be omitted and the <italic>VSG</italic> referred to only by its number (for example, VSG 3). ND: not determined; N/A: not applicable; IC: intermediate chromosome; MBC: Megabase chromosome. (a) BES1, 2 and 17 had been previously cloned in BACs and identified as 221 ES, VO2 ES and Bn-2 ES, respectively <xref ref-type="bibr" rid="pone.0003527-Berriman2">[27]</xref>. (b) TAR65 and TAR51 were re-classified as belonging to BES group 7 and 17, respectively, based on global alignments showing sequence identity along the length of the sequence. The only differences were found in the promoter region, the target site for recombination during construction of the library. (c) Restriction mapping of the NEO tagged BES suggests the existence of two promoters, whereas the TAR clone has a single promoter. (d) TAR clone 128 is likely to be a recombinant between expression sites belonging to BES groups 1 and 15 (see text).</p></fn></table-wrap-foot></table-wrap><table-wrap id="pone-0003527-t002" position="float"><object-id pub-id-type="doi">10.1371/journal.pone.0003527.t002</object-id><label>Table 2</label><caption>
<title>Summary of the number of TAR clones sequenced, BES identified and BES activated.</title>
</caption><!--===== Grouping alternate versions of objects =====--><alternatives><graphic id="pone-0003527-t002-2" mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pone.0003527.t002" xlink:type="simple"/><table><colgroup span="1"><col align="left" span="1"/><col align="center" span="1"/><col align="center" span="1"/><col align="center" span="1"/></colgroup>
<thead>
<tr>
<td align="left" colspan="1" rowspan="1"/>
<td align="left" colspan="1" rowspan="1">Number</td>
<td align="left" colspan="1" rowspan="1">TAR clones or BES</td>
<td align="left" colspan="1" rowspan="1">TAR clones or BES missing</td>
</tr>
</thead>
<tbody>
<tr>
<td align="left" colspan="1" rowspan="1">TAR clones</td>
<td align="left" colspan="1" rowspan="1">19</td>
<td align="left" colspan="1" rowspan="1">40, 129, 2, 15, 3, 28, 98, 65, 153, 64, 134, 122, 29, 56, 10, 126, 128, 51, 59</td>
<td align="left" colspan="1" rowspan="1">TAR128 is probably a recombination artifact</td>
</tr>
<tr>
<td align="left" colspan="1" rowspan="1">Unique BES</td>
<td align="left" colspan="1" rowspan="1">14</td>
<td align="left" colspan="1" rowspan="1">1, 2, 3, 4, 5, 7, 8, 10, 11, 12, 13, 14, 15, 17</td>
<td align="left" colspan="1" rowspan="1">TAR2 and TAR3 were duplicates of TAR15 and TAR28, respectively; TAR51 and TAR65 were re-classified</td>
</tr>
<tr>
<td align="left" colspan="1" rowspan="1">All BES</td>
<td align="left" colspan="1" rowspan="1">15</td>
<td align="left" colspan="1" rowspan="1">1, 2, 3, 4, 5, 7, 8, 10, 11, 12, 13, 14, 15a+15b, 17</td>
<td align="left" colspan="1" rowspan="1">BES15 is present in two copies in the genome</td>
</tr>
<tr>
<td align="left" colspan="1" rowspan="1">Tagged BES</td>
<td align="left" colspan="1" rowspan="1">13</td>
<td align="left" colspan="1" rowspan="1">1, 2, 3, 4, 5, 7, 8, 12, 13, 14, 15a+15b, 17</td>
<td align="left" colspan="1" rowspan="1">BES10 and BES11 were not tagged</td>
</tr>
<tr>
<td align="left" colspan="1" rowspan="1">Functional tagged BES</td>
<td align="left" colspan="1" rowspan="1">12</td>
<td align="left" colspan="1" rowspan="1">1, 2, 3, 4, 5, 7, 12, 13, 14, 15a+15b, 17</td>
<td align="left" colspan="1" rowspan="1">BES8 was tagged with NEO gene, but no G418-resistant clones could be obtained.</td>
</tr>
</tbody>
</table></alternatives></table-wrap></sec><sec id="s2b">
<title>Chromosomal localization of BESs</title>
<p>The chromosome containing each BES (indicated by arrows in <xref ref-type="fig" rid="pone-0003527-g001">Figure 1</xref>) was identified by Southern blotting of PFGE-separated chromosomal DNA with <italic>NEO</italic> and <italic>VSG</italic> probes (<xref ref-type="fig" rid="pone-0003527-g001">Figure 1</xref>). It had been shown previously that BES2 is located on an intermediate chromosome <xref ref-type="bibr" rid="pone.0003527-Rudenko1">[20]</xref>. We now show that BES4, BES10, BES11, BES13 and BES17 are also present in this chromosome class and that the megabase-sized chromosomes encode all remaining BES, consistent with previous reports <xref ref-type="bibr" rid="pone.0003527-Melville1">[21]</xref>.</p>
<fig id="pone-0003527-g001" position="float"><object-id pub-id-type="doi">10.1371/journal.pone.0003527.g001</object-id><label>Figure 1</label><caption>
<title>Chromosomal distribution of BES-resident <italic>VSG</italic>s.</title>
<p>Red arrows indicate BES randomly tagged in this study with <italic>NEO</italic>. Open arrows indicate BES activated by <xref ref-type="bibr" rid="pone.0003527-Aitcheson1">[58]</xref> and subsequently tagged. Names of <italic>VSG</italic> genes are indicated at the bottom, using the newly proposed strain-specific numbering (top row) and lab-specific names (bottom row). BES10 and 11 were not tagged in either study. BES14 is represented in two lanes: 14* refers to TAR117 (which was not sequenced and harbours VSG8), whereas 14<sup>$</sup> refers to TAR10 (which was sequenced and harbours VSG9).</p>
</caption><graphic mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pone.0003527.g001" xlink:type="simple"/></fig>
<p>In some cases, the <italic>VSG</italic> probe hybridized with more than one chromosome, indicating that the genome contains multiple copies of the corresponding <italic>VSG</italic>. For instance, BES12 and BES14 contain <italic>VSG427-8</italic>, and BES15a and BES15b contain <italic>VSGbR-2/427-11</italic>, on megabase chromosomes of different sizes (<xref ref-type="supplementary-material" rid="pone.0003527.s002">Figures S1A and S1B</xref>, respectively). <italic>VSG121/427-6</italic> is present as a non-BES copy (Dreesen O., personal communication).</p>
</sec><sec id="s2c">
<title>Switching mechanism and frequency</title>
<p>The switching assay was designed to select for trypanosomes that had undergone an <italic>in situ</italic> switch by transcriptionally silencing BES1 and activating another BES without any DNA rearrangements. To assess the efficiency of selecting <italic>in situ</italic> switchers, Puromycin- and G418-resistant clones were analyzed by PFGE. If an <italic>in situ</italic> switch had occurred, the chromosomal locations of <italic>PUR</italic>, <italic>NEO</italic> and <italic>VSG</italic> should be unchanged: <italic>PUR</italic> and <italic>VSG221/427-2</italic> should be on chromosome VIa, whereas <italic>NEO</italic> and the newly identified <italic>VSG</italic> should be located on a different chromosome. PFGE analysis of 28 NEO-tagged clones that had activated different BES (2, 4, 5, 7, 13, 14, 15b and 17) confirmed that <italic>in situ</italic> switching was the predominant switching mechanism (15 switch events), but other switching mechanisms were also observed (<xref ref-type="fig" rid="pone-0003527-g002">Figure 2</xref>). In BES2- or BES15-tagged clones, for example, we observed that <italic>VSG221/427-2</italic> and <italic>PUR</italic> were deleted, whereas <italic>NEO</italic> and the new <italic>VSG</italic> remained in their original chromosomal location. This suggests that activation of BES5 and BES15 was accompanied by the truncation of BES1, a phenomenon previously reported for another BES <xref ref-type="bibr" rid="pone.0003527-Rudenko2">[22]</xref>. In three of the 28 cases studied, the active BES was replaced by duplicative transposition of the entire new BES. In switchers that activated BES7 (<xref ref-type="fig" rid="pone-0003527-g002">Figure 2B</xref>), BES13 or BES15b, <italic>VSG221/427-2</italic> and <italic>PUR</italic> were lost and <italic>NEO</italic> and the new <italic>VSG</italic> genes were duplicated onto chromosome VIa. This switching mechanism has been previously detected in switchers obtained in mice <xref ref-type="bibr" rid="pone.0003527-Pays3">[23]</xref> or by negative-selection <italic>in vitro </italic><xref ref-type="bibr" rid="pone.0003527-Cross1">[<italic>24</italic>]</xref>. In three cases, we observed unconventional recombination events that involved more than two chromosomes. These complicated VSG switch events that have undergone multiple DNA rearrangements have been previously documented <xref ref-type="bibr" rid="pone.0003527-Myler1">[25]</xref>.</p>
<fig id="pone-0003527-g002" position="float"><object-id pub-id-type="doi">10.1371/journal.pone.0003527.g002</object-id><label>Figure 2</label><caption>
<title>Types of switching mechanisms observed for tagged BES clones <italic>in vitro</italic>.</title>
<p>A. <italic>NEO</italic>-tagged clones have PUR in BES1 and <italic>NEO</italic> in an unknown BES. B. Example of a BES duplication. PFGE analysis of a BES7-tagged clone (17.9), when this BES is silent (S) and after activation. <italic>NEO</italic> and <italic>VSG3</italic> genes were duplicated onto the chromosome that originally contained <italic>PUR</italic> and <italic>VSG221/427-2</italic>. C. Quantification of the frequency of the different types of mechanisms. “Other” refers to recombination events that involved more than 2 chromosomes.</p>
</caption><graphic mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pone.0003527.g002" xlink:type="simple"/></fig>
<p>In our cell-lines, the frequency of switching between BES1 and a second BES can be measured as the ratio between the number of G418-resistant clones and the total number of starting cells. Switching frequency was measured for clones in which the <italic>NEO</italic> gene was in BES4, 5, 13, 15b and 17. Consistent with previous reports, the average frequency was around 2±3×10<sup>−6</sup> switchers/cell, with BES15 showing the lowest switching frequency (8.3×10<sup>−8</sup> switchers/cell) <xref ref-type="bibr" rid="pone.0003527-Rudenko1">[20]</xref>, <xref ref-type="bibr" rid="pone.0003527-Lamont1">[26]</xref>. However, it should be noted that these measurements were based on a small number of independent clones (usually 3). A larger-scale study would be necessary to assess if the differences of switching frequency are statistically significant and how those correlate with the DNA sequence of the activated BES.</p>
</sec><sec id="s2d">
<title>Sequencing and assembly of TAR clones</title>
<p>Nineteen TAR clones <xref ref-type="bibr" rid="pone.0003527-Becker1">[19]</xref> were sequenced, manually finished and analysed. This set represents 14 unique BESs, with TAR clones from BESs 9 and 16 having been re-classified (<xref ref-type="table" rid="pone-0003527-t002">Table 2</xref>). For each BES group, at least one clone was sequenced (<xref ref-type="fig" rid="pone-0003527-g003">Figure 3</xref>, <xref ref-type="table" rid="pone-0003527-t001">Table 1</xref>), choosing a larger sized clone wherever possible. Additional clones were sequenced for BES3 and BES4 to verify the sequence and clone integrity. Global alignments showed that TAR clones 2 and 15 (BES3) as well as 3 and 28 (BES4) are 100% identical at the DNA level with the exception of an <italic>ESAG7</italic> triplication in TAR28. In addition, TAR clones from BES1 (TAR40), BES2 (TAR129) and BES17 (TAR59) were compared to the same BES previously sequenced from a BAC library <xref ref-type="bibr" rid="pone.0003527-Berriman2">[27]</xref> and were 99%,100% and 99% identical, respectively, indicating that TAR cloning produced stable clones.</p>
<fig id="pone-0003527-g003" position="float"><object-id pub-id-type="doi">10.1371/journal.pone.0003527.g003</object-id><label>Figure 3</label><caption>
<title>Overview of <italic>T. brucei</italic> Lister 427 BES.</title>
<p>BES are drawn to scale and have been aligned at their 5′-most <italic>ESAG7</italic> or <italic>ESAG6</italic> sequence. The inset shows the regions conserved between the dual promoters present in some of the clones. The <italic>VSG</italic> indicated in front of the BES label refers to the telomere-proximal <italic>VSG</italic>.</p>
</caption><graphic mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pone.0003527.g003" xlink:type="simple"/></fig></sec><sec id="s2e">
<title>BES architecture</title>
<p>Eighteen of the TAR clones contain full-length BESs, ending in telomeric hexamer repeats, and the 14 BES types show a striking conservation in overall structure and order of <italic>ESAG</italic>s (<xref ref-type="fig" rid="pone-0003527-g003">Figure 3</xref>). The 5′ end of each TAR clone contains the BES promoter that was used as the recombination target during cloning. Half of the BESs have a second promoter approximately 13 kb upstream from the first <xref ref-type="bibr" rid="pone.0003527-Gottesdiener2">[28]</xref> which accounts for the differences in clone sizes observed in some of the BES groups. The region between the two promoters encodes <italic>ESAG10</italic> and a variety of pseudogenes that are commonly found in <italic>T. brucei</italic> subtelomeric regions (<xref ref-type="fig" rid="pone-0003527-g003">Figure 3</xref>). The presence of two promoters in some BES was confirmed by restriction mapping of the <italic>NEO</italic>-tagged clones. BES5 and BES8 were the only two discrepancies: <italic>NEO</italic>-tagged clones suggested the presence of 2 promoters, whereas TAR clones only had one, presumably because the downstream promoter was the target of the TAR cloning (<xref ref-type="supplementary-material" rid="pone.0003527.s004">Figure S3B</xref>). Downstream of the second promoter, the majority of sites encode polymorphic variants of <italic>ESAG7</italic>, <italic>ESAG6</italic>, <italic>ESAG5</italic>, <italic>ESAG3</italic>, <italic>ESAG4</italic>, <italic>ESAG8</italic>, <italic>ESAG3</italic>, <italic>ESAG2</italic>, <italic>ESAG11</italic> and <italic>ESAG1</italic>, in this conserved order. The only exception was an inversion between <italic>ESAG7</italic> and <italic>ESAG6</italic> in two BES groups (TAR29/BES12 and TAR56/BES13).</p>
<p>Nine BESs encode at least one copy of each <italic>ESAG</italic> (excluding <italic>ESAG10</italic>). We also observed frequent duplication of <italic>ESAG</italic>s, including a large-scale duplication in BES1 (TAR40), an ESAG7 triplication in BES4/TAR28 and three cases of divergent additional copies of <italic>ESAG8</italic> (BES1, BES13 and BES15).</p>
<p>The terminal <italic>VSG</italic>s are flanked upstream by tracts of 70-bp repeats, whose lengths vary in our assemblies between 0.2–7.1 kb, although this repeat region was only manually finished in 10 clones (<xref ref-type="fig" rid="pone-0003527-g003">Figure 3</xref>). The distance between the <italic>VSG</italic> and the telomeric repeats could be assessed in 17 TAR clones and ranged from 200–1590 nucleotides.</p>
<p>As described above, the analysis of the <italic>NEO</italic>-tagged clones was consistent with the analysis of TAR clones except in one case. Although VSG221/427-2 is a single-copy gene (<xref ref-type="fig" rid="pone-0003527-g001">Figure 1</xref>), we found it in both BES1/TAR40 and BES16/TAR128. The presence of VSG221/427-2 in BES1 has been firmly established from sequencing one BAC and two TAR clones. The promoter-proximal region (approx 40 kb) of TAR128 is identical to TAR126. Taken this data together, we conclude that TAR128 may be an artefact that resulted from recombination between BES1 and BES15. PCR analysis of additional TAR clones of BES16 failed to detect VSG221/427-2 (data not shown), further suggesting that TAR128 is not representative of BES16.</p>
</sec><sec id="s2f">
<title>Non-functional and novel BES genes</title>
<p>A defining feature shared by most BESs is the strict conservation of the 5′ copy of <italic>ESAG3</italic> and <italic>ESAG11</italic> as pseudogenes (<xref ref-type="fig" rid="pone-0003527-g003">Figure 3</xref>). The predominance of the latter is corroborated by a previous study describing the characterisation of this gene family <xref ref-type="bibr" rid="pone.0003527-Redpath1">[7]</xref>. In addition to these two pseudogenes, single frameshifts cause the presumed inactivation of <italic>ESAG4</italic> and <italic>ESAG5</italic> in some BESs. An analysis of <italic>ESAG</italic> processing signals gave further indication that some of the <italic>ESAGs</italic> may not localise correctly within the cell, including a number of <italic>ESAG4</italic> genes which lack sequences for surface targeting.</p>
<p>In five BESs (BESs 1, 2, 4, 5, 7) we identified a novel highly conserved putative protein coding sequence with a predicted signal peptide that we have designated ESAG12 (<xref ref-type="fig" rid="pone-0003527-g003">Figure 3</xref>). No functional clues could be discerned from sequence similarity or protein domain search results. A single homologue is found in the TREU 927 genome (Tb927.7.7510), although this is likely to be an under-representation due to the lack of subtelomeric sequence in the current TREU 927 genome assembly <xref ref-type="bibr" rid="pone.0003527-Berriman1">[18]</xref>.</p>
</sec><sec id="s2g">
<title>Some BES deviate from the overall conserved structure</title>
<p>Several BESs diverge from this conserved structure either by encoding additional sequences or because they represent truncated sites, lacking members of individual <italic>ESAG</italic> families. Most BES harbour only the <italic>VSG</italic> between the 70 bp-repeat array and the telomere (<xref ref-type="fig" rid="pone-0003527-g003">Figure 3</xref>). BESs 2, 4, 7 and 15 are exceptions to this rule, showing additional sequences (<italic>ingi</italic> element, <italic>VSG</italic> or <italic>ESAG3</italic> pseudogene). A further three sites encode duplicated regions of 70-bp repeats (BES1, 14 and 15), in each instance sandwiching <italic>VSG</italic> pseudogenes (see below). Five of the BES groups do not contain one or more of the expected <italic>ESAG</italic> repertoire. Amongst this set are:</p>
<p>BES7 (TARs 65,153) lacks <italic>ESAG7</italic>, but contains tandem copies of <italic>ESAG6</italic>, with different hypervariable regions, with <italic>ESAG6a</italic> resembling an <italic>ESAG6</italic>/<italic>ESAG7</italic> mosaic. This BES could be activated <italic>in vitro</italic> at the same frequency as other BESs. In order to investigate whether any DNA rearrangements have donated a copy of <italic>ESAG7</italic> to the newly activated BES7, DNA from cells with an active or silent BES7 were compared by PCR and restriction mapping (<xref ref-type="supplementary-material" rid="pone.0003527.s003">Figure S2</xref>). No differences were observed, suggesting that a BES lacking <italic>ESAG7</italic> can indeed be activated, confirming previous observations <xref ref-type="bibr" rid="pone.0003527-Ansorge1">[29]</xref>.</p>
<p>BES8 (TAR64) is unusually small and only contains a single copy of <italic>ESAG7</italic> followed by the 70-bp repeat region and the <italic>VSG</italic> (<xref ref-type="fig" rid="pone-0003527-g003">Figure 3</xref>). Long-range analysis of chromosomal DNA from a BES8-tagged clone digested with <italic>Apa</italic> I supported this finding, with the <italic>NEO and VSG427-14</italic>-hybridizing restriction fragment being only ∼20 kb in length (<xref ref-type="supplementary-material" rid="pone.0003527.s004">Figure S3A</xref>). Genotyping of the NEO-tagged clone confirmed the presence of ESAG7 and absence of <italic>ESAG6</italic> (data not shown). Attempts to activate this BES in two independent clones were unsuccessful, suggesting that this mini-BES may not be functional.</p>
<p>BES10 (TAR134) lacks the central portion (<italic>ESAG</italic> 4-8-3-2-11-1). TAR134 also encodes only a 23-bp fraction of a 70-bp repeat. This site was not among those that were tagged with a drug resistance marker, so its potential for activation could not be assessed.</p>
<p>BES14 (TAR10), also lacks the <italic>ESAG4</italic>-<italic>8-3</italic> gene cluster and has two <italic>VSG</italic> pseudogenes sandwiched between 70-bp repeat arrays. An inconsistency was found between the NEO-tagged clone and TAR sequence. The <italic>NEO</italic>-tagged clone did not harbour the <italic>VSG</italic> predicted by the TAR clone. Instead, the <italic>NEO</italic> tagged cell line expressed <italic>VSG427-8</italic> upon activation, rather than <italic>VSG427-19</italic>, as predicted by the TAR sequence. We confirmed by PFGE that the BES activation did not involve gene rearrangements (data not shown), indicating that <italic>VSG427-8</italic> was at the BES14 locus prior to activation. Further examination of the TAR clones in the BES14 set revealed TAR117 to correspond to the <italic>NEO</italic>-tagged clone. An interesting consequence of these results is that two BESs (BES12 and BES14) contain the <italic>VSG427-8</italic> gene (<xref ref-type="fig" rid="pone-0003527-g001">Figures 1</xref> and <xref ref-type="supplementary-material" rid="pone.0003527.s002">S1A</xref>).</p>
<p>In BES11 (TAR122), the <italic>ESAG2-11-1</italic> cluster has been replaced by a <italic>VSG</italic>-related gene (VR, <xref ref-type="fig" rid="pone-0003527-g003">Figure 3</xref>) and a full-length copy of <italic>ESAG9</italic>, the only copy found to date in a <italic>T. brucei</italic> BES. The <italic>VR</italic> gene is believed to be a <italic>VSG</italic> that has already evolved a new function and, like other <italic>VR</italic>s, has no 70-bp repeat sequences in its upstream flank <xref ref-type="bibr" rid="pone.0003527-Marcello1">[30]</xref>. Similarly to BES10, this site was not tagged with a drug selectable marker and therefore, activation <italic>in vitro</italic> could not be assessed.</p>
<p>BES12 (TAR29) has a deletion of the <italic>ESAG4-8-3</italic> cluster, but successful tagging and activation demonstrated that this site was functional <italic>in vitro</italic> (<xref ref-type="table" rid="pone-0003527-t001">Table 1</xref>).</p>
</sec><sec id="s2h">
<title>Investigating the forces driving BES diversity</title>
<p>In order to investigate the role of recombination in the evolution of bloodstream expressions sites, we examined changes in phylogenetic relationships along the BESs using two methods.</p>
<sec id="s2h1">
<title>Likelihood comparisons of optimal and constrained trees</title>
<p>There were obvious discrepancies between the optimal phylogenies for different <italic>ESAG</italic> loci, suggesting that the phylogenetic signal varied along the BESs. This was manifest in both the different shapes of ESAG trees and comparisons of their log-likelihood scores (<xref ref-type="fig" rid="pone-0003527-g004">Figures 4</xref> and <xref ref-type="supplementary-material" rid="pone.0003527.s005">S4</xref>). Comparing the likelihood score of an optimal topology for any given <italic>ESAG</italic> with the score obtained for a tree constrained with the signal of another <italic>ESAG</italic> locus, typically indicated a decrease in likelihood and therefore a decreased probability of shared histories. Indeed, the drop in likelihood was generally proportional with physical distance, such that topologies from different ends of the expression sites were most dissimilar (<xref ref-type="fig" rid="pone-0003527-g004">Figures 4</xref> and <xref ref-type="supplementary-material" rid="pone.0003527.s005">S4</xref>). Although topological differences between the phylogenies of neighbouring <italic>ESAG</italic>s were observed, these were non-significant and fell within the margins of systematic error. In fact, comparisons for all genes (<xref ref-type="supplementary-material" rid="pone.0003527.s005">Figure S4</xref>) showed that <italic>ESAG</italic>s fell into three clusters with regard to phylogenetic signal: <italic>ESAG</italic>s 7, 6 and <italic>5</italic>, <italic>ESAG</italic>s <italic>4</italic> and <italic>8</italic>, and <italic>ESAG</italic>s <italic>2</italic>, <italic>1</italic> and <italic>11</italic> with compatible phylogenetic signals within, but not between, these clusters.</p>
<fig id="pone-0003527-g004" position="float"><object-id pub-id-type="doi">10.1371/journal.pone.0003527.g004</object-id><label>Figure 4</label><caption>
<title>Quantifying the difference in phylogenetic signal along the bloodstream expression site.</title>
<p>A. Three tanglegrams relate the <italic>ESAG5</italic> phylogeny with those of <italic>ESAG6</italic> (close match), <italic>ESAG4</italic> (moderate incongruence) and <italic>ESAG1</italic> (severe incongruence). Dashed lines link corresponding expression sites in each tree. Incongruence between trees increases from left to right. B. Comparison of likelihood scores between optimal and constrained tree topologies for <italic>ESAG5</italic>. The phylogenies of six other <italic>ESAG</italic> loci (indicated by a cartoon of the expression site) were used to constrain the estimation of the <italic>ESAG5</italic> tree; the difference in likelihood score between each of these constrained trees and the optimal <italic>ESAG5</italic> tree is plotted along the expression site. Non-significant differences in likelihood are denoted by a dashed circle as evident when constraining the <italic>ESAG5</italic> topology with the <italic>ESAG6</italic> topology; however, enforcing the topologies of central loci (<italic>ESAGs 4</italic> and <italic>8</italic>) caused a moderate decrease in likelihood, whilst constraining with <italic>ESAG</italic>s <italic>2</italic>, <italic>11</italic> or <italic>1</italic> caused a larger decrease.</p>
</caption><graphic mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pone.0003527.g004" xlink:type="simple"/></fig></sec><sec id="s2h2">
<title>Recombination analyses</title>
<p>To examine the fine scale structure of recombination within the BESs, a genetic algorithm-based tool (GARD) <xref ref-type="bibr" rid="pone.0003527-KosakovskyPond1">[31]</xref> was used to infer the numbers and locations of recombination breakpoints. Although this method relies on phylogenetic incompatibility to deduce recombination, GARD differs from the constrained tree analyses described above in two important respects: (i) the locations of putative breakpoints are inferred rather than fixed <italic>a priori</italic>, allowing us to characterize recombination within individual loci, and (ii) GARD is able to detect gene conversion events that affect branch lengths but not tree topology. When applied to the nucleotide alignments of each <italic>ESAG</italic> locus and to five intergenic regions, this method identified a large number of recombination tracts with distinct phylogenetic histories (<xref ref-type="supplementary-material" rid="pone.0003527.s007">Tables S1</xref> and <xref ref-type="supplementary-material" rid="pone.0003527.s008">S2</xref>). Mean recombination tract lengths ranged from 90 bp/tract for <italic>ESAG1</italic> to 687 bp/tract for <italic>ESAG10</italic>, and mean tract lengths were similar in both coding and non-coding sequences. The GARD analyses demonstrate that phylogenetic breakpoints occur throughout the expression sites, consistent with frequent genetic exchange.</p>
<p>Phylogenetic inference of recombination can be misled by substitution rate variation, as could occur if different genes or regions within a gene are subject to different selection pressures. Therefore, a summary statistic-based approach, the Pairwise Homoplasy Index (Φ) Test <xref ref-type="bibr" rid="pone.0003527-Bruen1">[32]</xref>, which has been shown to be robust to substitution rate variation, was applied to each alignment to validate the GARD analyses, and to each of the individual recombination tracts inferred by GARD to identify any further recombination that might exist. With the exception of <italic>ESAG10</italic>, which is highly conserved, significant values of Φ were obtained for each <italic>ESAG</italic> alignment, consistent with recombination within these loci (<xref ref-type="supplementary-material" rid="pone.0003527.s008">Table S2</xref>). In addition, the Φ values were significant in at least some of the GARD-inferred tracts within all <italic>ESAG</italic> loci except <italic>ESAG8</italic> and <italic>ESAG10</italic>, and in 30% of individual tracts overall. These results indicate that there are additional breakpoints not detected by GARD, and support the conclusion that there is extensive recombination throughout the entire BES.</p>
</sec><sec id="s2h3">
<title>Evidence of molecular adaptation within ESAG families</title>
<p>The role of selection in the evolution of bloodstream expression sites was examined by estimating the ratio of the non-synonymous and synonymous substitution rates (ω) within each <italic>ESAG</italic> family. A likelihood ratio test was used to assess whether the distribution of ω across codons is best explained by a model (M1a) which assumes that all sites are evolving neutrally or under purifying selection, or by a model (M2a) which includes an additional category of sites under positive selection (i.e., ω&gt;1). As indicated by the higher likelihood scores of model M2a (<xref ref-type="supplementary-material" rid="pone.0003527.s009">Table S3</xref>), these tests provide significant evidence of adaptive evolution within <italic>ESAGs</italic> 4, 5, 6, and 7, and are nearly significant (p&lt;0.1) for <italic>ESAG1</italic> and <italic>ESAG3b</italic>. In contrast, there is no evidence of adaptive evolution in <italic>ESAGs</italic> 2, 8 and 10. Selective pressures at individual codons were inferred using a Bayesian approach with model M2a used as a prior distribution on ω. As expected, the majority of sites appear to be subject to strong purifying selection (ω≪0.5), while the numbers of positively-selected sites corroborate the gene-wide analyses, with <italic>ESAGs</italic> 4–7 displaying widespread adaptation (<xref ref-type="supplementary-material" rid="pone.0003527.s010">Table S4</xref>). Taken together, these results indicate that all <italic>ESAGs</italic> are under strong purifying selection, presumably to maintain functionality, and that most <italic>ESAGs</italic> contain at least some sites which have undergone adaptive evolution over the course of BES differentiation.</p>
</sec></sec></sec><sec id="s3">
<title>Discussion</title>
<p>The elucidation of the BES repertoire of a single <italic>T. brucei</italic> strain has produced a global view of BES structure and evolution. We have sequenced 19 out of 182 clones of BESs from <italic>T. brucei</italic> 427, chosen to represent as many different BESs as possible based on the preliminary analysis of the original set <xref ref-type="bibr" rid="pone.0003527-Becker1">[19]</xref> and including duplicates. Sequence analysis identified 14 distinct BESs, one of which exists in two copies, giving a total number of 15 BESs. Have we found all of the BESs in <italic>T. brucei</italic> 427? Assuming that the promoter sequence is conserved in all BESs, we estimated the chance of missing any BESs in the entire library by simulating samples of 182 randomly sampled clones from populations with different numbers of underlying BESs. In such a simulation, no sites are ‘missed’ if there were 19 or fewer BESs. Based on all of the available data the subset chosen for sequencing appears to cover most, if not all, BESs. Thirteen of these 15 BES were tagged with the Neomycin resistance gene in 30 random integration events. Assuming equal probability of tagging any end we expect to miss at least 2 out of 15 BESs in 30 tagging events 65% of the time (simulation of 1000 random samples of 30 tagging events). No BESs were tagged that were absent from the collection of TAR clones and we therefore are confident that the library contains the entire <italic>T. brucei</italic> Lister 427 BES repertoire. We will however only be able to address the question as to whether the size of the BES repertoire of <italic>T. brucei</italic> Lister 427 is shared by other <italic>Trypanosoma brucei</italic> isolates once a large number of strains are analyzed. The genome strain <italic>T. brucei</italic> TREU 927 has fewer BESs based on hybridization analysis <xref ref-type="bibr" rid="pone.0003527-Melville2">[33]</xref> and a similar set of <italic>T. brucei</italic> 927 BES TAR clones with only 5–8 promoter and <italic>ESAG6</italic> region sequence types have been identified (Becker and Louis, unpublished). In addition to having fewer BESs, <italic>T. brucei</italic> 927 also has smaller <italic>VSG</italic> basic copy arrays compared with <italic>T. brucei</italic> 427, though the genome strain <italic>T. brucei</italic> TREU 927 has one of the smallest genomes analysed among <italic>T. brucei</italic> isolates <xref ref-type="bibr" rid="pone.0003527-Callejas1">[34]</xref>. This makes it likely that the relatively large number of BESs that we observe here with <italic>T. brucei</italic> 427 does indeed fall within the range of BES copy numbers that may be observed among different isolates.</p>
<p>The validity of the TAR cloning is demonstrated by the identical sequences obtained from two independent TAR clones of the same BES, by the comparison to previously published sequences and by the congruence with the data obtained from the NEO-tagged BES. Given both the number of TAR clones from known BESs and TAR cloned DNA that does not exist in the genome, we get a maximum estimate of 15% of aberrant TAR clones in the original library. In fact, only one of the 19 TAR clones selected for sequencing (TAR128) is inconsistent with other data and could be a recombinant between two BESs generated during TAR cloning. The other clones originally classified with this clone in BES group 16 appear not to be recombinant and could be sequenced in the future.</p>
<p>The sequencing effort has also highlighted the need to return to the original TAR clone set to account for misclassifications based on the hypervariable region of <italic>ESAG6</italic> and the promoter sequence. Given that the promoter sequence was the target for recombination, the actual cloning procedure may have introduced variability in this region not present in the genome. As a consequence, two TAR clones were re-assigned in this study to different BES groups, giving fewer groupings than the original classification into 19 groups. It is clear that correct and complete characterisation of the telomeres requires a combination of saturation cloning and sequencing of well-chosen clones.</p>
<p>Characterisation of parasites with activated <italic>NEO</italic>-tagged BESs revealed that, as expected, <italic>in situ</italic> switching was the most frequent event. Interestingly, in three out of 28 switchers, we observed a switching mechanism, in which the previously active BES (BES1) was replaced by a duplication of the newly activated BES (7, 13 or 15b). Most likely recombination between the two subtelomeric regions occurs upstream of the drug-resistance genes, possibly at the promoter region, the 50 bp-repeat array, or in an even more internal chromosomal location. It is unclear which of the two BES copies is the active one. Nevertheless, our observations confirm what has been previously reported that an entire BES can be duplicated and transposed to a different locus <xref ref-type="bibr" rid="pone.0003527-Pays3">[23]</xref>, <xref ref-type="bibr" rid="pone.0003527-Cross1">[24]</xref>, which is reminiscent of break-induced replication in yeast. In fact, when a double-strand break is induced in subtelomeric regions of <italic>S. cerevisiae</italic>, that end is often replaced by a duplicated copy of another end (reviewed in <xref ref-type="bibr" rid="pone.0003527-Haber1">[35]</xref>). Such mechanism could explain the existence of two copies of BES15 and it may also have contributed to the large number of BES in <italic>T. brucei</italic> 427 relative to other isolates.</p>
<p>The BESs presented here show considerable diversity in the <italic>ESAG</italic> complement, though there is an overall conservation of order that agrees with the generic BES structure previously proposed <xref ref-type="bibr" rid="pone.0003527-Berriman2">[27]</xref> (top diagram in <xref ref-type="fig" rid="pone-0003527-g003">Figure 3</xref>). There are some clear exceptions within the overall conservation, ranging from a small BES containing only <italic>ESAG7</italic> and a <italic>VSG</italic>, to a BES containing <italic>ESAG</italic> duplications and triplications. The BES-tagging data presented here redefine the requirement for a minimal BES, which appears only to entail functional copies of <italic>ESAG</italic>s 1, 2 and 6, although <italic>ESAG1</italic> is not essential within an active BES <xref ref-type="bibr" rid="pone.0003527-Carruthers1">[16]</xref>, <xref ref-type="bibr" rid="pone.0003527-Morgan1">[17]</xref> and <italic>ESAG2</italic> is absent from the BES encoding <italic>SRA</italic>, the <italic>T. b. rhodesiense</italic> gene able to confer resistance to human serum in infections <xref ref-type="bibr" rid="pone.0003527-Xong1">[36]</xref>. There appears to be no requirement for <italic>ESAG7</italic>, as previously postulated <xref ref-type="bibr" rid="pone.0003527-Berriman2">[27]</xref>. The smallest BES we came across as part of this study only encodes <italic>ESAG7</italic> in addition to <italic>VSG</italic> (BES8). We were unfortunately unable to show activation of this site <italic>in vitro</italic> but it may yet indicate that none of the <italic>ESAGs</italic> need to be expressed from the active BES. However, the absolute requirement of <italic>ESAG</italic>s in an expression site is difficult to test because low-level transcription of <italic>ESAG6</italic> and <italic>ESAG7</italic> and indeed other <italic>ESAG</italic>s may occur from ‘silent’ sites <xref ref-type="bibr" rid="pone.0003527-Vanhamme1">[37]</xref>, <xref ref-type="bibr" rid="pone.0003527-vanLuenen1">[38]</xref>. Even if these truncated BES are not functional, they may still contribute sequences via gene conversion to other BESs.</p>
<p>One surprising finding was the presence of additional sequences downstream of the 70-bp repeat in some BESs, as well as the number of BESs containing additional <italic>VSG</italic> pseudogenes. The presence of pseudogenes towards the downstream end of the BES is not entirely unexpected though, as this area is a recombinational hotspot, continually accepting incoming copies of <italic>VSG</italic> cassettes in order to mediate antigenic variation. As the recombination processes involved may not be constrained by the high stringency normally imposed by mismatch repair <xref ref-type="bibr" rid="pone.0003527-Barnes1">[39]</xref>, it has to be expected that there will be errors, such as a duplicated cassette being copied into another cassette, rather than replacing it. Most of the <italic>VSG</italic>s in the silent archive are full-length pseudogenes, at least some of which contribute ‘healthy’ sequence to novel mosaic expressed <italic>VSG</italic>s <xref ref-type="bibr" rid="pone.0003527-Marcello1">[30]</xref>. It has been speculated that silent BESs might safely foster the stepwise assembly of mosaics, in contrast to the active BES, from which there is an absolute requirement for expression of an intact <italic>VSG</italic> <xref ref-type="bibr" rid="pone.0003527-Barry1">[40]</xref>, <xref ref-type="bibr" rid="pone.0003527-Sheader1">[41]</xref>. The present findings are compatible with this proposal, but not conclusive. The <italic>VSG</italic> pseudogenes could be copies of silent <italic>VSG</italic> pseudogenes, or partially assembled mosaics, or genes that have degenerated <italic>in situ</italic> through lack of requirement for expression. Work is underway to address the question of mosaic <italic>VSG</italic> assembly and expression.</p>
<p>The repertoire of BESs gives some indication of their proliferation among telomeres and their macroevolution. The driving forces that have shaped this repertoire are segmental duplications and deletions, recombination events typical of subtelomeres. However, gene content does not always coincide with the relationships among ESAG genes; for instance, BES13, 15 and 16 all possess a tandem duplication of <italic>ESAG8</italic>, but are not closely related based on their <italic>ESAG8</italic> nucleotide sequences. The incongruence between gene trees for the different <italic>ESAG</italic>s confirms that BESs have not diversified through ‘orthodox’ patterns of duplication and divergence. Rather, each BES is a mosaic and the product of frequent recombination between telomeres; this may occur through reciprocal crossover events between homologous strands at mitosis, or through non-reciprocal gene conversion. Recombination is frequently non-homologous, as we observe both segmental deletions and duplications, (for instance the substantial duplications and triplications within BES1), and variations in length, with some BESs greatly reduced in size (e.g. BES8 and BES10).</p>
<p>This process is consistent with previous observations of ‘telomere exchange’ <xref ref-type="bibr" rid="pone.0003527-Rudenko3">[42]</xref>, though the prevalence of mosaics demonstrates that whole telomeres are not typically exchanged. Instead, the data suggest that clusters of contiguous <italic>ESAG</italic>s share common histories, and therefore have not frequently been split by recombination. There appears to be a physical limit on the frequency of recombination breakpoints, which seldom occur in between <italic>ESAG</italic>s <italic>7</italic>, <italic>6</italic> and <italic>5</italic>, <italic>ESAG</italic>s <italic>4</italic> and <italic>8</italic> or between <italic>ESAG</italic>s<italic>2</italic>, <italic>1</italic> and <italic>11</italic> (<xref ref-type="fig" rid="pone-0003527-g004">Figure 4</xref>, <xref ref-type="supplementary-material" rid="pone.0003527.s008">Table S2</xref>). However, the transposition of an isolated ESAG7 copy into an active expression site (without ESAG6 and 5) has been reported under <italic>in vitro</italic> drug and serum selection pressure <xref ref-type="bibr" rid="pone.0003527-vanLuenen1">[38]</xref>. This provides experimental evidence that <italic>ESAG</italic>s can and do move between sites, with the loss of a particular allele from the active BES; our data qualify this by showing that <italic>ESAG7</italic> usually transpose in unison with <italic>ESAG</italic>s<italic>6</italic> and <italic>5</italic> (otherwise they would not share a common phylogenetic history).</p>
<p>Given that frequent breakpoints coincide with the position of <italic>ESAG3</italic> loci between linkage blocks, these could play a role in orientating expression sites prior to the exchange of intervening regions. This could also explain why <italic>ESAG3a</italic>, <italic>b</italic> and <italic>c</italic> sequences do not cluster by position (data not shown). It is therefore conceivable that the conserved, repetitive, higher order structure of expression sites may be maintained as a template for recombination, either to enhance the function of <italic>ESAG</italic>s, or of the VSG switching mechanism. Alternatively, the overall structure could be a secondary, non-adaptive result of the <italic>VSG</italic> switching events.</p>
<p>The majority of <italic>ESAG</italic>s within expression sites are unusual in that they are part of larger gene families present at chromosome internal locations within the genome but ‘behave’ like a tandem gene array or highly linked loci <xref ref-type="bibr" rid="pone.0003527-Jackson1">[43]</xref>. Internal and telomeric gene copies seem to evolve in very different ways. Internal copies of some families, for example <italic>ESAG4</italic> and <italic>5</italic> are more diverse and retain orthology with corresponding loci in the related species. Telomeric <italic>ESAG</italic> copies in contrast have relatively low levels of variation and therefore always form a clade in <italic>ESAG</italic> family phylogenies (data not shown). This indicates that frequent recombination between telomeric copies leads to homogenisation and concerted evolution of <italic>ESAG</italic> families and both GARD and PHI analyses have shown that most <italic>ESAG</italic> alignments contain chimaeras (<xref ref-type="fig" rid="pone-0003527-g004">Figures 4</xref> and <xref ref-type="supplementary-material" rid="pone.0003527.s006">S5</xref>, <xref ref-type="supplementary-material" rid="pone.0003527.s007">Table S1</xref>). In addition, localised diversification has clearly occurred in some <italic>ESAG</italic> families such as <italic>ESAG7</italic> and <italic>6</italic>, where the most diversifying codons can be mapped to the exposed surface of the molecule, including the hypervariable region. <xref ref-type="bibr" rid="pone.0003527-Salmon1">[11]</xref> (M. Carrington, University of Cambridge, personal communication).</p>
<p>We also postulate that a by-product of the recombination between <italic>ESAG</italic> families is the prevalence of some <italic>ESAGs</italic> as apparent pseudogenes. Like <italic>VSG</italic>s, <italic>ESAG</italic> copies may be routinely corrupted but continue to provide genetic resources for functional copies, since they can be rescued by subsequent gene conversion events. Whether <italic>ESAG</italic> evolution is adaptive, or simply a secondary consequence of sharing the expression site environment, remains to be seen.</p>
<p>The conclusion that both the whole BES and individual <italic>ESAGs</italic> are mosaics raises the question as to how it is possible for two contiguous markers, such as <italic>ESAG1</italic> and <italic>2</italic>, to display parallel evolutionary histories, when both gene families are being homogenised by frequent gene conversions. This should effectively randomise the relationships of each ESAG family relative to each other. Essentially, we could be observing recombination on two different scales. Entire BESs recombine, perhaps as a secondary effect of the <italic>VSG</italic> switching mechanism, but this is limited by spatial proximity. At a finer scale, individual <italic>ESAG</italic>s recombine with paralogs in other expression sites, which restrains the normal process of divergence, tending to homogenise the entire family. Our observation that BESs retain phylogenetic signals, i.e. a pattern of divergence, demonstrates that substitutions affecting <italic>ESAG</italic> sequences are not entirely homogenised by recombination. Therefore, for phylogenetic signals to persist, the substitution rate, perhaps augmented by positive selection, must limit the extent of homogenisation through recombination in a dynamic equilibrium. Neighbouring <italic>ESAG</italic>s that are not separated by recombination share this equilibrium and therefore, phylogenetic signal.</p>
<p>This work opens important perspectives in understanding the molecular mechanisms of antigenic variation and telomere biology. The fact that the short BES8 and BES10 could not be activated <italic>in vitro</italic> opens the possibility of using these sites to identify the minimum requirements to make a functional BES. The role of telomeres in BES transcription has been extensively studied by several groups (reviewed in <xref ref-type="bibr" rid="pone.0003527-Dreesen1">[44]</xref>). Truncated BES may be a useful tool to study telomere biology in <italic>T. brucei</italic>, since the distance between the promoter and the telomere is much shorter. Finally, BES sequences and overall architecture will aid the identification of the mediators involved in <italic>VSG</italic> switching. Such studies may reveal mechanisms that are relevant to telomere biology and antigenic variation in other important pathogens.</p>
</sec><sec id="s4">
<title>Materials and Methods</title>
<sec id="s4a">
<title><italic>Trypanosoma brucei</italic></title>
<p>The BES TAR library was constructed from <italic>T. brucei</italic> Lister 427 strain clone 221a <xref ref-type="bibr" rid="pone.0003527-Johnson1">[45]</xref>, in which a hygromycin-resistance gene had been previously introduced immediately downstream of the promoter of the active VSG221/427-2 expression site and a neomycin-resistance gene downstream of the promoter of the silent VSGVO2 expression site <xref ref-type="bibr" rid="pone.0003527-Rudenko2">[22]</xref>. BES-tagged cell lines were also derived from wild-type <italic>T. brucei</italic> 221a. Bloodstream-form trypanosomes were grown in HMI-9 medium <xref ref-type="bibr" rid="pone.0003527-Hirumi1">[46]</xref>. Stable transfections were performed using the BTX Electroporator <xref ref-type="bibr" rid="pone.0003527-Wirtz1">[47]</xref>.</p>
</sec><sec id="s4b">
<title>Isolation of TAR clones and preparation of sequencing libraries</title>
<p>Yeast artificial chromosomes (YACs) containing BESs, TAR-cloned using the conserved <italic>VSG</italic> BES promoter as a recombination targets, have been previously described <xref ref-type="bibr" rid="pone.0003527-Becker1">[19]</xref>. A representative clone was chosen from each group, selecting a larger sized clone wherever possible. Clones were isolated from yeast transformants through separation of the YAC DNA from endogenous chromosomes by CHEF (contour clamped homogeneous electric field) gel electrophoresis <xref ref-type="bibr" rid="pone.0003527-Leech1">[48]</xref>. The recovered DNA was fragmented by sonication and end-repaired with mung bean nuclease prior to preparative agarose gel electrophoresis. DNA fragments of 2–4 kb and 1.4–2 kb were purified and cloned into pUC18 plasmid vector.</p>
</sec><sec id="s4c">
<title>Sequence determination, assembly and annotation</title>
<p>Nineteen TAR clones were sequenced by random sequencing of small insert libraries using dye-terminator chemistry on an ABI 3730 sequencing machine. Sequence reads were assembled using Phrap [<ext-link ext-link-type="uri" xlink:href="http://www.phrap.org" xlink:type="simple">www.phrap.org</ext-link>; P. Green, unpublished)]. Manual base calling and finishing was carried out using Gap4 software (<ext-link ext-link-type="uri" xlink:href="http://www.mrc-lmb.cam.ac.uk/pubseq/manual/gap4_unix_1.html" xlink:type="simple">http://www.mrc-lmb.cam.ac.uk/pubseq/manual/gap4_unix_1.html</ext-link>). Gaps and low quality regions of the sequence were resolved by primer walking and targeted polymerase chain reactions (PCR). A number of gaps, all exclusively located in the 70-bp repeat regions, remain in the assemblies and are indicated by 100 N's (<xref ref-type="fig" rid="pone-0003527-g003">Figure 3</xref>).</p>
<p>Each clone was annotated using the Artemis software <xref ref-type="bibr" rid="pone.0003527-Rutherford1">[49]</xref>. Protein coding sequences were predicted as previously described and analysed to assign putative functions as previously described <xref ref-type="bibr" rid="pone.0003527-Berriman1">[18]</xref>. The full annotation of 19 expression sites can be viewed and searched via GeneDB (<ext-link ext-link-type="uri" xlink:href="http://www.genedb.org/genedb/tbrucei427/" xlink:type="simple">http://www.genedb.org/genedb/tbrucei427/</ext-link>) and sequences have been submitted to EMBL with the following accession numbers: FM162566 - FM162583.</p>
<p>Current VSG nomenclature reflects multiple naming schemes. We therefore propose a new systematic nomenclature based on sequential numbering with reference to the <italic>T. brucei</italic> Lister 427 strain (<xref ref-type="table" rid="pone-0003527-t001">Table 1</xref>).</p>
</sec><sec id="s4d">
<title>Sequence alignments</title>
<p>The Needle program, an implementation of Needleman-Wunsch algorithm in the EMBOSS <xref ref-type="bibr" rid="pone.0003527-Rice1">[50]</xref> software package was used to perform global alignments using default parameters. The region of the imperfect 70-bp repeats was excluded from each alignment. Local alignments were performed using ClustalW (<ext-link ext-link-type="uri" xlink:href="http://www.ebi.ac.uk/clustalw/index.html" xlink:type="simple">http://www.ebi.ac.uk/clustalw/index.html</ext-link>) with default parameters</p>
</sec><sec id="s4e">
<title>Generation of <italic>T. brucei</italic> clones with tagged BES</title>
<p>BES-tagged clones were generated by introducing a Puromycin resistance gene (<italic>PUR</italic>) downstream of the promoter of a wild-type <italic>VSG221/427-2</italic> expressing cell line. <italic>NEO</italic> was subsequently integrated downstream of the promoters of random BESs conferring resistance to G418. Clones obtained from this transfection were named BF-LF17.x or BF-LF18.x. depending on the presence or absence of the 50-bp repeat array upstream of BES1 promoter (Figueiredo <italic>et al.</italic>, unpublished) (see also <xref ref-type="supplementary-material" rid="pone.0003527.s001">Data S1</xref>).</p>
</sec><sec id="s4f">
<title>BES switching assay</title>
<p>To prevent premature growth of <italic>in situ</italic> switchers, <italic>NEO</italic>-tagged clones were grown under Puromycin selection. After 5 days, cells were subcloned by limiting dilution in the absence of any drug to allow independent switching in each subclone. 2.4×10<sup>7</sup> cells of 2–5 subclones were subsequently diluted in HMI-9 containing 100 µg/mL G418, and distributed in a 24-well plate. After 6–8 days, the number of G418-resistant clones was counted. Switching frequency was calculated by dividing the number of G418-resistant clones by the total number of plated cells. One or two clones from each plate were tested for Puromycin sensitivity by diluting 10<sup>5</sup> cells in 5 mL of HMI-9 containing Puromycin at 1 µg/mL. Cell growth was scored after 2 days. Western Blotting was performed to confirm that G418-resistant cells no longer expressed VSG221/427-2.</p>
</sec><sec id="s4g">
<title>Cloning the <italic>ESAG6</italic> hypervariable region</title>
<p>The <italic>ESAG6</italic> hypervariable region of each <italic>NEO</italic>-tagged BES was PCR amplified using a <italic>NEO</italic>-specific primer and one of two <italic>ESAG6</italic>-specific primers (<named-content content-type="gene" xlink:type="simple">5′-TAAAGAGAGTTGTTCACTCAC-3′</named-content> or <named-content content-type="gene" xlink:type="simple">5′-TGTTCACTCACTCTCTTTGAC-3′</named-content>) and the products gel-purified and sequenced. From clones with two consecutive <italic>ESAG6</italic> genes, the <italic>ESAG6</italic> hypervariable region from the most telomeric <italic>ESAG6</italic> gene, was reamplified from the largest PCR fragment by nested-PCR with primers: <named-content content-type="gene" xlink:type="simple">5′-CACTAATGATCAGCTTTACG-3′</named-content> and <named-content content-type="gene" xlink:type="simple">5′-GACTCTTTTACACGTGAATC-3′</named-content>. The resulting 1-kb fragment was purified and sequenced.</p>
</sec><sec id="s4h">
<title>Cloning the expressed VSG</title>
<p>Total RNA was extracted from ∼10<sup>8</sup> G418-resistant cells with RNA STAT-60 reagent (TEL-TEST, Inc.), following the manufacturer's instructions. cDNA was synthesized using a PolyT-primer and the StrataScript™ First Strand Synthesis System (Stratagene). <italic>VSG</italic> cDNA was amplified with primers that bind to the spliced leader (<named-content content-type="gene" xlink:type="simple">5′-GACTAGTTTCTGTACTATAT-3′</named-content>) and to a conserved sequence found in the 3′UTR of all <italic>VSG</italic> (<named-content content-type="gene" xlink:type="simple">5′-GTGTTAAAATATATC-3′</named-content>). Using the spliced leader primer ensured that the amplified product originated only from <italic>trans</italic>-spliced RNA and not from a DNA contaminant. PCR products were subsequently cloned in pGEM-T Easy (Promega) and sequenced.</p>
</sec><sec id="s4i">
<title>Chromosome separation by CHEF</title>
<p><italic>T. brucei</italic> chromosomes were separated using a CHEF electrophoresis apparatus (CHEF-DR III, Bio-Rad), loading DNA from approximately 2×10<sup>7</sup> cells per lane. Electrophoresis conditions for the panel separating <italic>T. brucei</italic> intermediate chromosomes were: 25 s pulse time, 6 V/cm, for 20 h, in 0.5×TBE, at 14°C, using a gel of 1% high-strength agarose (Helena Biosciences). <italic>T. brucei</italic> megabase chromosomes were separated using 1400–700 s linear ramped pulse, 2.5 V/cm, for 144 h in 1×TBE at 14°C in a gel with 1.2% high-strength agarose.</p>
</sec><sec id="s4j">
<title>Long-range Southern blotting</title>
<p>Agarose-embedded chromosome plugs were digested with 40 units of <italic>Apa</italic> I or <italic>Apa</italic> I and <italic>Xma</italic> I (New England Biolabs), as previously described <xref ref-type="bibr" rid="pone.0003527-Dreesen2">[51]</xref>. Restriction products were separated on a 1.0% agarose gel in 0.5×Tris-Borate-EDTA buffer (TBE) in the Stratagene Rotating Agarose Gel Electrophoresis variant of Pulsed Field Gel Electrophoresis (PFGE) at 12°C and with a rotation angle of 120°. The running program for <italic>Apa</italic> I restriction fragments consisted of a 5 to 15 sec linear ramp at a constant 155 V for 18 h. For <italic>Apa</italic> I and <italic>Xma</italic> I restriction fragments the program was 1 to 4 sec linear ramp at a constant 150 V for 18 h. After alkaline transfer and hybridization with a radioactive probe, the Hybond-N+ Nylon membranes (Amersham Biosciences) were typically washed at 65°C as follows: twice for 20 min with 2×Sodium Chloride/Sodium Citrate (SSC), 0.1% SDS and twice for 20 min with 0.5×SSC, 0.1%SDS.</p>
</sec><sec id="s4k">
<title>Comparison of phylogenetic signal among <italic>ESAG</italic>s</title>
<p>ClustalX was used to align homologs of 7 ESAG loci from 11 different expression sites <xref ref-type="bibr" rid="pone.0003527-Thompson1">[52]</xref>. The maximum likelihood phylogenetic tree topology was estimated for each locus using the program PHYML <xref ref-type="bibr" rid="pone.0003527-Guindon1">[53]</xref>, with a GTR+Γ model and parameters estimated from the data. By constraining the resulting trees with the optimal topology of each other locus in turn a further six tree topologies were produced for each locus. The differences in likelihood value between the optimal tree and each constrained tree were calculated and the significance evaluated using the Shimodaira-Hasegawa test <xref ref-type="bibr" rid="pone.0003527-Shimodaira1">[54]</xref> thus quantifying the difference in phylogenetic signal between different loci along the expression site. Such likelihood comparisons require that two trees have equal taxon sets. For this reason a consistent gene complement from each expression site was used and <italic>ESAG10</italic> and <italic>ESAG7</italic> were therefore excluded. <italic>ESAG3</italic> was also not used because it is present in three positions along the expression site and does not cluster by position; hence, its phylogenetic signal was not amenable to positional comparisons.</p>
</sec><sec id="s4l">
<title>Characterization of recombination</title>
<p>Sequence alignments of each <italic>ESAG</italic> family and selected intergenic regions were generated with ClustalX as described above, manually edited and gap-stripped. Each alignment was tested for evidence of recombination using two approaches. (i) The likelihood-based method implemented in the program GARD (<xref ref-type="bibr" rid="pone.0003527-KosakovskyPond1">[31]</xref>; <ext-link ext-link-type="uri" xlink:href="http://www.datamonkey.org/GARD" xlink:type="simple">http://www.datamonkey.org/GARD</ext-link>) was used to identify putative recombination and gene conversion breakpoints, employing a nucleotide substitution model specified by the HyPhy software package (<xref ref-type="bibr" rid="pone.0003527-Pond1">[55]</xref>; <ext-link ext-link-type="uri" xlink:href="http://www.hyphy.org" xlink:type="simple">http://www.hyphy.org</ext-link>). (ii) The program Phi <xref ref-type="bibr" rid="pone.0003527-Bruen1">[32]</xref>; <ext-link ext-link-type="uri" xlink:href="http://www.mcb.mcgill.ca/trevor" xlink:type="simple">http://www.mcb.mcgill.ca/trevor</ext-link>) was used to assess the significance of the pairwise homoplasy index (Φ<sub>w</sub>) with a window size of 100 bases and 10,000 permutations per test.</p>
</sec><sec id="s4m">
<title>Adaptive evolution of <italic>ESAG</italic> sequences</title>
<p><italic>ESAG</italic> protein-coding sequences were analysed for adaptive evolution by estimating the relative rates of non-synonymous and synonymous substitutions within each ESAG family. Positive selection is indicated by a non-synonymous/synonymous rate ratio (ω) greater than 1. The method was modified for recombinant sequences by allowing the genealogy to vary across the alignment while sharing the parameters of the codon substitution model between tracts <xref ref-type="bibr" rid="pone.0003527-Scheffler1">[56]</xref>. The dimensions and genealogies of putative recombination tracts were provided by the GARD analyses described previously. HyPhy was used to obtain maximum likelihood estimates for two nested models of the distribution of ω. A likelihood ratio test for positive selection was performed with a χ<sup>2</sup>-distribution on two degrees of freedom by comparing twice the log-likelihood difference between a nearly-neutral model (M1a, in which ω cannot exceed 1) and a selection model (M2a) that included an additional category for ω&gt;1 <xref ref-type="bibr" rid="pone.0003527-Wong1">[57]</xref>. Evidence for adaptive evolution at individual codons was tested using an empirical Bayes method <xref ref-type="bibr" rid="pone.0003527-Wong1">[57]</xref>: model M2a, with the maximum likelihood estimated parameters, was taken as a prior distribution for ω, and Bayes' formula was used to calculate the posterior distribution of ω at each codon, given the sequence data.</p>
</sec></sec><sec id="s5">
<title>Supporting Information</title>
<supplementary-material id="pone.0003527.s001" mimetype="application/msword" position="float" xlink:href="info:doi/10.1371/journal.pone.0003527.s001" xlink:type="simple"><label>Data S1</label><caption>
<p>Additional <xref ref-type="sec" rid="s4">Materials and Methods</xref>; Figure and Table legends of supporting data</p>
<p>(0.04 MB DOC)</p>
</caption></supplementary-material><supplementary-material id="pone.0003527.s002" mimetype="application/postscript" position="float" xlink:href="info:doi/10.1371/journal.pone.0003527.s002" xlink:type="simple"><label>Figure S1</label><caption>
<p>PFGE Southern blotting.</p>
<p>(2.68 MB EPS)</p>
</caption></supplementary-material><supplementary-material id="pone.0003527.s003" mimetype="application/postscript" position="float" xlink:href="info:doi/10.1371/journal.pone.0003527.s003" xlink:type="simple"><label>Figure S2</label><caption>
<p>Absence of ESAG7 from BES7.</p>
<p>(1.82 MB EPS)</p>
</caption></supplementary-material><supplementary-material id="pone.0003527.s004" mimetype="application/postscript" position="float" xlink:href="info:doi/10.1371/journal.pone.0003527.s004" xlink:type="simple"><label>Figure S3</label><caption>
<p>Long-range restriction mapping of NEO-tagged clones.</p>
<p>(5.15 MB EPS)</p>
</caption></supplementary-material><supplementary-material id="pone.0003527.s005" mimetype="application/postscript" position="float" xlink:href="info:doi/10.1371/journal.pone.0003527.s005" xlink:type="simple"><label>Figure S4</label><caption>
<p>Quantifying the difference in phylogenetic signal along the bloodstream expression site.</p>
<p>(1.97 MB EPS)</p>
</caption></supplementary-material><supplementary-material id="pone.0003527.s006" mimetype="application/postscript" position="float" xlink:href="info:doi/10.1371/journal.pone.0003527.s006" xlink:type="simple"><label>Figure S5</label><caption>
<p>GARD analysis and interpretation using ESAG2 sequences as an example.</p>
<p>(5.49 MB EPS)</p>
</caption></supplementary-material><supplementary-material id="pone.0003527.s007" mimetype="application/postscript" position="float" xlink:href="info:doi/10.1371/journal.pone.0003527.s007" xlink:type="simple"><label>Table S1</label><caption>
<p>Locations of breakpoints inferred by GARD analysis of ESAG alignments.</p>
<p>(0.38 MB EPS)</p>
</caption></supplementary-material><supplementary-material id="pone.0003527.s008" mimetype="application/postscript" position="float" xlink:href="info:doi/10.1371/journal.pone.0003527.s008" xlink:type="simple"><label>Table S2</label><caption>
<p>Diversity and recombination within BES coding and intergenic sequences.</p>
<p>(0.45 MB EPS)</p>
</caption></supplementary-material><supplementary-material id="pone.0003527.s009" mimetype="application/postscript" position="float" xlink:href="info:doi/10.1371/journal.pone.0003527.s009" xlink:type="simple"><label>Table S3</label><caption>
<p>Non-synonymous substitution rates for ESAGs.</p>
<p>(0.35 MB EPS)</p>
</caption></supplementary-material><supplementary-material id="pone.0003527.s010" mimetype="application/postscript" position="float" xlink:href="info:doi/10.1371/journal.pone.0003527.s010" xlink:type="simple"><label>Table S4</label><caption>
<p>Positively selected codons in ESAG proteins.</p>
<p>(0.32 MB EPS)</p>
</caption></supplementary-material></sec></body>
<back>
<ack>
<p>We thank the core sequencing and informatics teams at the Wellcome Trust Sanger Institute for their assistance.</p>
</ack>
<ref-list>
<title>References</title>
<ref id="pone.0003527-Mefford1"><label>1</label><element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author">
<name name-style="western"><surname>Mefford</surname><given-names>HC</given-names></name>
<name name-style="western"><surname>Trask</surname><given-names>BJ</given-names></name>
</person-group>             <year>2002</year>             <article-title>The complex structure and dynamic evolution of human subtelomeres.</article-title>             <source>Nat Rev Genet</source>             <volume>3</volume>             <fpage>91</fpage>             <lpage>102</lpage>          </element-citation></ref>
<ref id="pone.0003527-Horn1"><label>2</label><element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author">
<name name-style="western"><surname>Horn</surname><given-names>D</given-names></name>
<name name-style="western"><surname>Barry</surname><given-names>JD</given-names></name>
</person-group>             <year>2005</year>             <article-title>The central roles of telomeres and subtelomeres in antigenic variation in African trypanosomes.</article-title>             <source>Chromosome Res</source>             <volume>13</volume>             <fpage>525</fpage>             <lpage>533</lpage>          </element-citation></ref>
<ref id="pone.0003527-Fedorova1"><label>3</label><element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author">
<name name-style="western"><surname>Fedorova</surname><given-names>ND</given-names></name>
<name name-style="western"><surname>Khaldi</surname><given-names>N</given-names></name>
<name name-style="western"><surname>Joardar</surname><given-names>VS</given-names></name>
<name name-style="western"><surname>Maiti</surname><given-names>R</given-names></name>
<name name-style="western"><surname>Amedeo</surname><given-names>P</given-names></name>
<etal/></person-group>             <year>2008</year>             <article-title>Genomic islands in the pathogenic filamentous fungus Aspergillus fumigatus.</article-title>             <source>PLoS Genet</source>             <volume>4</volume>             <fpage>e1000046</fpage>          </element-citation></ref>
<ref id="pone.0003527-Pryde1"><label>4</label><element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author">
<name name-style="western"><surname>Pryde</surname><given-names>FE</given-names></name>
<name name-style="western"><surname>Gorham</surname><given-names>HC</given-names></name>
<name name-style="western"><surname>Louis</surname><given-names>EJ</given-names></name>
</person-group>             <year>1997</year>             <article-title>Chromosome ends: all the same under their caps.</article-title>             <source>Curr Opin Genet Dev</source>             <volume>7</volume>             <fpage>822</fpage>             <lpage>828</lpage>          </element-citation></ref>
<ref id="pone.0003527-Pays1"><label>5</label><element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author">
<name name-style="western"><surname>Pays</surname><given-names>E</given-names></name>
</person-group>             <year>2005</year>             <article-title>Regulation of antigen gene expression in Trypanosoma brucei.</article-title>             <source>Trends Parasitol</source>             <volume>21</volume>             <fpage>517</fpage>             <lpage>520</lpage>          </element-citation></ref>
<ref id="pone.0003527-Navarro1"><label>6</label><element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author">
<name name-style="western"><surname>Navarro</surname><given-names>M</given-names></name>
<name name-style="western"><surname>Cross</surname><given-names>GA</given-names></name>
</person-group>             <year>1996</year>             <article-title>DNA rearrangements associated with multiple consecutive directed antigenic switches in Trypanosoma brucei.</article-title>             <source>Mol Cell Biol</source>             <volume>16</volume>             <fpage>3615</fpage>             <lpage>3625</lpage>          </element-citation></ref>
<ref id="pone.0003527-Redpath1"><label>7</label><element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author">
<name name-style="western"><surname>Redpath</surname><given-names>MB</given-names></name>
<name name-style="western"><surname>Windle</surname><given-names>H</given-names></name>
<name name-style="western"><surname>Nolan</surname><given-names>D</given-names></name>
<name name-style="western"><surname>Pays</surname><given-names>E</given-names></name>
<name name-style="western"><surname>Voorheis</surname><given-names>HP</given-names></name>
<etal/></person-group>             <year>2000</year>             <article-title>ESAG11, a new VSG expression site-associated gene from Trypanosoma brucei.</article-title>             <source>Mol Biochem Parasitol</source>             <volume>111</volume>             <fpage>223</fpage>             <lpage>228</lpage>          </element-citation></ref>
<ref id="pone.0003527-Pays2"><label>8</label><element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author">
<name name-style="western"><surname>Pays</surname><given-names>E</given-names></name>
<name name-style="western"><surname>Lips</surname><given-names>S</given-names></name>
<name name-style="western"><surname>Nolan</surname><given-names>D</given-names></name>
<name name-style="western"><surname>Vanhamme</surname><given-names>L</given-names></name>
<name name-style="western"><surname>Perez-Morga</surname><given-names>D</given-names></name>
</person-group>             <year>2001</year>             <article-title>The VSG expression sites of Trypanosoma brucei: multipurpose tools for the adaptation of the parasite to mammalian hosts.</article-title>             <source>Mol Biochem Parasitol</source>             <volume>114</volume>             <fpage>1</fpage>             <lpage>16</lpage>          </element-citation></ref>
<ref id="pone.0003527-Paindavoine1"><label>9</label><element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author">
<name name-style="western"><surname>Paindavoine</surname><given-names>P</given-names></name>
<name name-style="western"><surname>Rolin</surname><given-names>S</given-names></name>
<name name-style="western"><surname>Van Assel</surname><given-names>S</given-names></name>
<name name-style="western"><surname>Geuskens</surname><given-names>M</given-names></name>
<name name-style="western"><surname>Jauniaux</surname><given-names>JC</given-names></name>
<etal/></person-group>             <year>1992</year>             <article-title>A gene from the variant surface glycoprotein expression site encodes one of several transmembrane adenylate cyclases located on the flagellum of Trypanosoma brucei.</article-title>             <source>Mol Cell Biol</source>             <volume>12</volume>             <fpage>1218</fpage>             <lpage>1225</lpage>          </element-citation></ref>
<ref id="pone.0003527-Ligtenberg1"><label>10</label><element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author">
<name name-style="western"><surname>Ligtenberg</surname><given-names>MJ</given-names></name>
<name name-style="western"><surname>Bitter</surname><given-names>W</given-names></name>
<name name-style="western"><surname>Kieft</surname><given-names>R</given-names></name>
<name name-style="western"><surname>Steverding</surname><given-names>D</given-names></name>
<name name-style="western"><surname>Janssen</surname><given-names>H</given-names></name>
<etal/></person-group>             <year>1994</year>             <article-title>Reconstitution of a surface transferrin binding complex in insect form Trypanosoma brucei.</article-title>             <source>Embo J</source>             <volume>13</volume>             <fpage>2565</fpage>             <lpage>2573</lpage>          </element-citation></ref>
<ref id="pone.0003527-Salmon1"><label>11</label><element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author">
<name name-style="western"><surname>Salmon</surname><given-names>D</given-names></name>
<name name-style="western"><surname>Hanocq-Quertier</surname><given-names>J</given-names></name>
<name name-style="western"><surname>Paturiaux-Hanocq</surname><given-names>F</given-names></name>
<name name-style="western"><surname>Pays</surname><given-names>A</given-names></name>
<name name-style="western"><surname>Tebabi</surname><given-names>P</given-names></name>
<etal/></person-group>             <year>1997</year>             <article-title>Characterization of the ligand-binding site of the transferrin receptor in Trypanosoma brucei demonstrates a structural relationship with the N-terminal domain of the variant surface glycoprotein.</article-title>             <source>Embo J</source>             <volume>16</volume>             <fpage>7272</fpage>             <lpage>7278</lpage>          </element-citation></ref>
<ref id="pone.0003527-Hoek1"><label>12</label><element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author">
<name name-style="western"><surname>Hoek</surname><given-names>M</given-names></name>
<name name-style="western"><surname>Engstler</surname><given-names>M</given-names></name>
<name name-style="western"><surname>Cross</surname><given-names>GA</given-names></name>
</person-group>             <year>2000</year>             <article-title>Expression-site-associated gene 8 (ESAG8) of Trypanosoma brucei is apparently essential and accumulates in the nucleolus.</article-title>             <source>J Cell Sci</source>             <volume>113(Pt 22)</volume>             <fpage>3959</fpage>             <lpage>3968</lpage>          </element-citation></ref>
<ref id="pone.0003527-Hoek2"><label>13</label><element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author">
<name name-style="western"><surname>Hoek</surname><given-names>M</given-names></name>
<name name-style="western"><surname>Zanders</surname><given-names>T</given-names></name>
<name name-style="western"><surname>Cross</surname><given-names>GAM</given-names></name>
</person-group>             <year>2002</year>             <article-title>Trypanosoma brucei expression-site-associated-gene 8 protein interacts with a Pumilio family protein.</article-title>             <source>Mol Biochem Parasitol</source>             <volume>120</volume>             <fpage>269</fpage>             <lpage>283</lpage>          </element-citation></ref>
<ref id="pone.0003527-Gottesdiener1"><label>14</label><element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author">
<name name-style="western"><surname>Gottesdiener</surname><given-names>KM</given-names></name>
</person-group>             <year>1994</year>             <article-title>A new VSG expression site-associated gene (ESAG) in the promoter region of Trypanosoma brucei encodes a protein with 10 potential transmembrane domains.</article-title>             <source>Mol Biochem Parasitol</source>             <volume>63</volume>             <fpage>143</fpage>             <lpage>151</lpage>          </element-citation></ref>
<ref id="pone.0003527-Florent1"><label>15</label><element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author">
<name name-style="western"><surname>Florent</surname><given-names>IC</given-names></name>
<name name-style="western"><surname>Raibaud</surname><given-names>A</given-names></name>
<name name-style="western"><surname>Eisen</surname><given-names>H</given-names></name>
</person-group>             <year>1991</year>             <article-title>A family of genes related to a new expression site-associated gene in Trypanosoma equiperdum.</article-title>             <source>Mol Cell Biol</source>             <volume>11</volume>             <fpage>2180</fpage>             <lpage>2188</lpage>          </element-citation></ref>
<ref id="pone.0003527-Carruthers1"><label>16</label><element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author">
<name name-style="western"><surname>Carruthers</surname><given-names>VB</given-names></name>
<name name-style="western"><surname>Navarro</surname><given-names>M</given-names></name>
<name name-style="western"><surname>Cross</surname><given-names>GA</given-names></name>
</person-group>             <year>1996</year>             <article-title>Targeted disruption of expression site-associated gene-1 in bloodstream-form Trypanosoma brucei.</article-title>             <source>Mol Biochem Parasitol</source>             <volume>81</volume>             <fpage>65</fpage>             <lpage>79</lpage>          </element-citation></ref>
<ref id="pone.0003527-Morgan1"><label>17</label><element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author">
<name name-style="western"><surname>Morgan</surname><given-names>RW</given-names></name>
<name name-style="western"><surname>El-Sayed</surname><given-names>NM</given-names></name>
<name name-style="western"><surname>Kepa</surname><given-names>JK</given-names></name>
<name name-style="western"><surname>Pedram</surname><given-names>M</given-names></name>
<name name-style="western"><surname>Donelson</surname><given-names>JE</given-names></name>
</person-group>             <year>1996</year>             <article-title>Differential expression of the expression site-associated gene I family in African trypanosomes.</article-title>             <source>J Biol Chem</source>             <volume>271</volume>             <fpage>9771</fpage>             <lpage>9777</lpage>          </element-citation></ref>
<ref id="pone.0003527-Berriman1"><label>18</label><element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author">
<name name-style="western"><surname>Berriman</surname><given-names>M</given-names></name>
<name name-style="western"><surname>Ghedin</surname><given-names>E</given-names></name>
<name name-style="western"><surname>Hertz-Fowler</surname><given-names>C</given-names></name>
<name name-style="western"><surname>Blandin</surname><given-names>G</given-names></name>
<name name-style="western"><surname>Renauld</surname><given-names>H</given-names></name>
<etal/></person-group>             <year>2005</year>             <article-title>The genome of the African trypanosome Trypanosoma brucei.</article-title>             <source>Science</source>             <volume>309</volume>             <fpage>416</fpage>             <lpage>422</lpage>          </element-citation></ref>
<ref id="pone.0003527-Becker1"><label>19</label><element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author">
<name name-style="western"><surname>Becker</surname><given-names>M</given-names></name>
<name name-style="western"><surname>Aitcheson</surname><given-names>N</given-names></name>
<name name-style="western"><surname>Byles</surname><given-names>E</given-names></name>
<name name-style="western"><surname>Wickstead</surname><given-names>B</given-names></name>
<name name-style="western"><surname>Louis</surname><given-names>E</given-names></name>
<etal/></person-group>             <year>2004</year>             <article-title>Isolation of the repertoire of VSG expression site containing telomeres of Trypanosoma brucei 427 using transformation-associated recombination in yeast.</article-title>             <source>Genome Res</source>             <volume>14</volume>             <fpage>2319</fpage>             <lpage>2329</lpage>          </element-citation></ref>
<ref id="pone.0003527-Rudenko1"><label>20</label><element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author">
<name name-style="western"><surname>Rudenko</surname><given-names>G</given-names></name>
<name name-style="western"><surname>Blundell</surname><given-names>PA</given-names></name>
<name name-style="western"><surname>Dirks-Mulder</surname><given-names>A</given-names></name>
<name name-style="western"><surname>Kieft</surname><given-names>R</given-names></name>
<name name-style="western"><surname>Borst</surname><given-names>P</given-names></name>
</person-group>             <year>1995</year>             <article-title>A ribosomal DNA promoter replacing the promoter of a telomeric VSG gene expression site can be efficiently switched on and off in T. brucei.</article-title>             <source>Cell</source>             <volume>83</volume>             <fpage>547</fpage>             <lpage>553</lpage>          </element-citation></ref>
<ref id="pone.0003527-Melville1"><label>21</label><element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author">
<name name-style="western"><surname>Melville</surname><given-names>SE</given-names></name>
<name name-style="western"><surname>Leech</surname><given-names>V</given-names></name>
<name name-style="western"><surname>Navarro</surname><given-names>M</given-names></name>
<name name-style="western"><surname>Cross</surname><given-names>GAM</given-names></name>
</person-group>             <year>2000</year>             <article-title>The molecular karyotype of the megabase chromosomes of Trypanosoma brucei stock 427.</article-title>             <source>Mol Biochem Parasitol</source>             <volume>111</volume>             <fpage>261</fpage>             <lpage>273</lpage>          </element-citation></ref>
<ref id="pone.0003527-Rudenko2"><label>22</label><element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author">
<name name-style="western"><surname>Rudenko</surname><given-names>G</given-names></name>
<name name-style="western"><surname>Chaves</surname><given-names>I</given-names></name>
<name name-style="western"><surname>Dirks-Mulder</surname><given-names>A</given-names></name>
<name name-style="western"><surname>Borst</surname><given-names>P</given-names></name>
</person-group>             <year>1998</year>             <article-title>Selection for activation of a new variant surface glycoprotein gene expression site in Trypanosoma brucei can result in deletion of the old one.</article-title>             <source>Mol Biochem Parasitol</source>             <volume>95</volume>             <fpage>97</fpage>             <lpage>109</lpage>          </element-citation></ref>
<ref id="pone.0003527-Pays3"><label>23</label><element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author">
<name name-style="western"><surname>Pays</surname><given-names>E</given-names></name>
<name name-style="western"><surname>Delauw</surname><given-names>MF</given-names></name>
<name name-style="western"><surname>Van Assel</surname><given-names>S</given-names></name>
<name name-style="western"><surname>Laurent</surname><given-names>M</given-names></name>
<name name-style="western"><surname>Vervoort</surname><given-names>T</given-names></name>
<etal/></person-group>             <year>1983</year>             <article-title>Modifications of a Trypanosoma b. brucei antigen gene repertoire by different DNA recombinational mechanisms.</article-title>             <source>Cell</source>             <volume>35</volume>             <fpage>721</fpage>             <lpage>731</lpage>          </element-citation></ref>
<ref id="pone.0003527-Cross1"><label>24</label><element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author">
<name name-style="western"><surname>Cross</surname><given-names>M</given-names></name>
<name name-style="western"><surname>Taylor</surname><given-names>MC</given-names></name>
<name name-style="western"><surname>Borst</surname><given-names>P</given-names></name>
</person-group>             <year>1998</year>             <article-title>Frequent loss of the active site during variant surface glycoprotein expression site switching in vitro in Trypanosoma brucei.</article-title>             <source>Molecular &amp; Cellular Biology</source>             <volume>18</volume>             <fpage>198</fpage>             <lpage>205</lpage>          </element-citation></ref>
<ref id="pone.0003527-Myler1"><label>25</label><element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author">
<name name-style="western"><surname>Myler</surname><given-names>PJ</given-names></name>
<name name-style="western"><surname>Aline</surname><given-names>RF</given-names><suffix>Jr</suffix></name>
<name name-style="western"><surname>Scholler</surname><given-names>JK</given-names></name>
<name name-style="western"><surname>Stuart</surname><given-names>KD</given-names></name>
</person-group>             <year>1988</year>             <article-title>Multiple events associated with antigenic switching in Trypanosoma brucei.</article-title>             <source>Mol Biochem Parasitol</source>             <volume>29</volume>             <fpage>227</fpage>             <lpage>241</lpage>          </element-citation></ref>
<ref id="pone.0003527-Lamont1"><label>26</label><element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author">
<name name-style="western"><surname>Lamont</surname><given-names>GS</given-names></name>
<name name-style="western"><surname>Tucker</surname><given-names>RS</given-names></name>
<name name-style="western"><surname>Cross</surname><given-names>GAM</given-names></name>
</person-group>             <year>1986</year>             <article-title>Analysis of antigen switching rates in Trypanosoma brucei.</article-title>             <source>Parasitology</source>             <volume>92</volume>             <fpage>355</fpage>             <lpage>367</lpage>          </element-citation></ref>
<ref id="pone.0003527-Berriman2"><label>27</label><element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author">
<name name-style="western"><surname>Berriman</surname><given-names>M</given-names></name>
<name name-style="western"><surname>Hall</surname><given-names>N</given-names></name>
<name name-style="western"><surname>Sheader</surname><given-names>K</given-names></name>
<name name-style="western"><surname>Bringaud</surname><given-names>F</given-names></name>
<name name-style="western"><surname>Tiwari</surname><given-names>B</given-names></name>
<etal/></person-group>             <year>2002</year>             <article-title>The architecture of variant surface glycoprotein gene expression sites in Trypanosoma brucei.</article-title>             <source>Mol Biochem Parasitol</source>             <volume>122</volume>             <fpage>131</fpage>             <lpage>140</lpage>          </element-citation></ref>
<ref id="pone.0003527-Gottesdiener2"><label>28</label><element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author">
<name name-style="western"><surname>Gottesdiener</surname><given-names>KM</given-names></name>
<name name-style="western"><surname>Goriparthi</surname><given-names>L</given-names></name>
<name name-style="western"><surname>Masucci</surname><given-names>JP</given-names></name>
<name name-style="western"><surname>Van der Ploeg</surname><given-names>LH</given-names></name>
</person-group>             <year>1992</year>             <article-title>A proposed mechanism for promoter-associated DNA rearrangement events at a variant surface glycoprotein gene expression site.</article-title>             <source>Mol Cell Biol</source>             <volume>12</volume>             <fpage>4784</fpage>             <lpage>4795</lpage>          </element-citation></ref>
<ref id="pone.0003527-Ansorge1"><label>29</label><element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author">
<name name-style="western"><surname>Ansorge</surname><given-names>I</given-names></name>
<name name-style="western"><surname>Steverding</surname><given-names>D</given-names></name>
<name name-style="western"><surname>Melville</surname><given-names>S</given-names></name>
<name name-style="western"><surname>Hartmann</surname><given-names>C</given-names></name>
<name name-style="western"><surname>Clayton</surname><given-names>C</given-names></name>
</person-group>             <year>1999</year>             <article-title>Transcription of ‘inactive’ expression sites in African trypanosomes leads to expression of multiple transferrin receptor RNAs in bloodstream forms.</article-title>             <source>Mol Biochem Parasitol</source>             <volume>101</volume>             <fpage>81</fpage>             <lpage>94</lpage>          </element-citation></ref>
<ref id="pone.0003527-Marcello1"><label>30</label><element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author">
<name name-style="western"><surname>Marcello</surname><given-names>L</given-names></name>
<name name-style="western"><surname>Barry</surname><given-names>JD</given-names></name>
</person-group>             <year>2007</year>             <article-title>Analysis of the VSG gene silent archive in Trypanosoma brucei reveals that mosaic gene expression is prominent in antigenic variation and is favored by archive substructure.</article-title>             <source>Genome Res</source>             <volume>17</volume>             <fpage>1344</fpage>             <lpage>1352</lpage>          </element-citation></ref>
<ref id="pone.0003527-KosakovskyPond1"><label>31</label><element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author">
<name name-style="western"><surname>Kosakovsky Pond</surname><given-names>SL</given-names></name>
<name name-style="western"><surname>Posada</surname><given-names>D</given-names></name>
<name name-style="western"><surname>Gravenor</surname><given-names>MB</given-names></name>
<name name-style="western"><surname>Woelk</surname><given-names>CH</given-names></name>
<name name-style="western"><surname>Frost</surname><given-names>SD</given-names></name>
</person-group>             <year>2006</year>             <article-title>Automated phylogenetic detection of recombination using a genetic algorithm.</article-title>             <source>Mol Biol Evol</source>             <volume>23</volume>             <fpage>1891</fpage>             <lpage>1901</lpage>          </element-citation></ref>
<ref id="pone.0003527-Bruen1"><label>32</label><element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author">
<name name-style="western"><surname>Bruen</surname><given-names>TC</given-names></name>
<name name-style="western"><surname>Philippe</surname><given-names>H</given-names></name>
<name name-style="western"><surname>Bryant</surname><given-names>D</given-names></name>
</person-group>             <year>2006</year>             <article-title>A simple and robust statistical test for detecting the presence of recombination.</article-title>             <source>Genetics</source>             <volume>172</volume>             <fpage>2665</fpage>             <lpage>2681</lpage>          </element-citation></ref>
<ref id="pone.0003527-Melville2"><label>33</label><element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author">
<name name-style="western"><surname>Melville</surname><given-names>SE</given-names></name>
<name name-style="western"><surname>Leech</surname><given-names>V</given-names></name>
<name name-style="western"><surname>Gerrard</surname><given-names>CS</given-names></name>
<name name-style="western"><surname>Tait</surname><given-names>A</given-names></name>
<name name-style="western"><surname>Blackwell</surname><given-names>JM</given-names></name>
</person-group>             <year>1998</year>             <article-title>The molecular karyotype of the megabase chromosomes of Trypanosoma brucei and the assignment of chromosome markers.</article-title>             <source>Molecular &amp; Biochemical Parasitology</source>             <volume>94</volume>             <fpage>155</fpage>             <lpage>173</lpage>          </element-citation></ref>
<ref id="pone.0003527-Callejas1"><label>34</label><element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author">
<name name-style="western"><surname>Callejas</surname><given-names>S</given-names></name>
<name name-style="western"><surname>Leech</surname><given-names>V</given-names></name>
<name name-style="western"><surname>Reitter</surname><given-names>C</given-names></name>
<name name-style="western"><surname>Melville</surname><given-names>S</given-names></name>
</person-group>             <year>2006</year>             <article-title>Hemizygous subtelomeres of an African trypanosome chromosome may account for over 75% of chromosome length.</article-title>             <source>Genome Res</source>             <volume>16</volume>             <fpage>1109</fpage>             <lpage>1118</lpage>          </element-citation></ref>
<ref id="pone.0003527-Haber1"><label>35</label><element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author">
<name name-style="western"><surname>Haber</surname><given-names>JE</given-names></name>
</person-group>             <year>2006</year>             <article-title>Chromosome breakage and repair.</article-title>             <source>Genetics</source>             <volume>173</volume>             <fpage>1181</fpage>             <lpage>1185</lpage>          </element-citation></ref>
<ref id="pone.0003527-Xong1"><label>36</label><element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author">
<name name-style="western"><surname>Xong</surname><given-names>HV</given-names></name>
<name name-style="western"><surname>Vanhamme</surname><given-names>L</given-names></name>
<name name-style="western"><surname>Chamekh</surname><given-names>M</given-names></name>
<name name-style="western"><surname>Chimfwembe</surname><given-names>CE</given-names></name>
<name name-style="western"><surname>Van Den Abbeele</surname><given-names>J</given-names></name>
<etal/></person-group>             <year>1998</year>             <article-title>A VSG expression site-associated gene confers resistance to human serum in Trypanosoma rhodesiense.</article-title>             <source>Cell</source>             <volume>95</volume>             <fpage>839</fpage>             <lpage>846</lpage>          </element-citation></ref>
<ref id="pone.0003527-Vanhamme1"><label>37</label><element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author">
<name name-style="western"><surname>Vanhamme</surname><given-names>L</given-names></name>
<name name-style="western"><surname>Poelvoorde</surname><given-names>P</given-names></name>
<name name-style="western"><surname>Pays</surname><given-names>A</given-names></name>
<name name-style="western"><surname>Tebabi</surname><given-names>P</given-names></name>
<name name-style="western"><surname>Van Xong</surname><given-names>H</given-names></name>
<etal/></person-group>             <year>2000</year>             <article-title>Differential RNA elongation controls the variant surface glycoprotein gene expression sites of Trypanosoma brucei.</article-title>             <source>Mol Microbiol</source>             <volume>36</volume>             <fpage>328</fpage>             <lpage>340</lpage>          </element-citation></ref>
<ref id="pone.0003527-vanLuenen1"><label>38</label><element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author">
<name name-style="western"><surname>van Luenen</surname><given-names>HG</given-names></name>
<name name-style="western"><surname>Kieft</surname><given-names>R</given-names></name>
<name name-style="western"><surname>Mussmann</surname><given-names>R</given-names></name>
<name name-style="western"><surname>Engstler</surname><given-names>M</given-names></name>
<name name-style="western"><surname>ter Riet</surname><given-names>B</given-names></name>
<etal/></person-group>             <year>2005</year>             <article-title>Trypanosomes change their transferrin receptor expression to allow effective uptake of host transferrin.</article-title>             <source>Mol Microbiol</source>             <volume>58</volume>             <fpage>151</fpage>             <lpage>165</lpage>          </element-citation></ref>
<ref id="pone.0003527-Barnes1"><label>39</label><element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author">
<name name-style="western"><surname>Barnes</surname><given-names>RL</given-names></name>
<name name-style="western"><surname>McCulloch</surname><given-names>R</given-names></name>
</person-group>             <year>2007</year>             <article-title>Trypanosoma brucei homologous recombination is dependent on substrate length and homology, though displays a differential dependence on mismatch repair as substrate length decreases.</article-title>             <source>Nucleic Acids Res</source>             <volume>35</volume>             <fpage>3478</fpage>             <lpage>3493</lpage>          </element-citation></ref>
<ref id="pone.0003527-Barry1"><label>40</label><element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author">
<name name-style="western"><surname>Barry</surname><given-names>JD</given-names></name>
<name name-style="western"><surname>Marcello</surname><given-names>L</given-names></name>
<name name-style="western"><surname>Morrison</surname><given-names>LJ</given-names></name>
<name name-style="western"><surname>Read</surname><given-names>AF</given-names></name>
<name name-style="western"><surname>Lythgoe</surname><given-names>K</given-names></name>
<etal/></person-group>             <year>2005</year>             <article-title>What the genome sequence is revealing about trypanosome antigenic variation.</article-title>             <source>Biochem Soc Trans</source>             <volume>33</volume>             <fpage>986</fpage>             <lpage>989</lpage>          </element-citation></ref>
<ref id="pone.0003527-Sheader1"><label>41</label><element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author">
<name name-style="western"><surname>Sheader</surname><given-names>K</given-names></name>
<name name-style="western"><surname>Vaughan</surname><given-names>S</given-names></name>
<name name-style="western"><surname>Minchin</surname><given-names>J</given-names></name>
<name name-style="western"><surname>Hughes</surname><given-names>K</given-names></name>
<name name-style="western"><surname>Gull</surname><given-names>K</given-names></name>
<etal/></person-group>             <year>2005</year>             <article-title>Variant surface glycoprotein RNA interference triggers a precytokinesis cell cycle arrest in African trypanosomes.</article-title>             <source>Proc Natl Acad Sci U S A</source>             <volume>102</volume>             <fpage>8716</fpage>             <lpage>8721</lpage>          </element-citation></ref>
<ref id="pone.0003527-Rudenko3"><label>42</label><element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author">
<name name-style="western"><surname>Rudenko</surname><given-names>G</given-names></name>
<name name-style="western"><surname>McCulloch</surname><given-names>R</given-names></name>
<name name-style="western"><surname>Dirks-Mulder</surname><given-names>A</given-names></name>
<name name-style="western"><surname>Borst</surname><given-names>P</given-names></name>
</person-group>             <year>1996</year>             <article-title>Telomere exchange can be an important mechanism of variant surface glycoprotein gene switching in Trypanosoma brucei.</article-title>             <source>Mol Biochem Parasitol</source>             <volume>80</volume>             <fpage>65</fpage>             <lpage>75</lpage>          </element-citation></ref>
<ref id="pone.0003527-Jackson1"><label>43</label><element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author">
<name name-style="western"><surname>Jackson</surname><given-names>AP</given-names></name>
</person-group>             <year>2007</year>             <article-title>Tandem gene arrays in Trypanosoma brucei: comparative phylogenomic analysis of duplicate sequence variation.</article-title>             <source>BMC Evol Biol</source>             <volume>7</volume>             <fpage>54</fpage>          </element-citation></ref>
<ref id="pone.0003527-Dreesen1"><label>44</label><element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author">
<name name-style="western"><surname>Dreesen</surname><given-names>O</given-names></name>
<name name-style="western"><surname>Li</surname><given-names>B</given-names></name>
<name name-style="western"><surname>Cross</surname><given-names>GA</given-names></name>
</person-group>             <year>2007</year>             <article-title>Telomere structure and function in trypanosomes: a proposal.</article-title>             <source>Nat Rev Microbiol</source>             <volume>5</volume>             <fpage>70</fpage>             <lpage>75</lpage>          </element-citation></ref>
<ref id="pone.0003527-Johnson1"><label>45</label><element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author">
<name name-style="western"><surname>Johnson</surname><given-names>JG</given-names></name>
<name name-style="western"><surname>Cross</surname><given-names>GA</given-names></name>
</person-group>             <year>1979</year>             <article-title>Selective cleavage of variant surface glycoproteins from Trypanosoma brucei.</article-title>             <source>Biochem J</source>             <volume>178</volume>             <fpage>689</fpage>             <lpage>697</lpage>          </element-citation></ref>
<ref id="pone.0003527-Hirumi1"><label>46</label><element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author">
<name name-style="western"><surname>Hirumi</surname><given-names>H</given-names></name>
<name name-style="western"><surname>Hirumi</surname><given-names>K</given-names></name>
</person-group>             <year>1989</year>             <article-title>Continuous cultivation of Trypanosoma brucei blood stream forms in a medium containing a low concentration of serum protein without feeder cell layers.</article-title>             <source>J Parasitol</source>             <volume>75</volume>             <fpage>985</fpage>             <lpage>989</lpage>          </element-citation></ref>
<ref id="pone.0003527-Wirtz1"><label>47</label><element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author">
<name name-style="western"><surname>Wirtz</surname><given-names>E</given-names></name>
<name name-style="western"><surname>Hartmann</surname><given-names>C</given-names></name>
<name name-style="western"><surname>Clayton</surname><given-names>C</given-names></name>
</person-group>             <year>1994</year>             <article-title>Gene expression mediated by bacteriophage T3 and T7 RNA polymerases in transgenic trypanosomes.</article-title>             <source>Nucleic Acids Res</source>             <volume>22</volume>             <fpage>3887</fpage>             <lpage>3894</lpage>          </element-citation></ref>
<ref id="pone.0003527-Leech1"><label>48</label><element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author">
<name name-style="western"><surname>Leech</surname><given-names>V</given-names></name>
<name name-style="western"><surname>Quail</surname><given-names>MA</given-names></name>
<name name-style="western"><surname>Melville</surname><given-names>SE</given-names></name>
</person-group>             <year>2004</year>             <article-title>Separation, digestion, and cloning of intact parasite chromosomes embedded in agarose.</article-title>             <source>Methods Mol Biol</source>             <volume>270</volume>             <fpage>335</fpage>             <lpage>352</lpage>          </element-citation></ref>
<ref id="pone.0003527-Rutherford1"><label>49</label><element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author">
<name name-style="western"><surname>Rutherford</surname><given-names>K</given-names></name>
<name name-style="western"><surname>Parkhill</surname><given-names>J</given-names></name>
<name name-style="western"><surname>Crook</surname><given-names>J</given-names></name>
<name name-style="western"><surname>Horsnell</surname><given-names>T</given-names></name>
<name name-style="western"><surname>Rice</surname><given-names>P</given-names></name>
<etal/></person-group>             <year>2000</year>             <article-title>Artemis: sequence visualization and annotation.</article-title>             <source>Bioinformatics</source>             <volume>16</volume>             <fpage>944</fpage>             <lpage>945</lpage>          </element-citation></ref>
<ref id="pone.0003527-Rice1"><label>50</label><element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author">
<name name-style="western"><surname>Rice</surname><given-names>P</given-names></name>
<name name-style="western"><surname>Longden</surname><given-names>I</given-names></name>
<name name-style="western"><surname>Bleasby</surname><given-names>A</given-names></name>
</person-group>             <year>2000</year>             <article-title>EMBOSS: the European Molecular Biology Open Software Suite.</article-title>             <source>Trends Genet</source>             <volume>16</volume>             <fpage>276</fpage>             <lpage>277</lpage>          </element-citation></ref>
<ref id="pone.0003527-Dreesen2"><label>51</label><element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author">
<name name-style="western"><surname>Dreesen</surname><given-names>O</given-names></name>
<name name-style="western"><surname>Cross</surname><given-names>GA</given-names></name>
</person-group>             <year>2006</year>             <article-title>Telomerase-independent stabilization of short telomeres in Trypanosoma brucei.</article-title>             <source>Mol Cell Biol</source>             <volume>26</volume>             <fpage>4911</fpage>             <lpage>4919</lpage>          </element-citation></ref>
<ref id="pone.0003527-Thompson1"><label>52</label><element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author">
<name name-style="western"><surname>Thompson</surname><given-names>JD</given-names></name>
<name name-style="western"><surname>Gibson</surname><given-names>TJ</given-names></name>
<name name-style="western"><surname>Plewniak</surname><given-names>F</given-names></name>
<name name-style="western"><surname>Jeanmougin</surname><given-names>F</given-names></name>
<name name-style="western"><surname>Higgins</surname><given-names>DG</given-names></name>
</person-group>             <year>1997</year>             <article-title>The CLUSTAL_X windows interface: flexible strategies for multiple sequence alignment aided by quality analysis tools.</article-title>             <source>Nucleic Acids Res</source>             <volume>25</volume>             <fpage>4876</fpage>             <lpage>4882</lpage>          </element-citation></ref>
<ref id="pone.0003527-Guindon1"><label>53</label><element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author">
<name name-style="western"><surname>Guindon</surname><given-names>S</given-names></name>
<name name-style="western"><surname>Lethiec</surname><given-names>F</given-names></name>
<name name-style="western"><surname>Duroux</surname><given-names>P</given-names></name>
<name name-style="western"><surname>Gascuel</surname><given-names>O</given-names></name>
</person-group>             <year>2005</year>             <article-title>PHYML Online–a web server for fast maximum likelihood-based phylogenetic inference.</article-title>             <source>Nucleic Acids Res</source>             <volume>33</volume>             <fpage>W557</fpage>             <lpage>559</lpage>          </element-citation></ref>
<ref id="pone.0003527-Shimodaira1"><label>54</label><element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author">
<name name-style="western"><surname>Shimodaira</surname><given-names>H</given-names></name>
<name name-style="western"><surname>Hasegawa</surname><given-names>M</given-names></name>
</person-group>             <year>2001</year>             <article-title>CONSEL: for assessing the confidence of phylogenetic tree selection.</article-title>             <source>Bioinformatics</source>             <volume>17</volume>             <fpage>1246</fpage>             <lpage>1247</lpage>          </element-citation></ref>
<ref id="pone.0003527-Pond1"><label>55</label><element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author">
<name name-style="western"><surname>Pond</surname><given-names>SL</given-names></name>
<name name-style="western"><surname>Frost</surname><given-names>SD</given-names></name>
<name name-style="western"><surname>Muse</surname><given-names>SV</given-names></name>
</person-group>             <year>2005</year>             <article-title>HyPhy: hypothesis testing using phylogenies.</article-title>             <source>Bioinformatics</source>             <volume>21</volume>             <fpage>676</fpage>             <lpage>679</lpage>          </element-citation></ref>
<ref id="pone.0003527-Scheffler1"><label>56</label><element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author">
<name name-style="western"><surname>Scheffler</surname><given-names>K</given-names></name>
<name name-style="western"><surname>Martin</surname><given-names>DP</given-names></name>
<name name-style="western"><surname>Seoighe</surname><given-names>C</given-names></name>
</person-group>             <year>2006</year>             <article-title>Robust inference of positive selection from recombining coding sequences.</article-title>             <source>Bioinformatics</source>             <volume>22</volume>             <fpage>2493</fpage>             <lpage>2499</lpage>          </element-citation></ref>
<ref id="pone.0003527-Wong1"><label>57</label><element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author">
<name name-style="western"><surname>Wong</surname><given-names>WS</given-names></name>
<name name-style="western"><surname>Yang</surname><given-names>Z</given-names></name>
<name name-style="western"><surname>Goldman</surname><given-names>N</given-names></name>
<name name-style="western"><surname>Nielsen</surname><given-names>R</given-names></name>
</person-group>             <year>2004</year>             <article-title>Accuracy and power of statistical methods for detecting adaptive evolution in protein coding sequences and for identifying positively selected sites.</article-title>             <source>Genetics</source>             <volume>168</volume>             <fpage>1041</fpage>             <lpage>1051</lpage>          </element-citation></ref>
<ref id="pone.0003527-Aitcheson1"><label>58</label><element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author">
<name name-style="western"><surname>Aitcheson</surname><given-names>N</given-names></name>
<name name-style="western"><surname>Talbot</surname><given-names>S</given-names></name>
<name name-style="western"><surname>Shapiro</surname><given-names>J</given-names></name>
<name name-style="western"><surname>Hughes</surname><given-names>K</given-names></name>
<name name-style="western"><surname>Adkin</surname><given-names>C</given-names></name>
<etal/></person-group>             <year>2005</year>             <article-title>VSG switching in Trypanosoma brucei: antigenic variation analysed using RNAi in the absence of immune selection.</article-title>             <source>Mol Microbiol</source>             <volume>57</volume>             <fpage>1608</fpage>             <lpage>1622</lpage>          </element-citation></ref>
</ref-list>

</back>
</article>