<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article
  PUBLIC "-//NLM//DTD Journal Publishing DTD v3.0 20080202//EN" "http://dtd.nlm.nih.gov/publishing/3.0/journalpublishing3.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="3.0" xml:lang="EN"><front><journal-meta><journal-id journal-id-type="publisher-id">plos</journal-id><journal-id journal-id-type="publisher">pcbi</journal-id><journal-id journal-id-type="flc">plcb</journal-id><journal-id journal-id-type="nlm-ta">PLoS Comput Biol</journal-id><journal-id journal-id-type="pmc">ploscomp</journal-id><!--===== Grouping journal title elements =====--><journal-title-group><journal-title>PLoS Computational Biology</journal-title></journal-title-group><issn pub-type="ppub">1553-734X</issn><issn pub-type="epub">1553-7358</issn><publisher><publisher-name>Public Library of Science</publisher-name><publisher-loc>San Francisco, USA</publisher-loc></publisher></journal-meta><article-meta><article-id pub-id-type="doi">10.1371/journal.pcbi.0020086</article-id><article-id pub-id-type="publisher-id">06-PLCB-RA-0003R3</article-id><article-id pub-id-type="sici">plcb-02-07-04</article-id><article-categories><subj-group subj-group-type="heading"><subject>Research Article</subject></subj-group><subj-group subj-group-type="Discipline"><subject>Genetics and Genomics/Comparative Genomics</subject><subject>Molecular Biology</subject></subj-group><subj-group subj-group-type="System Taxonomy"><subject>Caenorhabditis</subject></subj-group></article-categories><title-group><article-title>Intronic Alternative Splicing Regulators Identified by Comparative Genomics in Nematodes</article-title><alt-title alt-title-type="running-head">Intronic Alternative Splicing Regulators</alt-title></title-group><contrib-group><contrib contrib-type="author" xlink:type="simple"><name name-style="western"><surname>Kabat</surname><given-names>Jennifer L</given-names></name><xref ref-type="aff" rid="aff1"><sup>1</sup></xref></contrib><contrib contrib-type="author" xlink:type="simple"><name name-style="western"><surname>Barberan-Soler</surname><given-names>Sergio</given-names></name><xref ref-type="aff" rid="aff1"><sup>1</sup></xref></contrib><contrib contrib-type="author" xlink:type="simple"><name name-style="western"><surname>McKenna</surname><given-names>Paul</given-names></name><xref ref-type="aff" rid="aff2"><sup>2</sup></xref><xref ref-type="fn" rid="n105"><sup>¤a</sup></xref></contrib><contrib contrib-type="author" xlink:type="simple"><name name-style="western"><surname>Clawson</surname><given-names>Hiram</given-names></name><xref ref-type="aff" rid="aff2"><sup>2</sup></xref></contrib><contrib contrib-type="author" xlink:type="simple"><name name-style="western"><surname>Farrer</surname><given-names>Tracy</given-names></name><xref ref-type="aff" rid="aff1"><sup>1</sup></xref><xref ref-type="fn" rid="n106"><sup>¤b</sup></xref></contrib><contrib contrib-type="author" xlink:type="simple"><name name-style="western"><surname>Zahler</surname><given-names>Alan M</given-names></name><xref ref-type="aff" rid="aff1"><sup>1</sup></xref><xref ref-type="corresp" rid="cor1"><sup>*</sup></xref></contrib></contrib-group><aff id="aff1">
				<label>1</label><addr-line>Department of Molecular, Cell, and Developmental Biology and Center for Molecular Biology of RNA, University of California Santa Cruz, Santa Cruz, California, United States of America
			</addr-line></aff><aff id="aff2">
				<label>2</label><addr-line>Center for Biomolecular Science and Engineering, University of California Santa Cruz, Santa Cruz, California, United States of America
			</addr-line></aff><contrib-group><contrib contrib-type="editor" xlink:type="simple"><name name-style="western"><surname>Stormo</surname><given-names>Gary</given-names></name><role>Editor</role><xref ref-type="aff" rid="edit1"/></contrib></contrib-group><aff id="edit1">Washington University in St. Louis School of Medicine, United States of America</aff><author-notes><fn fn-type="con" id="ack1"><p>JLK, SBS, PM, and AMZ conceived and designed the experiments. JLK, SBS, PM, and TF performed the experiments. JLK, SBS, HC, TF, and AMZ analyzed the data. SBS and HC contributed reagents/materials/analysis tools. JLK and AMZ wrote the paper.</p></fn><corresp id="cor1">* To whom correspondence should be addressed. E-mail: <email xlink:type="simple">zahler@biology.ucsc.edu</email></corresp><fn fn-type="current-aff" id="n105"><p>¤a Current address: Department of Biology and Center for Computing for Life Sciences, San Francisco State University, San Francisco, California, United States of America</p></fn><fn fn-type="current-aff" id="n106"><p>¤b Current address: University of Virginia School of Medicine, Charlottesville, Virginia, United States of America</p></fn><fn fn-type="conflict" id="ack3"><p> The authors have declared that no competing interests exist.</p></fn></author-notes><pub-date pub-type="ppub"><month>7</month><year>2006</year></pub-date><pub-date pub-type="epub"><day>14</day><month>7</month><year>2006</year></pub-date><pub-date pub-type="epreprint"><day>5</day><month>6</month><year>2006</year></pub-date><volume>2</volume><issue>7</issue><elocation-id>e86</elocation-id><history><date date-type="received"><day>4</day><month>1</month><year>2006</year></date><date date-type="accepted"><day>30</day><month>5</month><year>2006</year></date></history><!--===== Grouping copyright info into permissions =====--><permissions><copyright-year>2006</copyright-year><copyright-holder>Kabat et al</copyright-holder><license><license-p>This is an open-access article distributed under the terms of the Creative Commons Attribution License, which permits unrestricted use, distribution, and reproduction in any medium, provided the original author and source are credited.</license-p></license></permissions><abstract><p>Many alternative splicing events are regulated by pentameric and hexameric intronic sequences that serve as binding sites for splicing regulatory factors. We hypothesized that intronic elements that regulate alternative splicing are under selective pressure for evolutionary conservation. Using a Wobble Aware Bulk Aligner genomic alignment of <named-content content-type="genus-species" xlink:type="simple">Caenorhabditis elegans</named-content> and <italic>Caenorhabditis briggsae,</italic> we identified 147 alternatively spliced cassette exons that exhibit short regions of high nucleotide conservation in the introns flanking the alternative exon. In vivo experiments on the alternatively spliced <italic>let-2</italic> gene confirm that these conserved regions can be important for alternative splicing regulation. Conserved intronic element sequences were collected into a dataset and the occurrence of each pentamer and hexamer motif was counted. We compared the frequency of pentamers and hexamers in the conserved intronic elements to a dataset of all <named-content content-type="genus-species" xlink:type="simple">C. elegans</named-content> intron sequences in order to identify short intronic motifs that are more likely to be associated with alternative splicing. High-scoring motifs were examined for upstream or downstream preferences in introns surrounding alternative exons. Many of the high- scoring nematode pentamer and hexamer motifs correspond to known mammalian splicing regulatory sequences, such as (T)GCATG, indicating that the mechanism of alternative splicing regulation is well conserved in metazoans. A comparison of the analysis of the conserved intronic elements, and analysis of the entire introns flanking these same exons, reveals that focusing on intronic conservation can increase the sensitivity of detecting putative splicing regulatory motifs. This approach also identified novel sequences whose role in splicing is under investigation and has allowed us to take a step forward in defining a catalog of splicing regulatory elements for an organism. In vivo experiments confirm that one novel high-scoring sequence from our analysis, (T)CTATC, is important for alternative splicing regulation of the <italic>unc-52</italic> gene.</p></abstract><abstract abstract-type="synopsis"><title>Synopsis</title><p>Alternative splicing of precursor messenger RNA is a process by which multiple protein isoforms are generated from a single gene. As many as 60% of human genes are processed in this manner, creating tissue-specific isoforms of proteins that may be a key factor in regulating the complexity of our physiology. One of the major challenges to understanding this process is to identify the sequences on the precursor messenger RNA responsible for splicing regulation. Some of these regulatory sequences occur in regions that are spliced out (called introns). This study tested the hypothesis that there should be evolutionary pressure to maintain these intronic regulatory sequences, even though intron sequence is non-coding and rapidly diverges between species. The authors employed a genomic alignment of two roundworms, <named-content content-type="genus-species" xlink:type="simple">Caenorhabditis elegans</named-content> and <italic>Caenorhabditis briggsae,</italic> to investigate the regulation of alternative splicing. By examining evolutionarily conserved stretches of introns flanking alternatively spliced exons, the authors identified and functionally confirmed splicing regulatory sequences. Many of the top scoring sequences match known mammalian regulators, suggesting the alternative splicing regulatory mechanism is conserved across all metazoans. Other sequences were not previously identified in mammals and may represent new alternative splicing regulatory elements in higher organisms or ones that may be specific to worms.</p></abstract><funding-group><funding-statement>This research is supported by National Institutes of Health grants R01-GM61646 to AMZ and P41-HG02731 to the UCSC Center for Genomic Science. SB is supported by a UC Mexus-CONACYT Doctoral Fellowship.</funding-statement></funding-group><counts><page-count count="14"/></counts><!--===== Restructure custom-meta-wrap to custom-meta-group =====--><custom-meta-group><custom-meta><meta-name>citation</meta-name><meta-value>Kabat JL, Barberan-Soler S, McKenna P, Clawson H, Farrer T, et al. (2006): Intronic alternative splicing regulators identified by comparative genomics in nematodes. PLoS Comput Biol 2(7): e86. DOI: <ext-link ext-link-type="doi" xlink:href="http://dx.doi.org/10.1371/journal.pcbi.0020086" xlink:type="simple">10.1371/journal.pcbi.0020086</ext-link></meta-value></custom-meta></custom-meta-group></article-meta></front><body><sec id="s1"><title>Introduction</title><p>One of the interesting lessons learned from the analysis of the human genome is that we may possess fewer than 25,000 genes [<xref ref-type="bibr" rid="pcbi-0020086-b001">1</xref>]. One mechanism to dramatically increase the complexity of the human proteome from this lower-than-expected number of genes is to allow some genes to encode multiple proteins. This process can be accomplished by alternative precursor messenger RNA (pre-mRNA) splicing. Studies that use expressed sequence tag (EST) alignments to identify alternatively spliced genes have led researchers to predict that up to 60% of human genes are alternatively spliced [<xref ref-type="bibr" rid="pcbi-0020086-b002">2</xref>–<xref ref-type="bibr" rid="pcbi-0020086-b005">5</xref>]. Alternative splicing events can be regulated in tissue-specific, developmental, and hormone-responsive manners, providing additional mechanisms for the regulation of gene expression [<xref ref-type="bibr" rid="pcbi-0020086-b006">6</xref>,<xref ref-type="bibr" rid="pcbi-0020086-b007">7</xref>]. Understanding alternative splicing and its regulation is a key component to understanding metazoan genomes.</p><p>The current models for alternative splicing regulation are based on the interactions of intronic or exonic RNA sequences, known as <italic>cis</italic> elements, with splicing regulatory proteins known as <italic>trans</italic>-acting splicing factors [<xref ref-type="bibr" rid="pcbi-0020086-b008">8</xref>]. The binding of splicing factors to the pre-mRNA regulates the ability of the spliceosomal machinery to recognize and promote alternative splicing. The role of intronic elements in regulating splicing is well established and has been shown to work in a combinatorial fashion based on the <italic>trans</italic>-acting factors that are present. For example, the inclusion of the 18-nucleotide-long, neural-specific N1 exon of the human <italic>c-SRC</italic> gene is regulated by the downstream control sequence found in the intron downstream of the N1 exon. This sequence serves as a recruitment site for both constitutive and neuronal cell-specific splicing factors such as nPTB, FOX-1, and FOX-2 [<xref ref-type="bibr" rid="pcbi-0020086-b009">9</xref>–<xref ref-type="bibr" rid="pcbi-0020086-b012">12</xref>]. The vertebrate RNA-binding protein FOX-1 can also regulate muscle-specific alternative splicing through interactions with the RNA sequence GCAUG [<xref ref-type="bibr" rid="pcbi-0020086-b013">13</xref>], and repeats of this sequence have been shown to be important for alternative splicing regulation of the fibronectin exon EIIIB and the rat calcitonin/CGRP exon 4 [<xref ref-type="bibr" rid="pcbi-0020086-b014">14</xref>,<xref ref-type="bibr" rid="pcbi-0020086-b015">15</xref>]. Many other examples of complex and combinatorial regulation of alternative splicing through intronic <italic>cis</italic> elements have been demonstrated, and combinatorial interactions between proteins such as Nova-1, polypyrimidine tract binding protein (PTB), and ETR-3, with specific <italic>cis</italic> sequences, are important for alternative splicing regulation [<xref ref-type="bibr" rid="pcbi-0020086-b016">16</xref>–<xref ref-type="bibr" rid="pcbi-0020086-b020">20</xref>].</p><p>Intronic sequences are non-coding, and therefore they should have less evolutionary selective pressure to maintain their sequence. An exception to this should be intronic sequences that regulate alternative splicing. In an analysis of alternatively spliced human cassette exons, it was found that on average, approximately 100 nucleotides of intron sequence, flanking either side of the exon, tend to be highly conserved between the mouse and human genomes, with 88% identity in the upstream sequences and 80% identity in the downstream sequences [<xref ref-type="bibr" rid="pcbi-0020086-b021">21</xref>]. Some clues to potential splicing regulatory motifs arise from these studies. For example, Sorek and Ast found that the sequence TGCATG was the second most common hexamer in the first 100 nucleotides downstream of alternatively spliced exons, appearing in 18% of these intronic regions [<xref ref-type="bibr" rid="pcbi-0020086-b021">21</xref>]. Another study of aligned mouse/human alternative exons found that GCATG is the most overrepresented pentamer in the proximal conserved region of the intron downstream of alternative exons [<xref ref-type="bibr" rid="pcbi-0020086-b022">22</xref>]. A third study found that TGCATG is frequently located in introns flanking brain-enriched alternative exons, and its presence and spacing are highly conserved in these genes from fish to man [<xref ref-type="bibr" rid="pcbi-0020086-b023">23</xref>].</p><p>Using the nematode <named-content content-type="genus-species" xlink:type="simple">Caenorhabditis elegans</named-content> as a model system, we have been working to take advantage of comparative genomics to identify <italic>cis</italic>-acting regulators of alternative splicing. The <named-content content-type="genus-species" xlink:type="simple">C. elegans</named-content> gene structure, splicing machinery, and gene expression regulation is similar to that of other higher eukaryotes, with the exception that the average intron size is smaller. Our lab has previously developed methods for identification of alternatively spliced genes in <named-content content-type="genus-species" xlink:type="simple">C. elegans</named-content> by aligning the genome sequence with ESTs and mRNA sequence [<xref ref-type="bibr" rid="pcbi-0020086-b024">24</xref>]. We developed an algorithm, the Wobble Aware Bulk Aligner (WABA), for creating interspecies genome alignments between <named-content content-type="genus-species" xlink:type="simple">C. elegans</named-content> and the related roundworm, <named-content content-type="genus-species" xlink:type="simple">Caenorhabditis briggsae</named-content> [<xref ref-type="bibr" rid="pcbi-0020086-b025">25</xref>]. WABA employs a hidden Markov model (HMM) to identify aligned regions as coding, high homology, low homology, and no homology. It also factors the AT richness of <named-content content-type="genus-species" xlink:type="simple">C. elegans</named-content> introns into its calculations when it defines an intronic region as “high” homology [<xref ref-type="bibr" rid="pcbi-0020086-b025">25</xref>]. <named-content content-type="genus-species" xlink:type="simple">C. briggsae</named-content> and <named-content content-type="genus-species" xlink:type="simple">C. elegans</named-content> diverged approximately 100 million years ago, yet are indistinguishable by eye [<xref ref-type="bibr" rid="pcbi-0020086-b026">26</xref>]. Alignment of these two genomes revealed that exonic sequences are highly conserved between these species, but intronic and intergenic sequences are rarely conserved [<xref ref-type="bibr" rid="pcbi-0020086-b025">25</xref>]. We found that these rare, high homology sequences in introns are more likely to occur in the introns flanking alternatively spliced exons than in total introns [<xref ref-type="bibr" rid="pcbi-0020086-b025">25</xref>]. We hypothesized that these conserved intronic regions were <italic>cis</italic>-acting regulatory elements for alternative splicing. This nematode alignment, with relatively limited regions of high homology, provides the possibility for more specific pinpointing of intronic splicing regulatory elements than the much longer 100-nucleotide-long conserved regions flanking alternative exons in mouse/human alignments [<xref ref-type="bibr" rid="pcbi-0020086-b021">21</xref>].</p><p>In this paper, we present the analysis of conserved regions of introns flanking alternatively spliced exons in <named-content content-type="genus-species" xlink:type="simple">C. elegans</named-content> and correlate these conserved regions with alternative splicing regulation. We collected these conserved sequence regions into a database and searched for overrepresented pentamers and hexamers relative to a total intron database, similar to the method used by Burge's group to identify exonic splicing enhancers [<xref ref-type="bibr" rid="pcbi-0020086-b027">27</xref>]. This allowed us to create a table of potential intronic alternative splicing <italic>cis</italic>-regulatory motifs. Since many RNA recognition motif–containing splicing factors recognize specific sequences on the order of 4–6 nucleotides in length [<xref ref-type="bibr" rid="pcbi-0020086-b011">11</xref>,<xref ref-type="bibr" rid="pcbi-0020086-b013">13</xref>,<xref ref-type="bibr" rid="pcbi-0020086-b018">18</xref>,<xref ref-type="bibr" rid="pcbi-0020086-b028">28</xref>–<xref ref-type="bibr" rid="pcbi-0020086-b032">32</xref>], the high-scoring motifs in this catalog may represent specific binding sites for particular splicing factors. Several of our highest scoring motifs in this analysis correlate with known vertebrate splicing regulatory elements, for example, (T)GCATG [<xref ref-type="bibr" rid="pcbi-0020086-b023">23</xref>], but several have not been previously identified. A number of candidates identified by this method were tested in an in vivo splicing reporter system in <named-content content-type="genus-species" xlink:type="simple">C. elegans</named-content>. We have used this analysis to identify and confirm a new, highly conserved, alternative splicing regulatory element, (T)CTATC. We show that this sequence works in coordination with GCATG to regulate the alternative splicing of the <italic>unc-52</italic> gene.</p></sec><sec id="s2"><title>Results</title><sec id="s2a"><title>Identification of Highly Conserved Regions in Introns Flanking Alternatively Spliced Exons</title><p>In order to identify alternatively spliced cassette exons in the <named-content content-type="genus-species" xlink:type="simple">C. elegans</named-content> genome, we used the Intronerator [<xref ref-type="bibr" rid="pcbi-0020086-b024">24</xref>] to generate an initial set of 1,471 putative alternatively spliced genes. We did this by aligning over 200,000 ESTs and mRNAs to the <named-content content-type="genus-species" xlink:type="simple">C. elegans</named-content> genome and identifying regions where the alignments are consistent with more than one way to process a gene. The program could not distinguish between alternative splicing and alternative promoters, so we analyzed each of these alignments individually to verify alternative splicing. We found 449 examples of genes with strong cDNA evidence for alternative cassette exons, and 454 examples of genes with alternative promoters, which usually had unique first exons that are spliced to common second exons. Of the genes with alternative splicing, 162 also contained alternative promoter usage. The remaining genes in the initial set of putative alternatively spliced genes were mostly due to unusual ESTs in the database that did not fit a gene model. We also saw evidence of ESTs that showed internal deletions at short direct repeats. To the program, these indicated the potential for intron removal, but upon further inspection, these did not meet the criteria of introns (start with the dinucleotides GT or GC and end with AG) and were likely the result of cloning artifacts of the ESTs.</p><p>Intronic regions that are highly conserved between <named-content content-type="genus-species" xlink:type="simple">C. elegans</named-content> and <named-content content-type="genus-species" xlink:type="simple">C. briggsae</named-content> are rarely identified by WABA [<xref ref-type="bibr" rid="pcbi-0020086-b025">25</xref>]. While analyzing our alternative cassette exon database, we were struck by the fact that we could identify many examples of WABA-defined high homology sequences in introns flanking the alternatively spliced cassette exons, suggesting strong evolutionary conservation. For 142 of the 449 alternatively spliced genes, WABA identified a highly conserved sequence in flanking introns upstream or downstream of 147 alternative cassette exons. <xref ref-type="fig" rid="pcbi-0020086-g001">Figure 1</xref> shows several examples of screen shots from the Intronerator browser of cDNA-confirmed <named-content content-type="genus-species" xlink:type="simple">C. elegans</named-content> alternatively spliced isoforms (in blue) and a graphical representation of the WABA alignments between <named-content content-type="genus-species" xlink:type="simple">C. elegans</named-content> and <named-content content-type="genus-species" xlink:type="simple">C. briggsae</named-content> (in purple). Dark purple regions, indicating high homology, can be seen in these introns either upstream or downstream of the alternative exon. Sometimes a single conserved element is identified by WABA, while for other cases multiple regions in the introns are conserved.</p><fig id="pcbi-0020086-g001" position="float"><object-id pub-id-type="doi">10.1371/journal.pcbi.0020086.g001</object-id><label>Figure 1</label><caption><title>Images from the Intronerator Genome Browser Showing Alternatively Spliced Genes</title><p>Gene isoforms predicted by the Wormbase Consortium are shown in blue, and WABA homology alignments for <named-content content-type="genus-species" xlink:type="simple">C. briggsae</named-content> to this region of the <named-content content-type="genus-species" xlink:type="simple">C. elegans</named-content> genome are shown in purple. Dark purple indicates a region of WABA high homology, light purple corresponds to low homology, and white indicates no homology between species. Regions of alternatively spliced genes: (A) W01F3.1, (B) ZC477.9, (C) ZK637.8, (D) H24G06.1, and (E) C11D2.6 are shown.</p></caption><graphic mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pcbi.0020086.g001" xlink:type="simple"/></fig><p>An important question is whether these 147 <named-content content-type="genus-species" xlink:type="simple">C. elegans</named-content> alternative cassette exons are also alternatively spliced in <italic>C. briggsae.</italic> Due to a lack of <named-content content-type="genus-species" xlink:type="simple">C. briggsae</named-content> transcript data, we have no direct evidence for alternative splicing of these exons. Therefore, we examined the <named-content content-type="genus-species" xlink:type="simple">C. briggsae</named-content> homologs of these alternative exons for features of functional exons. A previous alignment of 8 MB of the <named-content content-type="genus-species" xlink:type="simple">C. briggsae</named-content> genome with the complete <named-content content-type="genus-species" xlink:type="simple">C. elegans</named-content> genome found that in coding exons there is 79.3% overall nucleotide identity [<xref ref-type="bibr" rid="pcbi-0020086-b025">25</xref>]. Consistent with these findings, cross-species alignment of these 147 alternative cassette exons revealed an average nucleotide identity between <named-content content-type="genus-species" xlink:type="simple">C. elegans</named-content> and <named-content content-type="genus-species" xlink:type="simple">C. briggsae</named-content> of 81.8%. Amino acid identity of the open reading frame of these exons was 85.4%. Maintenance of the reading frame for these exons also appears to be well conserved: 57.0% of the 147 exons are the exact same size, 34.3% differ by a multiple of three nucleotides, and only 8.8% differ by a non-multiple of three nucleotides (unpublished data). The high conservation of nucleotide sequence, amino acid sequence, and maintenance of open reading frame is consistent with these being coding exons in <named-content content-type="genus-species" xlink:type="simple">C. briggsae</named-content>.</p><p>One feature of alternative exons is that they are often flanked by weak splice sites which allow for splicing regulation (reviewed in [<xref ref-type="bibr" rid="pcbi-0020086-b033">33</xref>]). If these exons are alternatively spliced in <named-content content-type="genus-species" xlink:type="simple">C. briggsae</named-content> we would expect that they would be flanked by 3′ and 5′ splice sites of similar strength. We used the UCSC Genome Table Browser (<ext-link ext-link-type="uri" xlink:href="http://www.genome.ucsc.edu" xlink:type="simple">http://www.genome.ucsc.edu</ext-link>) in an attempt to automate rapid alignment of the splice junctions for these 147 exons in <named-content content-type="genus-species" xlink:type="simple">C. elegans</named-content> and <named-content content-type="genus-species" xlink:type="simple">C. briggsae</named-content>. For the majority of these alternative exons, this automated method was successful in identifying <named-content content-type="genus-species" xlink:type="simple">C. elegans</named-content> and <named-content content-type="genus-species" xlink:type="simple">C. briggsae</named-content> 5′ and 3′ splice sites for each exon, and we used these data to compare the similarity of splice sites between the two species. For 5′ splice sites we examined the last three nucleotides of the exon and first six nucleotides of the intron, as these base-pair with U1 small nuclear RNA during initial 5′ splice-site recognition[<xref ref-type="bibr" rid="pcbi-0020086-b031">31</xref>]. We found that these nine nucleotides were completely identical for 47.1% of the alternative exons and differed by only one nucleotide in 27.1% of the exons. For the 3′ splice sites, we examined the conservation of the last six nucleotides of the intron and the first nucleotide of the exon, as these are a binding site for the <named-content content-type="genus-species" xlink:type="simple">C. elegans</named-content> homolog of the heterodimeric U2 auxiliary factor (U2AF) involved in initial 3′ splice-site recognition [<xref ref-type="bibr" rid="pcbi-0020086-b034">34</xref>]. For 55.4% of the alternative exons examined, these seven nucleotides were completely identical, and for an additional 30.1% they differed by only one nucleotide. This strong conservation of splice-site sequence strength, along with regions of conservation in flanking introns, suggests that these exons may be substrates for alternative splicing in <named-content content-type="genus-species" xlink:type="simple">C. briggsae</named-content>.</p></sec><sec id="s2b"><title>The Role of Conserved Elements in Alternative Splicing Regulation</title><p>There are many examples of regions of introns flanking alternatively spliced exons that function as <italic>cis</italic>-acting regulators of alternative splicing. We hypothesized that the reason that these high homology WABA-identified intronic elements have been conserved over 100 million years of evolution is that they may regulate alternative splicing. In order to test this hypothesis, we looked at the <italic>C. elegans/C. briggsae</italic> alignment of the alternatively spliced region of the <named-content content-type="genus-species" xlink:type="simple">C. elegans</named-content> alpha(2) type IV collagen gene <italic>let-2. Let-2</italic> has two mutually exclusive alternative exons, exons 9 and 10, and their splicing pattern is evolutionarily conserved as far back as the distantly related parasitic nematode, <named-content content-type="genus-species" xlink:type="simple">Ascaris suum</named-content> [<xref ref-type="bibr" rid="pcbi-0020086-b035">35</xref>]. Messages incorporate either exon 9 or exon 10 in a developmentally regulated manner; embryos predominantly use exon 9, adults predominantly use exon 10, and there is a gradual shift in the usage of these two exons during the larval stages [<xref ref-type="bibr" rid="pcbi-0020086-b036">36</xref>]. The WABA alignment of this 400-base intron identifies four conserved regions in the intron between exons 10 and 11 (<xref ref-type="fig" rid="pcbi-0020086-g002">Figure 2</xref>). To test the role of these conserved intronic elements in alternative splicing regulation, we employed a splicing reporter construct system containing the alternatively spliced region between exons 8 and 11 that mimics the developmental control of alternative splicing for this region when transformed into <named-content content-type="genus-species" xlink:type="simple">C. elegans</named-content> [<xref ref-type="bibr" rid="pcbi-0020086-b037">37</xref>]. We mutated the first conserved element in this intron and monitored the developmental regulation of this splicing. Deletion of this conserved element, in which 28 of 34 bases have been conserved between <named-content content-type="genus-species" xlink:type="simple">C. elegans</named-content> and <italic>C. briggsae,</italic> results in a major reduction in the usage of exon 10 in L4 animals (unpublished data). The identical effect on splicing of an even smaller deletion within this element, del1.2, is shown in <xref ref-type="fig" rid="pcbi-0020086-g002">Figure 2</xref>. For the L4 time point, the developmental stage at which we should detect maximal exon 10 usage, only minimal splicing of this exon is detected. Since mutation of this element results in only minimal exon 10 inclusion, we hypothesize that either adults produce a splicing factor that interacts with this element to promote exon 10 splicing or that embryos produce a splicing repressor that inhibits exon 10 splicing. In the past, researchers have identified splicing regulatory elements by creating a series of mutations across an intron. In this computational approach, the interspecies genome alignments led us directly to a small element required for the developmentally regulated switch in this splicing.</p><fig id="pcbi-0020086-g002" position="float"><object-id pub-id-type="doi">10.1371/journal.pcbi.0020086.g002</object-id><label>Figure 2</label><caption><title>An Intronic Element Regulates <italic>let-2</italic> Alternative Splicing</title><p>The top of this figure shows the alignment of <named-content content-type="genus-species" xlink:type="simple">C. elegans</named-content> and <named-content content-type="genus-species" xlink:type="simple">C. briggsae</named-content> sequences for the alternatively spliced region of <italic>let-2</italic>. Blue tracks indicate the splicing for the embryonic (top) and adult (bottom) isoforms. The purple track indicates homology between the <named-content content-type="genus-species" xlink:type="simple">C. briggsae</named-content> and <named-content content-type="genus-species" xlink:type="simple">C. elegans</named-content> genomes as determined by WABA. Dark purple tracks indicate regions of strong homology (&gt;70%). The sequence of the first conserved element of intron 10 is shown. The box indicates the part deleted and replaced with the sequence GAA in the del1.2 splicing reporter construct. The lower left part of the figure shows the results of <sup>32</sup>P RT-PCR reactions with primers specific for the splicing reporter. Products for exon 9- or exon 10-containing messages are indicated. In embryos, only usage of exon 9 is detected for either reporter. At the L4 stage, 34% of the wild-type reporter messages contain exon 10 while del1.2 mutant messages contain only a trace amount of this exon.</p></caption><graphic mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pcbi.0020086.g002" xlink:type="simple"/></fig></sec><sec id="s2c"><title>Analysis of a Database of Conserved Intronic Elements Flanking Alternatively Spliced Exons</title><p>As demonstrated in the previous section, evolutionarily conserved elements in introns flanking alternatively spliced exons can be important for alternative splicing. We used a computational approach to identify sequences that are more likely to occur in these conserved elements than in total intron sequences. As described above, we have identified 142 alternatively spliced genes in which the introns flanking an alternatively spliced cassette exon contain high homology regions with <named-content content-type="genus-species" xlink:type="simple">C. briggsae</named-content> as defined by WABA. We extracted the highly conserved <named-content content-type="genus-species" xlink:type="simple">C. elegans</named-content> sequences from these introns and put them into a database. The first or last seven nucleotides of introns were excluded from this dataset as these contain conserved signals for the constitutive splicing machinery [<xref ref-type="bibr" rid="pcbi-0020086-b038">38</xref>]. This dataset contained 537 conserved elements of average length, 38.5 bases (minimum length, seven bases, longest, 231 bases, and median length, 28 bases) for a total of 20,675 bases. See <xref ref-type="supplementary-material" rid="pcbi-0020086-st001">Table S1</xref> for a list of these elements and the alternatively spliced genes from which they were derived. We also generated a control dataset of all introns annotated in Wormbase genome sequence release WS 120.</p><p>Because many alternative splicing factors have binding preferences for relatively short sequence motifs [<xref ref-type="bibr" rid="pcbi-0020086-b011">11</xref>,<xref ref-type="bibr" rid="pcbi-0020086-b013">13</xref>,<xref ref-type="bibr" rid="pcbi-0020086-b018">18</xref>,<xref ref-type="bibr" rid="pcbi-0020086-b028">28</xref>–<xref ref-type="bibr" rid="pcbi-0020086-b032">32</xref>], we decided to search the conserved intronic element dataset for short sequence motifs that appear more frequently here than in total introns. In order to identify sequences that are more prevalent in the conserved intronic regions bordering alternative exons, we counted the number of occurrences of every possible hexamer or pentamer motif in both our conserved intron element and total intron datasets. For each motif in the conserved element dataset, we determined the observed frequency, which was the count of each motif divided by the total number of possible motifs of that length in that dataset. We also determined an expected frequency based on the number of counts of each motif in the total intron dataset divided by the total number of possible motifs in that dataset. We then calculated an observed over expected (obs/exp) ratio for each motif, which was the observed frequency of each motif in the conserved element dataset divided by the expected frequency of each motif based on the total intron dataset. <xref ref-type="table" rid="pcbi-0020086-t001">Table 1</xref> shows the 40 top scoring pentamer and hexamer motifs in the conserved element dataset as determined by the obs/exp ratio value.</p><table-wrap content-type="1col" id="pcbi-0020086-t001" position="float"><object-id pub-id-type="doi">10.1371/journal.pcbi.0020086.t001</object-id><label>Table 1</label><caption><p>Pentamer and Hexamer Sequence Motifs That Occur More Frequently in Conserved Intronic Elements Flanking Alternatively Spliced Exons than in the Total Intron Dataset</p></caption><graphic mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pcbi.0020086.t001" xlink:type="simple"/><!-- <table frame="hsides" rules="none"><colgroup><col id="tb1col1" align="left" charoff="0" char=""/><col id="tb1col2" align="left" charoff="0" char=""/><col id="tb1col3" align="left" charoff="0" char=""/><col id="tb1col4" align="left" charoff="0" char=""/><col id="tb1col5" align="char" charoff="0" char="."/><col id="tb1col6" align="left" charoff="0" char=""/></colgroup><thead><tr><td align="left" colspan="2"><hr/>Pentamers</td><td rowspan="2"><hr/>Obs/Exp</td><td colspan="2"><hr/>Hexamers</td><td rowspan="2"><hr/>Obs/Exp</td></tr><tr><td><hr/>Word</td><td><hr/>Count</td><td><hr/>Word</td><td><hr/>Count</td></tr></thead><tbody><tr><td valign="bottom">GCATG</td><td valign="bottom">50</td><td valign="bottom">6.65</td><td valign="bottom">CCGTGC</td><td valign="bottom">9</td><td valign="bottom">9.29</td></tr><tr><td valign="bottom">GTGTG</td><td valign="bottom">58</td><td valign="bottom">4.63</td><td valign="bottom">GCATGC</td><td valign="bottom">13</td><td valign="bottom">8.88</td></tr><tr><td valign="bottom">CTATC</td><td valign="bottom">37</td><td valign="bottom">4.23</td><td valign="bottom">TGCATG</td><td valign="bottom">22</td><td valign="bottom">8.87</td></tr><tr><td valign="bottom">TGTGT</td><td valign="bottom">79</td><td valign="bottom">4.08</td><td valign="bottom">CGCATG</td><td valign="bottom">11</td><td valign="bottom">8.84</td></tr><tr><td valign="bottom">CTCTC</td><td valign="bottom">52</td><td valign="bottom">3.77</td><td valign="bottom">GCATGA</td><td valign="bottom">17</td><td valign="bottom">8.27</td></tr><tr><td valign="bottom">GCCCG</td><td valign="bottom">12</td><td valign="bottom">3.66</td><td valign="bottom">CGTTCC</td><td valign="bottom">10</td><td valign="bottom">7.45</td></tr><tr><td valign="bottom">CATGC</td><td valign="bottom">25</td><td valign="bottom">3.57</td><td valign="bottom">CTATCC</td><td valign="bottom">10</td><td valign="bottom">7.06</td></tr><tr><td valign="bottom">CTTCT</td><td valign="bottom">79</td><td valign="bottom">3.56</td><td valign="bottom">TCTATC</td><td valign="bottom">23</td><td valign="bottom">6.96</td></tr><tr><td valign="bottom">GTCGT</td><td valign="bottom">24</td><td valign="bottom">3.55</td><td valign="bottom">CGTGTG</td><td valign="bottom">11</td><td valign="bottom">6.93</td></tr><tr><td valign="bottom">CGTCC</td><td valign="bottom">13</td><td valign="bottom">3.50</td><td valign="bottom">CTAACC</td><td valign="bottom">12</td><td valign="bottom">6.90</td></tr><tr><td valign="bottom">CGTCG</td><td valign="bottom">17</td><td valign="bottom">3.46</td><td valign="bottom">GTGTTG</td><td valign="bottom">20</td><td valign="bottom">6.63</td></tr><tr><td valign="bottom">GTGTC</td><td valign="bottom">33</td><td valign="bottom">3.40</td><td valign="bottom">GTGTGC</td><td valign="bottom">17</td><td valign="bottom">6.58</td></tr><tr><td valign="bottom">CTCGC</td><td valign="bottom">17</td><td valign="bottom">3.40</td><td valign="bottom">TGCACG</td><td valign="bottom">8</td><td valign="bottom">6.54</td></tr><tr><td valign="bottom">TGTCC</td><td valign="bottom">26</td><td valign="bottom">3.35</td><td valign="bottom">GTCCGT</td><td valign="bottom">7</td><td valign="bottom">6.49</td></tr><tr><td valign="bottom">CATGT</td><td valign="bottom">43</td><td valign="bottom">3.32</td><td valign="bottom">CATGTC</td><td valign="bottom">12</td><td valign="bottom">6.28</td></tr><tr><td valign="bottom">TCCGT</td><td valign="bottom">28</td><td valign="bottom">3.30</td><td valign="bottom">CGGAGG</td><td valign="bottom">5</td><td valign="bottom">6.17</td></tr><tr><td valign="bottom">GTGCT</td><td valign="bottom">27</td><td valign="bottom">3.29</td><td valign="bottom">GCTTCT</td><td valign="bottom">24</td><td valign="bottom">6.17</td></tr><tr><td valign="bottom">TCCTC</td><td valign="bottom">36</td><td valign="bottom">3.27</td><td valign="bottom">CGCTTC</td><td valign="bottom">10</td><td valign="bottom">6.15</td></tr><tr><td valign="bottom">GCTTC</td><td valign="bottom">36</td><td valign="bottom">3.26</td><td valign="bottom">TGTGTC</td><td valign="bottom">19</td><td valign="bottom">6.13</td></tr><tr><td valign="bottom">TCTCT</td><td valign="bottom">72</td><td valign="bottom">3.25</td><td valign="bottom">CCGTCC</td><td valign="bottom">5</td><td valign="bottom">5.79</td></tr><tr><td valign="bottom">CGCTT</td><td valign="bottom">25</td><td valign="bottom">3.23</td><td valign="bottom">GTGTGT</td><td valign="bottom">27</td><td valign="bottom">5.77</td></tr><tr><td valign="bottom">CTAAC</td><td valign="bottom">32</td><td valign="bottom">3.22</td><td valign="bottom">GTCGTG</td><td valign="bottom">8</td><td valign="bottom">5.74</td></tr><tr><td valign="bottom">CATCC</td><td valign="bottom">21</td><td valign="bottom">3.19</td><td valign="bottom">GCAAGG</td><td valign="bottom">6</td><td valign="bottom">5.69</td></tr><tr><td valign="bottom">CGTGC</td><td valign="bottom">14</td><td valign="bottom">3.19</td><td valign="bottom">GCCCGG</td><td valign="bottom">3</td><td valign="bottom">5.69</td></tr><tr><td valign="bottom">GTTGT</td><td valign="bottom">52</td><td valign="bottom">3.12</td><td valign="bottom">TCCTCC</td><td valign="bottom">15</td><td valign="bottom">5.63</td></tr><tr><td valign="bottom">TGTGC</td><td valign="bottom">36</td><td valign="bottom">3.12</td><td valign="bottom">CCTTGT</td><td valign="bottom">12</td><td valign="bottom">5.61</td></tr><tr><td valign="bottom">TGTCT</td><td valign="bottom">43</td><td valign="bottom">3.11</td><td valign="bottom">GTTGTG</td><td valign="bottom">18</td><td valign="bottom">5.59</td></tr><tr><td valign="bottom">CCGTG</td><td valign="bottom">15</td><td valign="bottom">3.03</td><td valign="bottom">ACCGTG</td><td valign="bottom">6</td><td valign="bottom">5.55</td></tr><tr><td valign="bottom">CGGAC</td><td valign="bottom">10</td><td valign="bottom">3.01</td><td valign="bottom">GCCCGC</td><td valign="bottom">4</td><td valign="bottom">5.54</td></tr><tr><td valign="bottom">TCATG</td><td valign="bottom">37</td><td valign="bottom">2.90</td><td valign="bottom">GATGGT</td><td valign="bottom">9</td><td valign="bottom">5.39</td></tr><tr><td valign="bottom">TGCAC</td><td valign="bottom">29</td><td valign="bottom">2.90</td><td valign="bottom">CGAGTG</td><td valign="bottom">6</td><td valign="bottom">5.37</td></tr><tr><td valign="bottom">CTCCT</td><td valign="bottom">27</td><td valign="bottom">2.89</td><td valign="bottom">CCCGTC</td><td valign="bottom">5</td><td valign="bottom">5.32</td></tr><tr><td valign="bottom">GTCCA</td><td valign="bottom">19</td><td valign="bottom">2.87</td><td valign="bottom">CCAGGC</td><td valign="bottom">5</td><td valign="bottom">5.30</td></tr><tr><td valign="bottom">GTCCG</td><td valign="bottom">11</td><td valign="bottom">2.84</td><td valign="bottom">CCTCGC</td><td valign="bottom">4</td><td valign="bottom">5.27</td></tr><tr><td valign="bottom">CCTCC</td><td valign="bottom">20</td><td valign="bottom">2.79</td><td valign="bottom">GTCGCC</td><td valign="bottom">5</td><td valign="bottom">5.26</td></tr><tr><td valign="bottom">TGTTG</td><td valign="bottom">55</td><td valign="bottom">2.79</td><td valign="bottom">GACGTG</td><td valign="bottom">6</td><td valign="bottom">5.25</td></tr><tr><td valign="bottom">GTCGC</td><td valign="bottom">12</td><td valign="bottom">2.79</td><td valign="bottom">GTGCCC</td><td valign="bottom">5</td><td valign="bottom">5.25</td></tr><tr><td valign="bottom">TTGTG</td><td valign="bottom">63</td><td valign="bottom">2.77</td><td valign="bottom">TGTTGT</td><td valign="bottom">31</td><td valign="bottom">5.23</td></tr><tr><td valign="bottom">TTGTC</td><td valign="bottom">55</td><td valign="bottom">2.76</td><td valign="bottom">CTATCT</td><td valign="bottom">13</td><td valign="bottom">5.21</td></tr><tr><td valign="bottom">TGCTT</td><td valign="bottom">43</td><td valign="bottom">2.74</td><td valign="bottom">TCTCTC</td><td valign="bottom">34</td><td valign="bottom">5.20</td></tr></tbody></table> --><!-- <table-wrap-foot><fn id="nt101"><p>The Count column indicates the number of occurrences of each motif in the conserved intron element dataset. Obs/Exp is the ratio of the observed frequency score of these motifs in the conserved element dataset divided by the expected occurrence of each motif based on the total intron dataset. The top 40 highest scoring motifs as determined by the obs/exp value for pentamers and hexamers are listed.</p></fn></table-wrap-foot> --></table-wrap><p>Several previously identified mammalian splicing regulatory sequences are present in our lists of high-scoring hexamers and pentamers. This is encouraging because many of the known mammalian splicing factors have <named-content content-type="genus-species" xlink:type="simple">C. elegans</named-content> homologs. For example, the sequence TGCATG and its subset pentamer GCATG have been shown to be important intronic regulators of splicing for the mammalian fibronectin and calcitionin/CGRP genes [<xref ref-type="bibr" rid="pcbi-0020086-b014">14</xref>,<xref ref-type="bibr" rid="pcbi-0020086-b015">15</xref>,<xref ref-type="bibr" rid="pcbi-0020086-b039">39</xref>]. The mammalian FOX-1 protein selected the GCAUG sequence in a SELEX experiment, and it has been shown that the FOX-1 protein alters alternative splicing of several GCAUG-containing genes in transient transfection assays [<xref ref-type="bibr" rid="pcbi-0020086-b013">13</xref>]. FOX-2, a homolog of FOX-1, has also been shown to regulate splicing of transcripts containing UGCAUG in neuronal cell culture [<xref ref-type="bibr" rid="pcbi-0020086-b012">12</xref>]. FOX-1 was originally identified in <named-content content-type="genus-species" xlink:type="simple">C. elegans</named-content> as a splicing factor of the transcript for the sex determination gene, <italic>xol-1</italic> [<xref ref-type="bibr" rid="pcbi-0020086-b040">40</xref>]. Another well studied mammalian motif is that of intronic GU dinucleotide repeats, which have been shown to regulate splicing of the human <italic>CFTR</italic> gene [<xref ref-type="bibr" rid="pcbi-0020086-b041">41</xref>] and serve as a binding site for the ETR-3 splicing regulatory factor [<xref ref-type="bibr" rid="pcbi-0020086-b042">42</xref>]. CU dinucleotide repeats serve as a binding site for the PTB family members in the intronic regions that regulate inclusion of the N1 exon of <italic>c-src</italic> [<xref ref-type="bibr" rid="pcbi-0020086-b043">43</xref>]. While targets for <named-content content-type="genus-species" xlink:type="simple">C. elegans</named-content> alternative splicing factors might be inferred from their homology to mammalian proteins, very little experimental evidence exists for nematode splicing-factor binding sites. The <named-content content-type="genus-species" xlink:type="simple">C. elegans</named-content> muscle-specific splicing factor SUP-12 regulates <italic>unc-60</italic> alternative splicing. This protein interacts with a GU-rich region, similar to the GU-rich motifs identified in <xref ref-type="table" rid="pcbi-0020086-t001">Table 1</xref>, of an <italic>unc-60</italic> intron [<xref ref-type="bibr" rid="pcbi-0020086-b044">44</xref>]. (For a review of other mammalian splicing factors with <named-content content-type="genus-species" xlink:type="simple">C. elegans</named-content> homologs see [<xref ref-type="bibr" rid="pcbi-0020086-b033">33</xref>].) While many of the high-scoring conserved motifs that we identified match known mammalian splicing regulatory sequences, we have also identified new motifs that may also be involved in pre-mRNA splicing regulation in mammals as well as nematodes.</p><p>One important aspect of <named-content content-type="genus-species" xlink:type="simple">C. elegans</named-content> introns is that they are shorter than introns in vertebrates. Half of <named-content content-type="genus-species" xlink:type="simple">C. elegans</named-content> introns are below 60 nucleotides in length, too short to be spliced in vertebrates [<xref ref-type="bibr" rid="pcbi-0020086-b038">38</xref>]. However, many <named-content content-type="genus-species" xlink:type="simple">C. elegans</named-content> introns are long and resemble vertebrate introns. In our alternatively spliced intron dataset, the median intron size is 263 bases (shortest is 43, longest is 10,719, and average is 561), indicating that these regulated introns generally belong in the larger intron class. We asked whether a similar analysis of the pentamers and hexamers found in the full introns flanking alternatively spliced exons would yield similar high-scoring motifs as our analysis of the conserved sequence subset of these introns. We did a pentamer and hexamer motif count of the full introns flanking the 147 alternatively spliced exons from which we previously extracted evolutionarily conserved elements. We counted the occurrence of every pentamer and hexamer in these full-length alternative introns. We ranked these motifs by the obs/exp ratio when we compared the occurrence of these motifs to their prevalence in our total intron dataset. The top 40 pentamer and hexamer motifs ranked by their obs/exp ratios are shown in <xref ref-type="table" rid="pcbi-0020086-t002">Table 2</xref>. Many of the top scoring pentamers and hexamers that are overrepresented in conserved elements in introns flanking alternatively spliced exons are also overrepresented in total introns flanking alternatively spliced exons (compare <xref ref-type="table" rid="pcbi-0020086-t001">Table 1</xref> with <xref ref-type="table" rid="pcbi-0020086-t002">Table 2</xref>). However, the obs/exp scores for the motifs in the alternative splicing introns is 2- to 3-fold lower than in the conserved element dataset extracted from these introns. For example, TGCATG has an observed to expected ratio of 3.35 in the whole introns that flank alternative exons but 8.87 for the conserved elements within those introns. TCTATC has a ratio of 2.55 in the total alternatively spliced intron analysis and 6.96 in the conserved element dataset analysis. The same holds true for high-scoring pentamers. CTATC goes from 1.85 for the observed to expected ratio in the introns flanking alternative exon dataset up to 4.23 in the conserved element dataset. From this analysis, the sequences of the introns flanking alternatively spliced exons can yield some data about potential pentamers and hexamers involved in alternative splicing regulation. However, limiting this analysis to WABA-conserved regions between <named-content content-type="genus-species" xlink:type="simple">C. elegans</named-content> and <named-content content-type="genus-species" xlink:type="simple">C. briggsae</named-content> can substantially improve the signal to help us identify splicing regulatory elements.</p><table-wrap content-type="1col" id="pcbi-0020086-t002" position="float"><object-id pub-id-type="doi">10.1371/journal.pcbi.0020086.t002</object-id><label>Table 2</label><caption><p>Pentamer and Hexamer Sequence Motifs That Occur More Frequently in the Introns Flanking Alternatively Spliced Exons than in Total Introns</p></caption><graphic mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pcbi.0020086.t002" xlink:type="simple"/><!-- <table frame="hsides" rules="none"><colgroup><col id="tb2col1" align="left" charoff="0" char=""/><col id="tb2col2" align="char" charoff="0" char="."/><col id="tb2col3" align="left" charoff="0" char=""/><col id="tb2col4" align="left" charoff="0" char=""/><col id="tb2col5" align="char" charoff="0" char="."/><col id="tb2col6" align="left" charoff="0" char=""/></colgroup><thead><tr><td align="left" colspan="2"><hr/>Pentamers</td><td rowspan="2"><hr/>Obs/Exp</td><td colspan="2"><hr/>Hexamers</td><td rowspan="2"><hr/>Obs/Exp</td></tr><tr><td><hr/>Word</td><td><hr/>Count</td><td><hr/>Word</td><td><hr/>Count</td></tr></thead><tbody><tr><td valign="bottom">GCATG</td><td valign="bottom">160</td><td valign="bottom">2.43</td><td valign="bottom">TGCATG</td><td valign="bottom">75</td><td valign="bottom">3.35</td></tr><tr><td valign="bottom">CTCTC</td><td valign="bottom">273</td><td valign="bottom">2.26</td><td valign="bottom">CTCTCT</td><td valign="bottom">173</td><td valign="bottom">3.35</td></tr><tr><td valign="bottom">TCTCT</td><td valign="bottom">391</td><td valign="bottom">2.01</td><td valign="bottom">TCTCTC</td><td valign="bottom">186</td><td valign="bottom">3.15</td></tr><tr><td valign="bottom">CTATC</td><td valign="bottom">142</td><td valign="bottom">1.85</td><td valign="bottom">CCAGGG</td><td valign="bottom">20</td><td valign="bottom">3.06</td></tr><tr><td valign="bottom">CGCTT</td><td valign="bottom">125</td><td valign="bottom">1.84</td><td valign="bottom">CTAACC</td><td valign="bottom">46</td><td valign="bottom">2.93</td></tr><tr><td valign="bottom">TGTGT</td><td valign="bottom">306</td><td valign="bottom">1.80</td><td valign="bottom">CCCTGG</td><td valign="bottom">21</td><td valign="bottom">2.92</td></tr><tr><td valign="bottom">CTAAC</td><td valign="bottom">156</td><td valign="bottom">1.79</td><td valign="bottom">CGCATG</td><td valign="bottom">31</td><td valign="bottom">2.76</td></tr><tr><td valign="bottom">GTGTG</td><td valign="bottom">194</td><td valign="bottom">1.76</td><td valign="bottom">GGGTCG</td><td valign="bottom">16</td><td valign="bottom">2.74</td></tr><tr><td valign="bottom">GGGGG</td><td valign="bottom">93</td><td valign="bottom">1.71</td><td valign="bottom">CTACCC</td><td valign="bottom">28</td><td valign="bottom">2.67</td></tr><tr><td valign="bottom">TAACC</td><td valign="bottom">150</td><td valign="bottom">1.69</td><td valign="bottom">ACCGTG</td><td valign="bottom">25</td><td valign="bottom">2.56</td></tr><tr><td valign="bottom">ACCTC</td><td valign="bottom">110</td><td valign="bottom">1.66</td><td valign="bottom">GCATGT</td><td valign="bottom">58</td><td valign="bottom">2.55</td></tr><tr><td valign="bottom">GTCGT</td><td valign="bottom">98</td><td valign="bottom">1.65</td><td valign="bottom">TCTATC</td><td valign="bottom">76</td><td valign="bottom">2.55</td></tr><tr><td valign="bottom">CCCAC</td><td valign="bottom">108</td><td valign="bottom">1.64</td><td valign="bottom">GCATGA</td><td valign="bottom">47</td><td valign="bottom">2.53</td></tr><tr><td valign="bottom">CCTCT</td><td valign="bottom">131</td><td valign="bottom">1.62</td><td valign="bottom">GCATGC</td><td valign="bottom">33</td><td valign="bottom">2.50</td></tr><tr><td valign="bottom">GTTGT</td><td valign="bottom">237</td><td valign="bottom">1.62</td><td valign="bottom">TGTCCC</td><td valign="bottom">38</td><td valign="bottom">2.41</td></tr><tr><td valign="bottom">GTCCC</td><td valign="bottom">68</td><td valign="bottom">1.62</td><td valign="bottom">ACGGGC</td><td valign="bottom">18</td><td valign="bottom">2.41</td></tr><tr><td valign="bottom">TGTCC</td><td valign="bottom">110</td><td valign="bottom">1.62</td><td valign="bottom">CGCAGT</td><td valign="bottom">25</td><td valign="bottom">2.37</td></tr><tr><td valign="bottom">CTCCC</td><td valign="bottom">97</td><td valign="bottom">1.61</td><td valign="bottom">CTATCC</td><td valign="bottom">30</td><td valign="bottom">2.35</td></tr><tr><td valign="bottom">CCTCC</td><td valign="bottom">101</td><td valign="bottom">1.61</td><td valign="bottom">CCTCCC</td><td valign="bottom">33</td><td valign="bottom">2.34</td></tr><tr><td valign="bottom">CGCAC</td><td valign="bottom">69</td><td valign="bottom">1.60</td><td valign="bottom">CTATCT</td><td valign="bottom">51</td><td valign="bottom">2.27</td></tr><tr><td valign="bottom">CTTCT</td><td valign="bottom">310</td><td valign="bottom">1.59</td><td valign="bottom">GGGGGG</td><td valign="bottom">47</td><td valign="bottom">2.24</td></tr><tr><td valign="bottom">TGCAT</td><td valign="bottom">205</td><td valign="bottom">1.59</td><td valign="bottom">AGCCCG</td><td valign="bottom">17</td><td valign="bottom">2.22</td></tr><tr><td valign="bottom">CATGT</td><td valign="bottom">179</td><td valign="bottom">1.58</td><td valign="bottom">ACCTCT</td><td valign="bottom">46</td><td valign="bottom">2.19</td></tr><tr><td valign="bottom">CCGCA</td><td valign="bottom">86</td><td valign="bottom">1.56</td><td valign="bottom">CCAACC</td><td valign="bottom">32</td><td valign="bottom">2.16</td></tr><tr><td valign="bottom">CATGC</td><td valign="bottom">95</td><td valign="bottom">1.55</td><td valign="bottom">CTGCAC</td><td valign="bottom">27</td><td valign="bottom">2.16</td></tr><tr><td valign="bottom">CAACC</td><td valign="bottom">109</td><td valign="bottom">1.54</td><td valign="bottom">TGTGTG</td><td valign="bottom">105</td><td valign="bottom">2.16</td></tr><tr><td valign="bottom">CTCCT</td><td valign="bottom">126</td><td valign="bottom">1.54</td><td valign="bottom">CCGCAG</td><td valign="bottom">19</td><td valign="bottom">2.15</td></tr><tr><td valign="bottom">TCCTC</td><td valign="bottom">148</td><td valign="bottom">1.53</td><td valign="bottom">GTTCGC</td><td valign="bottom">22</td><td valign="bottom">2.15</td></tr><tr><td valign="bottom">ATCCT</td><td valign="bottom">137</td><td valign="bottom">1.52</td><td valign="bottom">CGAACC</td><td valign="bottom">24</td><td valign="bottom">2.14</td></tr><tr><td valign="bottom">TCCCT</td><td valign="bottom">117</td><td valign="bottom">1.50</td><td valign="bottom">GCAGTC</td><td valign="bottom">20</td><td valign="bottom">2.14</td></tr><tr><td valign="bottom">CGAAC</td><td valign="bottom">95</td><td valign="bottom">1.50</td><td valign="bottom">GTCCCA</td><td valign="bottom">33</td><td valign="bottom">2.13</td></tr><tr><td valign="bottom">TCCCC</td><td valign="bottom">108</td><td valign="bottom">1.50</td><td valign="bottom">ACTAAC</td><td valign="bottom">57</td><td valign="bottom">2.12</td></tr><tr><td valign="bottom">CGTCC</td><td valign="bottom">49</td><td valign="bottom">1.50</td><td valign="bottom">TCCTCC</td><td valign="bottom">51</td><td valign="bottom">2.12</td></tr><tr><td valign="bottom">TGTCT</td><td valign="bottom">182</td><td valign="bottom">1.50</td><td valign="bottom">CGCTTC</td><td valign="bottom">31</td><td valign="bottom">2.11</td></tr><tr><td valign="bottom">GCCCG</td><td valign="bottom">43</td><td valign="bottom">1.50</td><td valign="bottom">CTGCGC</td><td valign="bottom">18</td><td valign="bottom">2.09</td></tr><tr><td valign="bottom">CCGTG</td><td valign="bottom">65</td><td valign="bottom">1.49</td><td valign="bottom">TGCACG</td><td valign="bottom">23</td><td valign="bottom">2.08</td></tr><tr><td valign="bottom">GGCTT</td><td valign="bottom">152</td><td valign="bottom">1.49</td><td valign="bottom">AGCATG</td><td valign="bottom">36</td><td valign="bottom">2.08</td></tr><tr><td valign="bottom">CATCC</td><td valign="bottom">86</td><td valign="bottom">1.49</td><td valign="bottom">CCGCAC</td><td valign="bottom">23</td><td valign="bottom">2.07</td></tr><tr><td valign="bottom">CTACC</td><td valign="bottom">101</td><td valign="bottom">1.49</td><td valign="bottom">GCACGG</td><td valign="bottom">18</td><td valign="bottom">2.07</td></tr><tr><td valign="bottom">CCCTG</td><td valign="bottom">61</td><td valign="bottom">1.48</td><td valign="bottom">CCGTCT</td><td valign="bottom">26</td><td valign="bottom">2.06</td></tr></tbody></table> --><!-- <table-wrap-foot><fn id="nt201"><p>We determined the number of occurrences of every pentamer and hexamer motif in the complete introns flanking 147 alternatively spliced exons that contain the evolutionarily conserved elements used for <xref ref-type="table" rid="pcbi-0020086-t001">Table 1</xref>. The Count column indicates the number of occurrences of each motif in the dataset of introns flanking the 147 alternative exons. Obs/Exp is the ratio of the observed frequency of occurrence of these motifs in the introns flanking alternative exons dataset divided by the expected frequency score of each motif based on the control total intron dataset. The top 40 highest scoring motifs as determined by the obs/exp value for pentamers and hexamers are listed.</p></fn></table-wrap-foot> --></table-wrap><p>We also used the database of introns flanking alternatively spliced exons to identify potential differences in the appearance of pentamer and hexamer motifs in the introns upstream or downstream of alternative exons. We grouped the introns upstream of the alternative exons and the introns downstream of the alternative exons separately into datasets and did motif counts and determined the obs/exp ratio for each when compared to the total intron dataset. These results are shown in <xref ref-type="table" rid="pcbi-0020086-t003">Tables 3</xref> and <xref ref-type="table" rid="pcbi-0020086-t004">4</xref>, with the top scoring pentamers and hexamers in the introns upstream and downstream of alternative exons ranked by their obs/exp ratios. Some of the high- scoring motifs show very little preference for the upstream or downstream intron. For example, high-scoring hexamer TGCATG has an obs/exp ratio of 3.90 in the downstream intron and 3.06 in the upstream intron. Others show a strong preference. CTCTCT and TCTCTC, likely binding sites for PTB, have obs/exp ratios of 5.15 and 4.84, respectively, in upstream introns, but 1.36 and 1.30 in downstream introns. TCTATC, which will be analyzed below, also has a preference for upstream introns, with an obs/exp ratio of 3.25 in upstream introns and 1.79 in downstream introns. Conversely, CCAACC has a strong preference for downstream introns, with an obs/exp ratio of 3.17 in the downstream intron and 1.29 in the upstream intron. In addition to identifying potential binding sites for splicing regulatory factors, these differences in appearance in introns upstream or downstream of alternatively spliced exons may hold some keys to function.</p><table-wrap content-type="2col" id="pcbi-0020086-t003" position="float"><object-id pub-id-type="doi">10.1371/journal.pcbi.0020086.t003</object-id><label>Table 3</label><caption><p>Comparison of the Occurrence of Pentamer Motifs in Introns Upstream versus Downstream of Alternative Cassette Exons</p></caption><graphic mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pcbi.0020086.t003" xlink:type="simple"/><!-- <table frame="hsides" rules="none"><colgroup><col id="tb3col1" align="left" charoff="0" char=""/><col id="tb3col2" align="left" charoff="0" char=""/><col id="tb3col3" align="char" charoff="0" char="."/><col id="tb3col4" align="char" charoff="0" char="."/><col id="tb3col5" align="char" charoff="0" char="."/><col id="tb3col6" align="char" charoff="0" char="."/><col id="tb3col7" align="left" charoff="0" char=""/><col id="tb3col8" align="left" charoff="0" char=""/><col id="tb3col9" align="left" charoff="0" char=""/><col id="tb3col10" align="char" charoff="0" char="."/><col id="tb3col11" align="char" charoff="0" char="."/><col id="tb3col12" align="char" charoff="0" char="."/><col id="tb3col13" align="char" charoff="0" char="."/><col id="tb3col14" align="char" charoff="0" char="."/></colgroup><thead><tr><td align="left" colspan="14"><hr/>Pentamers</td></tr><tr><td colspan="7"><hr/>Upstream Intron Ranks</td><td colspan="7"><hr/>Downstream Intron Ranks</td></tr><tr><td><hr/>US Rank</td><td><hr/>Motif</td><td><hr/>US Obs/ Exp</td><td><hr/>DS Rank</td><td><hr/>DS Obs/ Exp</td><td><hr/>NC Rank</td><td><hr/>NC Obs/ Exp</td><td><hr/>DS Rank</td><td><hr/>Motif</td><td><hr/>DS Obs/ Exp</td><td><hr/>US Rank</td><td><hr/>US Obs/ Exp</td><td><hr/>NC Rank</td><td><hr/>NC Obs/ Exp</td></tr></thead><tbody><tr><td valign="bottom">1</td><td valign="bottom">CTCTC</td><td valign="bottom">3.18</td><td valign="bottom">162</td><td valign="bottom">1.25</td><td valign="bottom">130</td><td valign="bottom">1.31</td><td valign="bottom">1</td><td valign="bottom">GCATG</td><td valign="bottom">2.88</td><td valign="bottom">4</td><td valign="bottom">2.11</td><td valign="bottom">19</td><td valign="bottom">1.6</td></tr><tr><td valign="bottom">2</td><td valign="bottom">TCTCT</td><td valign="bottom">2.74</td><td valign="bottom">202</td><td valign="bottom">1.22</td><td valign="bottom">72</td><td valign="bottom">1.39</td><td valign="bottom">2</td><td valign="bottom">TGTGT</td><td valign="bottom">1.96</td><td valign="bottom">20</td><td valign="bottom">1.69</td><td valign="bottom">46</td><td valign="bottom">1.44</td></tr><tr><td valign="bottom">3</td><td valign="bottom">CTATC</td><td valign="bottom">2.28</td><td valign="bottom">81</td><td valign="bottom">1.39</td><td valign="bottom">166</td><td valign="bottom">1.27</td><td valign="bottom">3</td><td valign="bottom">TAACC</td><td valign="bottom">1.92</td><td valign="bottom">62</td><td valign="bottom">1.5</td><td valign="bottom">266</td><td valign="bottom">1.14</td></tr><tr><td valign="bottom">4</td><td valign="bottom">GCATG</td><td valign="bottom">2.11</td><td valign="bottom">1</td><td valign="bottom">2.88</td><td valign="bottom">115</td><td valign="bottom">1.33</td><td valign="bottom">4</td><td valign="bottom">GTGTG</td><td valign="bottom">1.9</td><td valign="bottom">23</td><td valign="bottom">1.66</td><td valign="bottom">114</td><td valign="bottom">1.29</td></tr><tr><td valign="bottom">5</td><td valign="bottom">CGTCC</td><td valign="bottom">1.92</td><td valign="bottom">457</td><td valign="bottom">1.05</td><td valign="bottom">8</td><td valign="bottom">1.82</td><td valign="bottom">5</td><td valign="bottom">ACCTC</td><td valign="bottom">1.9</td><td valign="bottom">82</td><td valign="bottom">1.46</td><td valign="bottom">15</td><td valign="bottom">1.64</td></tr><tr><td valign="bottom">6</td><td valign="bottom">CTCCC</td><td valign="bottom">1.87</td><td valign="bottom">116</td><td valign="bottom">1.31</td><td valign="bottom">296</td><td valign="bottom">1.15</td><td valign="bottom">6</td><td valign="bottom">CGCAC</td><td valign="bottom">1.88</td><td valign="bottom">147</td><td valign="bottom">1.37</td><td valign="bottom">511</td><td valign="bottom">1.01</td></tr><tr><td valign="bottom">7</td><td valign="bottom">GCACG</td><td valign="bottom">1.86</td><td valign="bottom">464</td><td valign="bottom">1.04</td><td valign="bottom">28</td><td valign="bottom">1.54</td><td valign="bottom">7</td><td valign="bottom">CGCTT</td><td valign="bottom">1.85</td><td valign="bottom">9</td><td valign="bottom">1.85</td><td valign="bottom">156</td><td valign="bottom">1.22</td></tr><tr><td valign="bottom">8</td><td valign="bottom">GGGGG</td><td valign="bottom">1.86</td><td valign="bottom">37</td><td valign="bottom">1.53</td><td valign="bottom">383</td><td valign="bottom">1.09</td><td valign="bottom">8</td><td valign="bottom">GTCCC</td><td valign="bottom">1.83</td><td valign="bottom">86</td><td valign="bottom">1.45</td><td valign="bottom">26</td><td valign="bottom">1.54</td></tr><tr><td valign="bottom">9</td><td valign="bottom">CGCTT</td><td valign="bottom">1.85</td><td valign="bottom">7</td><td valign="bottom">1.85</td><td valign="bottom">118</td><td valign="bottom">1.33</td><td valign="bottom">9</td><td valign="bottom">CCGTG</td><td valign="bottom">1.81</td><td valign="bottom">261</td><td valign="bottom">1.22</td><td valign="bottom">170</td><td valign="bottom">1.21</td></tr><tr><td valign="bottom">10</td><td valign="bottom">CTAAC</td><td valign="bottom">1.83</td><td valign="bottom">14</td><td valign="bottom">1.74</td><td valign="bottom">88</td><td valign="bottom">1.36</td><td valign="bottom">10</td><td valign="bottom">TGTCC</td><td valign="bottom">1.79</td><td valign="bottom">71</td><td valign="bottom">1.48</td><td valign="bottom">14</td><td valign="bottom">1.64</td></tr><tr><td valign="bottom">11</td><td valign="bottom">GTCGT</td><td valign="bottom">1.79</td><td valign="bottom">50</td><td valign="bottom">1.47</td><td valign="bottom">29</td><td valign="bottom">1.54</td><td valign="bottom">11</td><td valign="bottom">CATGC</td><td valign="bottom">1.77</td><td valign="bottom">121</td><td valign="bottom">1.39</td><td valign="bottom">9</td><td valign="bottom">1.69</td></tr><tr><td valign="bottom">12</td><td valign="bottom">CACTC</td><td valign="bottom">1.79</td><td valign="bottom">455</td><td valign="bottom">1.05</td><td valign="bottom">429</td><td valign="bottom">1.07</td><td valign="bottom">12</td><td valign="bottom">TGCAT</td><td valign="bottom">1.75</td><td valign="bottom">66</td><td valign="bottom">1.49</td><td valign="bottom">128</td><td valign="bottom">1.27</td></tr><tr><td valign="bottom">13</td><td valign="bottom">GCCCG</td><td valign="bottom">1.79</td><td valign="bottom">242</td><td valign="bottom">1.19</td><td valign="bottom">37</td><td valign="bottom">1.5</td><td valign="bottom">13</td><td valign="bottom">CCTCT</td><td valign="bottom">1.74</td><td valign="bottom">68</td><td valign="bottom">1.48</td><td valign="bottom">190</td><td valign="bottom">1.2</td></tr><tr><td valign="bottom">14</td><td valign="bottom">CCTCC</td><td valign="bottom">1.79</td><td valign="bottom">68</td><td valign="bottom">1.42</td><td valign="bottom">34</td><td valign="bottom">1.51</td><td valign="bottom">14</td><td valign="bottom">CTAAC</td><td valign="bottom">1.74</td><td valign="bottom">10</td><td valign="bottom">1.83</td><td valign="bottom">140</td><td valign="bottom">1.25</td></tr><tr><td valign="bottom">15</td><td valign="bottom">TCCGC</td><td valign="bottom">1.77</td><td valign="bottom">430</td><td valign="bottom">1.06</td><td valign="bottom">30</td><td valign="bottom">1.54</td><td valign="bottom">15</td><td valign="bottom">CAACC</td><td valign="bottom">1.71</td><td valign="bottom">144</td><td valign="bottom">1.37</td><td valign="bottom">543</td><td valign="bottom">1</td></tr><tr><td valign="bottom">16</td><td valign="bottom">CCGCT</td><td valign="bottom">1.76</td><td valign="bottom">263</td><td valign="bottom">1.17</td><td valign="bottom">181</td><td valign="bottom">1.25</td><td valign="bottom">16</td><td valign="bottom">GCACC</td><td valign="bottom">1.69</td><td valign="bottom">622</td><td valign="bottom">0.99</td><td valign="bottom">330</td><td valign="bottom">1.1</td></tr><tr><td valign="bottom">17</td><td valign="bottom">GGCTT</td><td valign="bottom">1.73</td><td valign="bottom">179</td><td valign="bottom">1.23</td><td valign="bottom">10</td><td valign="bottom">1.79</td><td valign="bottom">17</td><td valign="bottom">CATGT</td><td valign="bottom">1.69</td><td valign="bottom">65</td><td valign="bottom">1.49</td><td valign="bottom">298</td><td valign="bottom">1.11</td></tr><tr><td valign="bottom">18</td><td valign="bottom">CTTCT</td><td valign="bottom">1.72</td><td valign="bottom">41</td><td valign="bottom">1.49</td><td valign="bottom">102</td><td valign="bottom">1.35</td><td valign="bottom">18</td><td valign="bottom">GTTGT</td><td valign="bottom">1.65</td><td valign="bottom">26</td><td valign="bottom">1.64</td><td valign="bottom">226</td><td valign="bottom">1.17</td></tr><tr><td valign="bottom">19</td><td valign="bottom">CCCCG</td><td valign="bottom">1.7</td><td valign="bottom">174</td><td valign="bottom">1.24</td><td valign="bottom">178</td><td valign="bottom">1.25</td><td valign="bottom">19</td><td valign="bottom">CTACC</td><td valign="bottom">1.63</td><td valign="bottom">118</td><td valign="bottom">1.4</td><td valign="bottom">27</td><td valign="bottom">1.53</td></tr><tr><td valign="bottom">20</td><td valign="bottom">TGTGT</td><td valign="bottom">1.69</td><td valign="bottom">2</td><td valign="bottom">1.96</td><td valign="bottom">158</td><td valign="bottom">1.28</td><td valign="bottom">20</td><td valign="bottom">CCGCA</td><td valign="bottom">1.62</td><td valign="bottom">57</td><td valign="bottom">1.52</td><td valign="bottom">181</td><td valign="bottom">1.2</td></tr><tr><td valign="bottom">21</td><td valign="bottom">GCTTC</td><td valign="bottom">1.69</td><td valign="bottom">158</td><td valign="bottom">1.26</td><td valign="bottom">73</td><td valign="bottom">1.39</td><td valign="bottom">21</td><td valign="bottom">CGAAC</td><td valign="bottom">1.62</td><td valign="bottom">99</td><td valign="bottom">1.42</td><td valign="bottom">482</td><td valign="bottom">1.03</td></tr><tr><td valign="bottom">22</td><td valign="bottom">CCCAC</td><td valign="bottom">1.67</td><td valign="bottom">22</td><td valign="bottom">1.62</td><td valign="bottom">361</td><td valign="bottom">1.11</td><td valign="bottom">22</td><td valign="bottom">CCCAC</td><td valign="bottom">1.62</td><td valign="bottom">22</td><td valign="bottom">1.67</td><td valign="bottom">641</td><td valign="bottom">0.96</td></tr><tr><td valign="bottom">23</td><td valign="bottom">GTGTG</td><td valign="bottom">1.66</td><td valign="bottom">4</td><td valign="bottom">1.9</td><td valign="bottom">157</td><td valign="bottom">1.28</td><td valign="bottom">23</td><td valign="bottom">CTCCT</td><td valign="bottom">1.61</td><td valign="bottom">101</td><td valign="bottom">1.42</td><td valign="bottom">20</td><td valign="bottom">1.6</td></tr><tr><td valign="bottom">24</td><td valign="bottom">CGTCT</td><td valign="bottom">1.65</td><td valign="bottom">252</td><td valign="bottom">1.18</td><td valign="bottom">267</td><td valign="bottom">1.17</td><td valign="bottom">24</td><td valign="bottom">CCCCA</td><td valign="bottom">1.59</td><td valign="bottom">591</td><td valign="bottom">1.01</td><td valign="bottom">86</td><td valign="bottom">1.34</td></tr><tr><td valign="bottom">25</td><td valign="bottom">GGTGC</td><td valign="bottom">1.64</td><td valign="bottom">138</td><td valign="bottom">1.28</td><td valign="bottom">106</td><td valign="bottom">1.34</td><td valign="bottom">25</td><td valign="bottom">AACCT</td><td valign="bottom">1.58</td><td valign="bottom">617</td><td valign="bottom">0.99</td><td valign="bottom">834</td><td valign="bottom">0.86</td></tr><tr><td valign="bottom">26</td><td valign="bottom">GTTGT</td><td valign="bottom">1.64</td><td valign="bottom">18</td><td valign="bottom">1.65</td><td valign="bottom">112</td><td valign="bottom">1.33</td><td valign="bottom">26</td><td valign="bottom">CGGGG</td><td valign="bottom">1.57</td><td valign="bottom">935</td><td valign="bottom">0.79</td><td valign="bottom">89</td><td valign="bottom">1.34</td></tr><tr><td valign="bottom">27</td><td valign="bottom">AGAGT</td><td valign="bottom">1.63</td><td valign="bottom">365</td><td valign="bottom">1.09</td><td valign="bottom">303</td><td valign="bottom">1.14</td><td valign="bottom">27</td><td valign="bottom">CAGGG</td><td valign="bottom">1.57</td><td valign="bottom">111</td><td valign="bottom">1.4</td><td valign="bottom">987</td><td valign="bottom">0.71</td></tr><tr><td valign="bottom">28</td><td valign="bottom">TGCTG</td><td valign="bottom">1.63</td><td valign="bottom">350</td><td valign="bottom">1.11</td><td valign="bottom">200</td><td valign="bottom">1.22</td><td valign="bottom">28</td><td valign="bottom">CACCG</td><td valign="bottom">1.57</td><td valign="bottom">882</td><td valign="bottom">0.83</td><td valign="bottom">307</td><td valign="bottom">1.11</td></tr><tr><td valign="bottom">29</td><td valign="bottom">CCCTG</td><td valign="bottom">1.62</td><td valign="bottom">98</td><td valign="bottom">1.35</td><td valign="bottom">264</td><td valign="bottom">1.17</td><td valign="bottom">29</td><td valign="bottom">GAGCC</td><td valign="bottom">1.57</td><td valign="bottom">409</td><td valign="bottom">1.11</td><td valign="bottom">877</td><td valign="bottom">0.83</td></tr><tr><td valign="bottom">30</td><td valign="bottom">CGCAT</td><td valign="bottom">1.61</td><td valign="bottom">382</td><td valign="bottom">1.08</td><td valign="bottom">648</td><td valign="bottom">0.99</td><td valign="bottom">30</td><td valign="bottom">TACCC</td><td valign="bottom">1.57</td><td valign="bottom">329</td><td valign="bottom">1.17</td><td valign="bottom">148</td><td valign="bottom">1.24</td></tr></tbody></table> --><!-- <table-wrap-foot><fn id="nt301"><p>Left side of table is analysis of upstream pentamer motifs. US Rank is the relative rank for the top 30 motifs based on Obs/Exp ratio (US Obs/Exp) for motifs in upstream introns that contain WABA-conserved elements (conserved introns). The relative rank of these motifs in the downstream conserved intron (DS Rank) and their obs/exp ratios for the downstream conserved intron dataset (DS Obs/Exp) are also indicated. NC Rank is based on Obs/Exp ratio for motifs found in upstream alternative introns lacking WABA-conserved elements (non-conserved introns). NC Obs/Exp indicates the ratios for each motif in the non-conserved intron analysis. Right side of table is analysis of downstream pentamers. DS Rank is the ranking of the motifs in conserved downstream introns based on the Obs/Exp ratio for motifs in downstream introns (DS Obs/Exp). The relative ranking of these motifs in the upstream introns (US Rank) and their Obs/Exp ratios in upstream introns (US Obs/Exp) are also indicated. NC Rank is based on Obs/Exp ratio from downstream non-conserved introns. NC Obs/Exp indicates the ratios for each motif in the non-conserved intron analysis. See <xref ref-type="supplementary-material" rid="pcbi-0020086-st002">Table S2</xref> for a more complete analysis of motifs in non-conserved introns.</p></fn></table-wrap-foot> --></table-wrap><table-wrap content-type="2col" id="pcbi-0020086-t004" position="float"><object-id pub-id-type="doi">10.1371/journal.pcbi.0020086.t004</object-id><label>Table 4</label><caption><p>Comparison of the Occurrence of Hexamer Motifs in Introns Upstream versus Downstream of Alternative Cassette Exons</p></caption><graphic mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pcbi.0020086.t004" xlink:type="simple"/><!-- <table frame="hsides" rules="none"><colgroup><col id="tb4col1" align="left" charoff="0" char=""/><col id="tb4col2" align="left" charoff="0" char=""/><col id="tb4col3" align="char" charoff="0" char="."/><col id="tb4col4" align="char" charoff="0" char="."/><col id="tb4col5" align="char" charoff="0" char="."/><col id="tb4col6" align="char" charoff="0" char="."/><col id="tb4col7" align="left" charoff="0" char=""/><col id="tb4col8" align="left" charoff="0" char=""/><col id="tb4col9" align="left" charoff="0" char=""/><col id="tb4col10" align="char" charoff="0" char="."/><col id="tb4col11" align="char" charoff="0" char="."/><col id="tb4col12" align="char" charoff="0" char="."/><col id="tb4col13" align="char" charoff="0" char="."/><col id="tb4col14" align="char" charoff="0" char="."/></colgroup><thead><tr><td align="left" colspan="14"><hr/>Hexamers</td></tr><tr><td colspan="7"><hr/>Upstream Intron Ranks</td><td colspan="7"><hr/>Downstream Intron Ranks</td></tr><tr><td><hr/>US Rank</td><td><hr/>Motif</td><td><hr/>US Obs/ Exp</td><td><hr/>DS Rank</td><td><hr/>DS Obs/ Exp</td><td><hr/>NC Rank</td><td><hr/>NC Obs/ Exp</td><td><hr/>DS Rank</td><td><hr/>Motif</td><td><hr/>DS Obs/ Exp</td><td><hr/>US Rank</td><td><hr/>US Obs/ Exp</td><td><hr/>NC Rank</td><td><hr/>NC Obs/ Exp</td></tr></thead><tbody><tr><td valign="bottom">1</td><td valign="bottom">CTCTCT</td><td valign="bottom">5.15</td><td valign="bottom">780</td><td valign="bottom">1.36</td><td valign="bottom">579</td><td valign="bottom">1.43</td><td valign="bottom">1</td><td valign="bottom">TGCATG</td><td valign="bottom">3.9</td><td valign="bottom">8</td><td valign="bottom">3.06</td><td valign="bottom">178</td><td valign="bottom">1.75</td></tr><tr><td valign="bottom">2</td><td valign="bottom">TCTCTC</td><td valign="bottom">4.84</td><td valign="bottom">914</td><td valign="bottom">1.3</td><td valign="bottom">688</td><td valign="bottom">1.38</td><td valign="bottom">2</td><td valign="bottom">ACCGTG</td><td valign="bottom">3.71</td><td valign="bottom">507</td><td valign="bottom">1.56</td><td valign="bottom">122</td><td valign="bottom">1.85</td></tr><tr><td valign="bottom">3</td><td valign="bottom">ACGGGC</td><td valign="bottom">3.56</td><td valign="bottom">1,464</td><td valign="bottom">1.14</td><td valign="bottom">1,405</td><td valign="bottom">1.15</td><td valign="bottom">3</td><td valign="bottom">CTACCC</td><td valign="bottom">3.65</td><td valign="bottom">239</td><td valign="bottom">1.81</td><td valign="bottom">1,325</td><td valign="bottom">1.15</td></tr><tr><td valign="bottom">4</td><td valign="bottom">CCAGGG</td><td valign="bottom">3.49</td><td valign="bottom">23</td><td valign="bottom">2.61</td><td valign="bottom">1,523</td><td valign="bottom">1.13</td><td valign="bottom">4</td><td valign="bottom">GGGTCG</td><td valign="bottom">3.65</td><td valign="bottom">146</td><td valign="bottom">1.95</td><td valign="bottom">3,866</td><td valign="bottom">0.52</td></tr><tr><td valign="bottom">5</td><td valign="bottom">TCTATC</td><td valign="bottom">3.25</td><td valign="bottom">208</td><td valign="bottom">1.79</td><td valign="bottom">721</td><td valign="bottom">1.37</td><td valign="bottom">5</td><td valign="bottom">CGAACC</td><td valign="bottom">3.24</td><td valign="bottom">1,453</td><td valign="bottom">1.19</td><td valign="bottom">2,333</td><td valign="bottom">0.94</td></tr><tr><td valign="bottom">6</td><td valign="bottom">CTAACC</td><td valign="bottom">3.15</td><td valign="bottom">14</td><td valign="bottom">2.85</td><td valign="bottom">197</td><td valign="bottom">1.73</td><td valign="bottom">6</td><td valign="bottom">GCATGT</td><td valign="bottom">3.19</td><td valign="bottom">114</td><td valign="bottom">2.01</td><td valign="bottom">1,150</td><td valign="bottom">1.19</td></tr><tr><td valign="bottom">7</td><td valign="bottom">CCTCCC</td><td valign="bottom">3.1</td><td valign="bottom">512</td><td valign="bottom">1.51</td><td valign="bottom">351</td><td valign="bottom">1.58</td><td valign="bottom">7</td><td valign="bottom">CCAACC</td><td valign="bottom">3.17</td><td valign="bottom">1,119</td><td valign="bottom">1.29</td><td valign="bottom">386</td><td valign="bottom">1.53</td></tr><tr><td valign="bottom">8</td><td valign="bottom">TGCATG</td><td valign="bottom">3.06</td><td valign="bottom">1</td><td valign="bottom">3.9</td><td valign="bottom">97</td><td valign="bottom">1.93</td><td valign="bottom">8</td><td valign="bottom">GCATGA</td><td valign="bottom">3.1</td><td valign="bottom">76</td><td valign="bottom">2.15</td><td valign="bottom">208</td><td valign="bottom">1.71</td></tr><tr><td valign="bottom">9</td><td valign="bottom">GCAGTC</td><td valign="bottom">3.06</td><td valign="bottom">1,456</td><td valign="bottom">1.14</td><td valign="bottom">2,636</td><td valign="bottom">0.93</td><td valign="bottom">9</td><td valign="bottom">GGGGTC</td><td valign="bottom">3.04</td><td valign="bottom">2,091</td><td valign="bottom">1.04</td><td valign="bottom">4,079</td><td valign="bottom">0.17</td></tr><tr><td valign="bottom">10</td><td valign="bottom">CTATCT</td><td valign="bottom">2.96</td><td valign="bottom">508</td><td valign="bottom">1.52</td><td valign="bottom">846</td><td valign="bottom">1.32</td><td valign="bottom">10</td><td valign="bottom">ACCCGC</td><td valign="bottom">3.04</td><td valign="bottom">2,355</td><td valign="bottom">0.99</td><td valign="bottom">3,762</td><td valign="bottom">0.59</td></tr><tr><td valign="bottom">11</td><td valign="bottom">TGCACG</td><td valign="bottom">2.93</td><td valign="bottom">1,395</td><td valign="bottom">1.16</td><td valign="bottom">545</td><td valign="bottom">1.45</td><td valign="bottom">11</td><td valign="bottom">TGTCCC</td><td valign="bottom">2.97</td><td valign="bottom">167</td><td valign="bottom">1.93</td><td valign="bottom">44</td><td valign="bottom">2.1</td></tr><tr><td valign="bottom">12</td><td valign="bottom">CCCTGG</td><td valign="bottom">2.91</td><td valign="bottom">12</td><td valign="bottom">2.96</td><td valign="bottom">2,045</td><td valign="bottom">1.03</td><td valign="bottom">12</td><td valign="bottom">CCCTGG</td><td valign="bottom">2.96</td><td valign="bottom">12</td><td valign="bottom">2.91</td><td valign="bottom">1,773</td><td valign="bottom">1.05</td></tr><tr><td valign="bottom">13</td><td valign="bottom">GGGGGG</td><td valign="bottom">2.9</td><td valign="bottom">480</td><td valign="bottom">1.53</td><td valign="bottom">3,439</td><td valign="bottom">0.77</td><td valign="bottom">13</td><td valign="bottom">GCATGC</td><td valign="bottom">2.9</td><td valign="bottom">48</td><td valign="bottom">2.3</td><td valign="bottom">24</td><td valign="bottom">2.4</td></tr><tr><td valign="bottom">14</td><td valign="bottom">CTATCC</td><td valign="bottom">2.83</td><td valign="bottom">175</td><td valign="bottom">1.83</td><td valign="bottom">389</td><td valign="bottom">1.54</td><td valign="bottom">14</td><td valign="bottom">CTAACC</td><td valign="bottom">2.85</td><td valign="bottom">6</td><td valign="bottom">3.15</td><td valign="bottom">193</td><td valign="bottom">1.73</td></tr><tr><td valign="bottom">15</td><td valign="bottom">CTGCAC</td><td valign="bottom">2.74</td><td valign="bottom">460</td><td valign="bottom">1.54</td><td valign="bottom">928</td><td valign="bottom">1.29</td><td valign="bottom">15</td><td valign="bottom">CGCATG</td><td valign="bottom">2.85</td><td valign="bottom">18</td><td valign="bottom">2.71</td><td valign="bottom">726</td><td valign="bottom">1.34</td></tr><tr><td valign="bottom">16</td><td valign="bottom">CGCTTC</td><td valign="bottom">2.72</td><td valign="bottom">594</td><td valign="bottom">1.45</td><td valign="bottom">581</td><td valign="bottom">1.43</td><td valign="bottom">16</td><td valign="bottom">GCACCG</td><td valign="bottom">2.81</td><td valign="bottom">3,362</td><td valign="bottom">0.75</td><td valign="bottom">611</td><td valign="bottom">1.39</td></tr><tr><td valign="bottom">17</td><td valign="bottom">CATCGC</td><td valign="bottom">2.72</td><td valign="bottom">2,373</td><td valign="bottom">0.94</td><td valign="bottom">3,219</td><td valign="bottom">0.81</td><td valign="bottom">17</td><td valign="bottom">AGCATG</td><td valign="bottom">2.71</td><td valign="bottom">544</td><td valign="bottom">1.54</td><td valign="bottom">93</td><td valign="bottom">1.92</td></tr><tr><td valign="bottom">18</td><td valign="bottom">CGCATG</td><td valign="bottom">2.71</td><td valign="bottom">15</td><td valign="bottom">2.85</td><td valign="bottom">3,923</td><td valign="bottom">0.55</td><td valign="bottom">18</td><td valign="bottom">CATGCT</td><td valign="bottom">2.69</td><td valign="bottom">1,203</td><td valign="bottom">1.26</td><td valign="bottom">500</td><td valign="bottom">1.45</td></tr><tr><td valign="bottom">19</td><td valign="bottom">TGCTGC</td><td valign="bottom">2.65</td><td valign="bottom">3,311</td><td valign="bottom">0.71</td><td valign="bottom">867</td><td valign="bottom">1.31</td><td valign="bottom">19</td><td valign="bottom">CGTGAC</td><td valign="bottom">2.67</td><td valign="bottom">1,440</td><td valign="bottom">1.19</td><td valign="bottom">190</td><td valign="bottom">1.73</td></tr><tr><td valign="bottom">20</td><td valign="bottom">GTTCGC</td><td valign="bottom">2.6</td><td valign="bottom">297</td><td valign="bottom">1.67</td><td valign="bottom">557</td><td valign="bottom">1.45</td><td valign="bottom">20</td><td valign="bottom">GGCACC</td><td valign="bottom">2.64</td><td valign="bottom">3,479</td><td valign="bottom">0.72</td><td valign="bottom">1,327</td><td valign="bottom">1.15</td></tr><tr><td valign="bottom">21</td><td valign="bottom">CGGGCT</td><td valign="bottom">2.59</td><td valign="bottom">1,389</td><td valign="bottom">1.16</td><td valign="bottom">3,713</td><td valign="bottom">0.67</td><td valign="bottom">21</td><td valign="bottom">TGTGTG</td><td valign="bottom">2.63</td><td valign="bottom">283</td><td valign="bottom">1.76</td><td valign="bottom">486</td><td valign="bottom">1.46</td></tr><tr><td valign="bottom">22</td><td valign="bottom">GCACGA</td><td valign="bottom">2.55</td><td valign="bottom">2,913</td><td valign="bottom">0.82</td><td valign="bottom">2,536</td><td valign="bottom">0.94</td><td valign="bottom">22</td><td valign="bottom">CGCAGT</td><td valign="bottom">2.63</td><td valign="bottom">72</td><td valign="bottom">2.16</td><td valign="bottom">877</td><td valign="bottom">1.29</td></tr><tr><td valign="bottom">23</td><td valign="bottom">CCTGGT</td><td valign="bottom">2.52</td><td valign="bottom">655</td><td valign="bottom">1.41</td><td valign="bottom">2,660</td><td valign="bottom">0.92</td><td valign="bottom">23</td><td valign="bottom">CCAGGG</td><td valign="bottom">2.61</td><td valign="bottom">4</td><td valign="bottom">3.49</td><td valign="bottom">4,061</td><td valign="bottom">0.23</td></tr><tr><td valign="bottom">24</td><td valign="bottom">GTGTTG</td><td valign="bottom">2.52</td><td valign="bottom">421</td><td valign="bottom">1.57</td><td valign="bottom">1,513</td><td valign="bottom">1.13</td><td valign="bottom">24</td><td valign="bottom">GTGGCT</td><td valign="bottom">2.58</td><td valign="bottom">3,884</td><td valign="bottom">0.54</td><td valign="bottom">2,189</td><td valign="bottom">0.97</td></tr><tr><td valign="bottom">25</td><td valign="bottom">ACGTCC</td><td valign="bottom">2.51</td><td valign="bottom">3,689</td><td valign="bottom">0.56</td><td valign="bottom">31</td><td valign="bottom">2.28</td><td valign="bottom">25</td><td valign="bottom">CGCACC</td><td valign="bottom">2.56</td><td valign="bottom">2,220</td><td valign="bottom">1.02</td><td valign="bottom">293</td><td valign="bottom">1.61</td></tr><tr><td valign="bottom">26</td><td valign="bottom">CCCGGT</td><td valign="bottom">2.51</td><td valign="bottom">3,772</td><td valign="bottom">0.51</td><td valign="bottom">290</td><td valign="bottom">1.63</td><td valign="bottom">26</td><td valign="bottom">TAACCT</td><td valign="bottom">2.56</td><td valign="bottom">1,196</td><td valign="bottom">1.26</td><td valign="bottom">1703</td><td valign="bottom">1.06</td></tr><tr><td valign="bottom">27</td><td valign="bottom">CACTGC</td><td valign="bottom">2.5</td><td valign="bottom">284</td><td valign="bottom">1.68</td><td valign="bottom">1,155</td><td valign="bottom">1.22</td><td valign="bottom">27</td><td valign="bottom">CGCTTG</td><td valign="bottom">2.55</td><td valign="bottom">596</td><td valign="bottom">1.51</td><td valign="bottom">1,606</td><td valign="bottom">1.08</td></tr><tr><td valign="bottom">28</td><td valign="bottom">ACGCTT</td><td valign="bottom">2.49</td><td valign="bottom">486</td><td valign="bottom">1.52</td><td valign="bottom">304</td><td valign="bottom">1.62</td><td valign="bottom">28</td><td valign="bottom">ACCTCT</td><td valign="bottom">2.54</td><td valign="bottom">181</td><td valign="bottom">1.9</td><td valign="bottom">330</td><td valign="bottom">1.58</td></tr><tr><td valign="bottom">29</td><td valign="bottom">TATCCT</td><td valign="bottom">2.48</td><td valign="bottom">611</td><td valign="bottom">1.44</td><td valign="bottom">313</td><td valign="bottom">1.61</td><td valign="bottom">29</td><td valign="bottom">GGTCGA</td><td valign="bottom">2.51</td><td valign="bottom">861</td><td valign="bottom">1.38</td><td valign="bottom">262</td><td valign="bottom">1.64</td></tr><tr><td valign="bottom">30</td><td valign="bottom">TCCGCT</td><td valign="bottom">2.47</td><td valign="bottom">3,099</td><td valign="bottom">0.77</td><td valign="bottom">442</td><td valign="bottom">1.51</td><td valign="bottom">30</td><td valign="bottom">CCGCAC</td><td valign="bottom">2.49</td><td valign="bottom">324</td><td valign="bottom">1.71</td><td valign="bottom">693</td><td valign="bottom">1.36</td></tr></tbody></table> --><!-- <table-wrap-foot><fn id="nt401"><p>Analysis of hexamer motifs. The legend for <xref ref-type="table" rid="pcbi-0020086-t003">Table 3</xref> also applies, except that here hexamers are ranked. See <xref ref-type="supplementary-material" rid="pcbi-0020086-st002">Table S2</xref> for a more complete analysis of motifs in non-conserved introns.</p></fn></table-wrap-foot> --></table-wrap><p>To determine whether these pentamers and hexamers are found in introns flanking all alternative cassette exons or are specific for those introns with WABA-conserved elements, another dataset was constructed from the introns flanking the alternative cassette exons of 307 genes lacking WABA-defined evolutionarily conserved intronic elements. A motif search similar to that described in the previous paragraph was conducted by dividing the new, non-conserved intron dataset into two sets: introns upstream of alternative exons and those downstream. Motifs were counted for each of the sets and compared to the total intron dataset to generate an obs/exp ratio and corresponding ranking for each element. It can be seen from <xref ref-type="table" rid="pcbi-0020086-t004">Table 4</xref> that the obs/exp scores of all of the top 30 hexamer motifs identified in conserved introns drop in the analysis of non-conserved introns, suggesting the motifs are indeed specific to introns containing conserved regions. For example, our top ranking hexamer from the conserved intron analysis, TGCATG, has an obs/exp score of 3.9 in downstream introns and 3.06 upstream. This same motif only scores 1.75 in downstream and 1.93 in upstream in non-conserved alternative introns (<xref ref-type="table" rid="pcbi-0020086-t004">Table 4</xref>). For CTCTCT and TCTCTC, our two top hexamer upstream motifs in introns with WABA-conserved elements, the obs/exp ratio drops over 3-fold in this analysis, and they rank as 579 and 688, respectively, in the upstream non-conserved intron set (<xref ref-type="table" rid="pcbi-0020086-t004">Table 4</xref>). Conversely, top scoring motifs from the non-conserved intron database are not highly represented in the conserved intron dataset. For example, GGCCAC, with an obs/exp ratio of 4.36 (<xref ref-type="supplementary-material" rid="pcbi-0020086-st002">Table S2</xref>) was the top scoring motif in the upstream non-conserved dataset. Strikingly, this same motif has an obs/exp score of 0.11 in total introns that contain WABA-conserved elements upstream of an alternatively spliced exon (unpublished data). This dramatically different representation of top scoring pentamers and hexamers in introns containing WABA-conserved elements versus those that do not suggests that the presence or absence of intronic WABA-defined conservation may define two distinct classes of alternatively spliced exons with distinct splicing regulatory mechanisms.</p><p>To ensure that the motifs identified in the conserved element dataset were truly overrepresented in this region and not a consequence of WABA creating bias towards GC-rich regions in the AT-rich nematode genomes, we analyzed the base composition of our datasets. The GC content of our WABA-defined conserved element dataset was 39%, the total intron dataset that contained these conserved elements was 34%, and the total intron reference dataset was 32%. While this slight variation in GC content might suggest that the WABA HMM may have created a bias, two arguments can be made against this. The first is that the high-scoring motifs in the WABA-conserved region were also highly represented in the total introns containing these motifs (<xref ref-type="table" rid="pcbi-0020086-t002">Table 2</xref>), consistent with these results not being derived from bias in GC content. The second is that GC enrichment bias is not observed in many of our highest scoring motifs. For example, TCTATC has a GC content of 33%, yet is highly enriched in conserved elements.</p></sec><sec id="s2d"><title>The Candidate Motifs (T)GCATG and (T)CTATC Are Required for <italic>unc-52</italic> Alternative Splicing Regulation</title><p>The <italic>C. elegans unc-52</italic> gene is a homolog of the mammalian extracellular matrix protein perlecan and contains 37 exons. Exons 16, 17, and 18 are alternatively spliced in a complex and regulated manner. These three exons each encode an Ig protein motif and can be included or skipped in any number of combinations in the final <italic>unc-52</italic> mRNA transcript [<xref ref-type="bibr" rid="pcbi-0020086-b045">45</xref>]. RT-PCR analysis shows <italic>unc-52</italic> is also alternatively spliced in <italic>C. briggsae,</italic> suggesting the splicing pattern may be controlled by similar methods (unpublished data). The use of a subset of these alternatively spliced forms is controlled by the splicing regulatory protein, MEC-8 [<xref ref-type="bibr" rid="pcbi-0020086-b046">46</xref>,<xref ref-type="bibr" rid="pcbi-0020086-b047">47</xref>]. The genetic regulation of <italic>unc-52</italic> alternative splicing makes this gene an attractive model for studying splicing regulation. Most importantly for this analysis, the introns flanking either side of alternative exon 16 contain regions of high nucleotide conservation as identified by WABA. A number of the top scoring pentamers and hexamers from our conserved element motif analysis are found in these conserved regions (<xref ref-type="fig" rid="pcbi-0020086-g003">Figure 3</xref>A).</p><fig id="pcbi-0020086-g003" position="float"><object-id pub-id-type="doi">10.1371/journal.pcbi.0020086.g003</object-id><label>Figure 3</label><caption><title>Conserved Intronic Elements of <italic>unc-52</italic> Contain Putative Regulators of Alternative Splicing</title><p>(A) <named-content content-type="genus-species" xlink:type="simple">C. elegans</named-content> and <named-content content-type="genus-species" xlink:type="simple">C. briggsae</named-content> sequence alignment is shown for the alternatively spliced portion of <italic>unc-52</italic>. Not all spliced isoforms are predicted by Wormbase software (blue); see <xref ref-type="fig" rid="pcbi-0020086-g004">Figure 4</xref>A for observed alternative splicing patterns<italic>.</italic> PhastCons sequence alignment is shown with WABA-designated conservation in bold. Upper line of sequence is <italic>C. elegans; C. briggsae</italic> is below. High-scoring conserved motifs identified in our pentamer/hexamer analysis of conserved intronic elements flanking alternatively spliced exons, GCATG, TCTATC, CTATCC, CTATC, and TGCAC are underlined.</p><p>(B) Diagram of alternative splicing reporter constructs for testing putative <italic>cis</italic>-regulatory splicing motifs. Part of exon 15 through part of exon 19 of <italic>unc-52</italic> was cloned into a GFP/lacZ fusion vector with an <italic>unc-54</italic> promoter and nuclear localization sequence suitable for expression in <italic>C. elegans.</italic> Site-directed mutagenesis of the wild-type substrate was performed in order to test putative <italic>cis</italic>-splicing regulatory elements<italic>.</italic> A table of the splicing reporter constructs and their alterations is shown. Asterisks denote highly conserved intronic nucleotides deleted by site-directed mutagenesis. To maintain the intron length, yet remove motifs in question, a reporter was also made in which native sequence was replaced with the reverse complement sequence (shown in bold) and a HindIII site (italics) for diagnostic purposes.</p></caption><graphic mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pcbi.0020086.g003" xlink:type="simple"/></fig><fig id="pcbi-0020086-g004" position="float"><object-id pub-id-type="doi">10.1371/journal.pcbi.0020086.g004</object-id><label>Figure 4</label><caption><title>Deletion or Mutation of Top Scoring Pentamers or Hexamers Alters <italic>unc-52</italic> Alternative Splicing</title><p>(A) Autoradiogram of <italic>unc-52</italic> reporter gene alternative splicing. Left side shows <sup>32</sup>P RT-PCR analysis (with BamHI digest) performed on strains carrying each of the reporter constructs described in <xref ref-type="fig" rid="pcbi-0020086-g003">Figure 3</xref>B. The reporter is indicated at top of gel. Table on right shows the relative percentage of each alternatively spliced isoform produced from the indicated in vivo splicing reporter constructs. Arrows point to the corresponding band on the gel. Asterisk denotes a non-specific band resulting from RT-PCR.</p><p>(B) Graphical summary of <italic>unc-52</italic> in vivo splicing reporter assays. Horizontal axis indicates spliced mRNA isoform. Vertical axis represents the relative percentage of each isoform. Color key on figure indicates which bars correspond to which strain. Standard deviation and mean values were calculated based on a minimum of three independent RNA extractions and subsequent RT-PCRs for each reporter.</p></caption><graphic mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pcbi.0020086.g004" xlink:type="simple"/></fig><p>To test the role of these motifs in alternative splicing of <italic>unc-52,</italic> we created a muscle-expressed alternative splicing reporter transgene derived from this region (<xref ref-type="fig" rid="pcbi-0020086-g003">Figure 3</xref>B). Expression studies using the native <italic>unc-52</italic> promoter to drive GFP expression have indicated that this extracellular matrix protein is expressed in the muscle and hypodermis [<xref ref-type="bibr" rid="pcbi-0020086-b047">47</xref>,<xref ref-type="bibr" rid="pcbi-0020086-b048">48</xref>]. However, studies of the <italic>unc-52</italic> splicing regulator <italic>mec-8</italic> have suggested that <italic>mec-8</italic> function on <italic>unc-52</italic> alternative splicing is mostly focused in hypodermal tissues [<xref ref-type="bibr" rid="pcbi-0020086-b047">47</xref>]. Our intention is to mimic the native gene's splicing as closely as possible, so we tested whether the alternative splicing of our muscle-specific <italic>unc-52</italic> reporter could be regulated by <italic>mec-8</italic>. RT-PCR analysis of our wild-type <italic>unc-52</italic> alternative splicing reporter in <italic>mec-8(+)</italic> (wild-type) and <italic>mec-8(e398)</italic> (mutant) backgrounds indicates a dramatic difference in splicing (<xref ref-type="supplementary-material" rid="pcbi-0020086-st003">Table S3</xref>). When the reporter is spliced in a <italic>mec-8(e398)</italic> mutant that lacks its RNA-binding domain, an increase in exon 18-containing transcripts is observed, as well as a 75% drop in abundance of 15-16-19 and 15–19 isoforms. This closely mimics the effects of <italic>mec-8(e398)</italic> on native <italic>unc-52</italic> splicing [<xref ref-type="bibr" rid="pcbi-0020086-b046">46</xref>]. These results demonstrate that the tissue-specific expression of our <italic>unc-52</italic> reporter is an adequate representation of the alternative splicing of the native gene, and that it is also under the control of the splicing factor MEC-8.</p><p>In order to test the role of evolutionarily conserved intronic elements and motifs in the regulation of <italic>unc-52</italic> alternative splicing, we created <italic>unc-52</italic> alternative splicing reporter constructs with different combinations of deletions in these sequences and monitored their in vivo splicing by RT-PCR. Due to the similar size of exons 17 and 18, a restriction digest with BamHI was performed on the RT-PCR products. Spliced isoforms containing exon 18 would be cleaved by BamHI and thus run at smaller sizes on the gel (<xref ref-type="fig" rid="pcbi-0020086-g003">Figures 3</xref>B and <xref ref-type="fig" rid="pcbi-0020086-g004">4</xref>A). A summary of these results is shown in <xref ref-type="fig" rid="pcbi-0020086-g004">Figure 4</xref>. All quantitation is based on the analysis of a minimum of three different RNA isolations from the indicated strains. In general, splicing reporters with deletions of the conserved intronic sequences flanking either side of exon 16 seemed to have the largest effect on three specific isoforms of mature <italic>unc-52</italic> mRNA, those containing exons 15-16-19, 15-16-18–19, and 15-18-19 (<xref ref-type="fig" rid="pcbi-0020086-g004">Figure 4</xref>B).</p><p>Our pentamer and hexamer motif analysis of conserved intronic elements flanking alternatively spliced exons identified GCATG and TGCATG as high-scoring motifs likely to be found in introns flanking either side of an alternative exon. Deletion of the GCATG upstream of alternative exon 16 from the <italic>unc-52</italic> splicing reporter resulted in nearly a doubling of the proportion of reporter transcripts containing exon 16 and a drop in the proportion using 15-18-19. This suggests that GCATG may play a role in repressing the inclusion of exon 16 (<xref ref-type="fig" rid="pcbi-0020086-g004">Figure 4</xref>B).</p><p>A conserved intronic element just downstream of exon 16 contains another of our top scoring motifs, (T)CTATC. A deletion of this TCTATC had the opposite effect of deleting the upstream intronic GCATG; the proportion of exon 16-containing transcripts decreased while the amount of 15-18-19 increased. A larger deletion of this downstream motif (Deletion B) or a replacement of the motif with the reverse complement sequence (Mutation B) amplified this effect as summarized in <xref ref-type="fig" rid="pcbi-0020086-g004">Figure 4</xref>B. Specifically, an approximately 75% reduction in exon 16- containing transcripts relative to wild-type can be seen when this conserved region is altered in the Mutation B construct. A similar drop of almost 85% is seen when this conserved element is deleted in the Deletion B reporter construct. This indicates that TCTATC is part of a regulatory element that enhances the inclusion of exon 16, and its loss by mutation leads to a decrease in exon 16 inclusion.</p><p>Perhaps most interesting was the effect produced by the double deletion of two conserved motifs flanking exon 16: the upstream GCATG and the downstream TCTATC. Individual deletions of these two motifs suggested they work in opposition to include or exclude exon 16. However, the double mutant causes a shift in splice pattern similar to, but much more dramatic, than that seen in the ΔGCATG construct (<xref ref-type="fig" rid="pcbi-0020086-g004">Figure 4</xref>B). The double mutant had such a dramatic increase in 15-16-19 levels that it became the new predominant isoform, making up 61% of the mRNAs. This result suggests that the conserved motifs on either side of exon 16 are responsible for the inclusion of this exon and that they work in collaboration and as part of a larger regulatory network to produce a multilayered regulation of <italic>unc-52</italic> splicing. In general, changes to the evolutionarily conserved intronic elements flanking exon 16 did not alter the relative amounts of the 15-17-19, 15-17-18–19, and 15–19 isoforms dramatically. These elements flanking exon 16, for the most part, appear to regulate the decision to form either the 15-16-19 isoform or the 15-18-19 isoform (<xref ref-type="fig" rid="pcbi-0020086-g004">Figure 4</xref>B).</p></sec></sec><sec id="s3"><title>Discussion</title><p>Our comparative genomic analysis of <named-content content-type="genus-species" xlink:type="simple">C. elegans</named-content> and <named-content content-type="genus-species" xlink:type="simple">C. briggsae</named-content> allowed us to identify 142 alternatively spliced genes that exhibit regions of high nucleotide conservation in introns flanking alternatively spliced exons. These conserved regions were then analyzed for pentamer and hexamer motifs present at a statistically higher level than found in total introns. Many of the high scorers on these lists matched known mammalian splicing regulatory elements. This indicates that this approach can find alternative splicing regulatory sequences, and it is consistent with our observations that there are <named-content content-type="genus-species" xlink:type="simple">C. elegans</named-content> homologs for the major mammalian splicing regulatory factors (unpublished data). In addition to finding known splicing regulatory sequences, this approach identified potentially novel splicing regulatory sequences. We have confirmed that the sequence (T)CTATC is important for alternative splicing regulation of the <italic>unc-52</italic> gene.</p><p>The limited sequence conservation between <named-content content-type="genus-species" xlink:type="simple">C. elegans</named-content> and <named-content content-type="genus-species" xlink:type="simple">C. briggsae</named-content> in introns flanking alternatively spliced exons contrasts with that seen in mammalian interspecies genome alignments. In mouse/human alignments of alternatively spliced human cassette exons, it was found that the 100 nucleotides of intron sequence flanking either side of alternative cassette exons tend to be highly conserved [<xref ref-type="bibr" rid="pcbi-0020086-b021">21</xref>,<xref ref-type="bibr" rid="pcbi-0020086-b022">22</xref>]. It is unclear from these mouse/human analyses which specific portion(s) of the introns immediately flanking these alternatively spliced exons are essential for alternative splicing regulation. Our analysis indicates that the WABA-identified regions of intronic homology flanking alternatively spliced exons are likely to be important for alternative splicing regulation. Therefore, the <italic>C. elegans/C. briggsae</italic> evolutionary distance, along with the sensitivity of WABA, provides for a more simplified method for pinpointing splicing regulatory sequences. One of the interesting questions resulting from our identification of intronic alternative splicing regulatory motifs in <named-content content-type="genus-species" xlink:type="simple">C. elegans</named-content> is whether these will also function to regulate alternative splicing in mammals. It has been suggested that there is a difference in frequency of usage of constitutive intronic splicing enhancers between mammals and fish, which can explain why fish introns are not always spliced efficiently in mammalian cells [<xref ref-type="bibr" rid="pcbi-0020086-b049">49</xref>]. No similar study for alternative splicing regulatory elements has yet been done. Our data on <named-content content-type="genus-species" xlink:type="simple">C. elegans</named-content> alternative splicing regulatory elements suggest that there are many similarities in alternative splicing regulation across metazoans. This is seen in the fact that many of the motifs we identified in worms are known to regulate alternative splicing in mammals. Whether novel elements we have identified, such as TCTATC, can also function in mammals has yet to be determined.</p><p>The identification of (T)GCATG as a top scoring alternative splicing regulatory motif demonstrated the usefulness of this approach, as many examples of this motif as a splicing regulatory element are present in the literature [<xref ref-type="bibr" rid="pcbi-0020086-b014">14</xref>,<xref ref-type="bibr" rid="pcbi-0020086-b015">15</xref>,<xref ref-type="bibr" rid="pcbi-0020086-b050">50</xref>]. (T)GCATG is statistically overrepresented in introns downstream of alternative exons conserved between human and mouse genomes [<xref ref-type="bibr" rid="pcbi-0020086-b021">21</xref>,<xref ref-type="bibr" rid="pcbi-0020086-b022">22</xref>] and may have a spatially conserved role in directing splice-site choice [<xref ref-type="bibr" rid="pcbi-0020086-b023">23</xref>]. On the other hand, in vitro studies have demonstrated that the splicing factor FOX-1 affects splicing of transcripts with GCATG either upstream or downstream of an alternative exon [<xref ref-type="bibr" rid="pcbi-0020086-b013">13</xref>]. One interesting finding of our <named-content content-type="genus-species" xlink:type="simple">C. elegans</named-content> work is that GCATG in introns flanking alternatively spliced exons shows no preference for being upstream or downstream of alternative exons. This may be evidence that while the motifs that regulate alternative splicing between mammals and nematodes may be the same, they may be used in different ways to promote splicing.</p><p>A recent analysis of the <named-content content-type="genus-species" xlink:type="simple">C. elegans</named-content> genome used a support vector machine to identify predictive features of <named-content content-type="genus-species" xlink:type="simple">C. elegans</named-content> alternative exons [<xref ref-type="bibr" rid="pcbi-0020086-b051">51</xref>]. One of the predictive features of an alternatively spliced exon that they identified is the presence of several different hexamers in the introns surrounding alternative exons. In their supplemental materials (<ext-link ext-link-type="uri" xlink:href="http://www2.fml.tuebingen.mpg.de/raetsch/projects/RASE" xlink:type="simple">http://www2.fml.tuebingen.mpg.de/raetsch/projects/RASE</ext-link>) they list the top 12 predictive hexamers in the introns upstream and downstream of the alternative exon. Comparison of their high-scoring results with our conserved element analysis indicates that many of the top scorers in both approaches are identical (for example, TGCATG, CTAACC, GTGTGT, CTCTCT, and TCTATC). That both their support vector machine and our comparative genomics methods yielded similar results helps to confirm the validity of both methods.</p><p>Comparing the motif searches from different classes of intronic sequence (total introns, WABA-conserved elements, entire conserved introns flanking alternative exons, and non-conserved introns flanking alternative exons) brought about a number of insights concerning the presence of certain motifs in introns. First, it can be noted that many of these sequences are still found, although at lower frequency, in total introns as well as those that are alternatively spliced. They may therefore, in a method analogous to SR protein-binding sites in exons, play a role in constitutive as well as alternative splicing (SR proteins reviewed in [<xref ref-type="bibr" rid="pcbi-0020086-b052">52</xref>]). Second, the comparison of motif analyses of introns lacking conserved elements and those containing WABA conservation reveals two dramatically different lists of overrepresented motifs. This suggests that there may in fact, be two separate classes of cassette exon splicing regulation, and WABA can help us distinguish between them.</p><p>Our splicing reporter system allowed us to directly test the role of the conserved elements GCATG and TCTATC flanking alternative exon 16 of the <italic>unc-52</italic> gene in vivo. Deletion of either of these elements individually led to measurable but opposing effects on the inclusion of this exon (<xref ref-type="fig" rid="pcbi-0020086-g004">Figure 4</xref>). These first results suggested the two <italic>cis</italic> elements might be counter-balancing each other to regulate splicing in this region. However, the creation of a double deletion of these two elements demonstrated that this was a naive assumption. The splicing program exhibited by the double deletion construct was similar to that seen from the ΔGCATG construct: an upregulation of the exon 16-containing transcripts. However, the proportional increase of these isoforms was far more dramatic in the double than the single deletion. The 15-16-19 isoform became the predominant spliced transcript, as opposed to 15–19 seen for all other splicing reporter constructs. This striking result is a good reminder that although these motifs can work independently and their deletion may produce measurable effects on splicing, they may work in a combinatorial way in vivo, and the effects of multiple deletions of important elements may be hard to predict. This type of combinatorial multifactor splicing regulatory mechanism has been described for several vertebrate genes including <italic>c-src</italic> [<xref ref-type="bibr" rid="pcbi-0020086-b011">11</xref>] and cardiac troponin T [<xref ref-type="bibr" rid="pcbi-0020086-b017">17</xref>]. While our comparative genomics approach gives us a method of identifying putative <italic>cis</italic>-regulatory elements of alternative splicing and our in vivo reporter assay provides a method for directly testing candidates, we still need more experimental information before we can predict the combinatorial effects of these elements on splicing.</p><p>Our comparative genomics analysis has not only provided a method for identifying intronic <italic>cis-</italic>regulatory elements, but also a starting point to investigate the mechanisms by which they control splicing. Consistent with current models of alternative splicing, <italic>cis</italic> elements are predicted to be binding sites for <italic>trans</italic> factors. Our identification of the novel splicing regulatory sequence (T)CTATC will lead us to subsequent experiments to identify its potential protein partner. The lists we generated of potential splicing regulatory elements include many sequences that have yet to be tested for a role in alternative splicing regulation. Experiments still need to be performed, similar to those done on <italic>unc-52</italic> and <italic>let-2,</italic> in which these elements are tested for a functional role in alternative splicing regulation. Due to the rapid release of new alignment programs and genomes, our list of conserved pentamers and hexamers will likely see some adjustments before all potential regulatory motifs have been tested. WABA has a limitation of needing to see relatively large sequence alignments in order to call a region as high homology (the minimum WABA high homology sequence run we detected was seven consecutive identical nucleotides). WABA high homology regions in introns flanking alternatively spliced exons were only detected for approximately 25% of alternative cassette exons in our dataset. The newer alignment algorithm PhastCons [<xref ref-type="bibr" rid="pcbi-0020086-b053">53</xref>], which uses an HMM to align multiple genomes using a smaller window size than that of WABA, can allow us to more accurately pinpoint smaller regions of conserved nucleotides within introns flanking additional alternatively spliced exons (unpublished data). The release of additional nematode genomes such as <named-content content-type="genus-species" xlink:type="simple">Caenorhabditis remanei</named-content> should provide us with the prospect of creating a three-way nematode genomic alignment, allowing us even more accuracy in our regulatory motif predictions. By systematically testing the pentamers and hexamers on our list of conserved motifs, we may be able to confirm more alternative splicing regulatory motifs. A compilation of these results will provide us with a better comprehension of the rules governing this complex and essential process.</p></sec><sec id="s4"><title>Materials and Methods</title><sec id="s4a"><title>Database construction.</title><p>A control dataset of introns was obtained by downloading from the UCSC Genome Browser (<ext-link ext-link-type="uri" xlink:href="http://www.genome.ucsc.edu" xlink:type="simple">http://www.genome.ucsc.edu</ext-link>) all of the introns in the <named-content content-type="genus-species" xlink:type="simple">C. elegans</named-content> genome as annotated in Wormbase release WS120. From the sequences of these 118,492 introns, we removed the first and last seven nucleotides to avoid constitutive splicing signals. We then counted the number of occurrences of every possible hexamer or pentamer motif in the database by using the EMBOSS Compseq program [<xref ref-type="bibr" rid="pcbi-0020086-b054">54</xref>]. For each motif in the database, we assigned a frequency score that was the number of occurrences of each motif divided by the total number of possible occurrences of motifs of that length in the dataset. This score for each possible motif in the control set was used in our analysis of both the introns that flank alternatively spliced exons and the conserved elements in these introns as our expected score. In order to obtain the obs/exp ratio for each motif in a test dataset, we divided the observed frequency score for each motif in that dataset by the expected frequency score for each motif based on the total intron control dataset.</p></sec><sec id="s4b"><title>Analysis of alternative exons.</title><p><named-content content-type="genus-species" xlink:type="simple">C. elegans</named-content> and <named-content content-type="genus-species" xlink:type="simple">C. briggsae</named-content> alignments for the 147 alternative spliced exons with intronic conservation were obtained from the UCSC Genome Table Browser conservation track [<xref ref-type="bibr" rid="pcbi-0020086-b055">55</xref>]. The mean nucleotide percentage identity was computed from this alignment along with the number of insertions and deletions. In order to obtain the mean amino acid identity, all the 147 exons were compared to the complete <named-content content-type="genus-species" xlink:type="simple">C. briggsae</named-content> genome (WormBase cb25.agp8) using TBLASTX [<xref ref-type="bibr" rid="pcbi-0020086-b056">56</xref>], and the mean amino acid identity was then calculated from these alignments.</p></sec><sec id="s4c"><title>Generation of <italic>let-2</italic> splicing reporter constructs.</title><p>We have previously described the development of an in vivo splicing reporter for the alternatively spliced region of the <italic>let-2</italic> gene fused to GFP and expressed in muscle cells [<xref ref-type="bibr" rid="pcbi-0020086-b037">37</xref>]. Site-directed mutagenesis of the wild-type reporter for <italic>let-2</italic> alternative splicing from that paper was used to delete the core of the first conserved element, indicated in <xref ref-type="fig" rid="pcbi-0020086-g002">Figure 2</xref>, and replace it with GAA. Methods for detecting alternative splicing of this transcript with <sup>32</sup>P-labeled primers using RT-PCR, denaturing polyacrylamide gel electrophoresis, and autoradiography have been previously described [<xref ref-type="bibr" rid="pcbi-0020086-b037">37</xref>].</p></sec><sec id="s4d"><title>Generation of <italic>unc-52</italic> splicing reporter constructs.</title><p>The exon 15–19 region of <italic>unc-52</italic> was PCR-amplified from wild-type (N2) <named-content content-type="genus-species" xlink:type="simple">C. elegans</named-content> genomic DNA using primers 5′-GGAATTCGATGAGTACATCTGTATCGC and 5′-GGAATTCACATCTGAACTGATGTCGCTC for cloning into the vector pPD96.02, developed by Andrew Fire's lab. This vector contains the <italic>unc-54</italic> body wall muscle-specific promoter driving expression of a green fluorescent protein (GFP)/β galactosidase (lacZ) fusion protein with an N-terminal nuclear localization signal derived from SV40 T antigen. The final 127 nucleotides of exon 15 through the first 173 nucleotides of exon 19 of <italic>unc-52</italic> and all the genomic sequence in between were cloned into a unique EcoRI site, 16 codons before the end of the lacZ open reading frame in the final exon of the fusion protein. The Kunkel method of site-directed mutagenesis was used to create the larger deletion and mutations for the plasmid constructs Mutation B and Deletion B [<xref ref-type="bibr" rid="pcbi-0020086-b057">57</xref>]. Pentamer and hexamer deletion constructs of the conserved <italic>unc-52</italic> intron sequence were created using the Quickchange site-directed mutagenesis kit (Stratagene, La Jolla, California, United States) according to the manufacturer's instructions. Animals carrying these constructs as extra-chromosomal arrays were generated by standard injection/transformation [<xref ref-type="bibr" rid="pcbi-0020086-b058">58</xref>]. Transformed N2 animals were identified by GFP-expression in nuclei of body wall muscle cells.</p></sec><sec id="s4e"><title>Growth of <named-content content-type="genus-species" xlink:type="simple">C. elegans</named-content> strains and isolation of RNA.</title><p><named-content content-type="genus-species" xlink:type="simple">C. elegans</named-content> strains were grown on NGM agar plates using standard methods [<xref ref-type="bibr" rid="pcbi-0020086-b059">59</xref>]. RNA was extracted from worms as previously described [<xref ref-type="bibr" rid="pcbi-0020086-b060">60</xref>]. Strain CB938 carrying the <italic>mec-8(e398)</italic> mutant allele was obtained from the <named-content content-type="genus-species" xlink:type="simple">C. elegans</named-content> Genetics Center, a National Institutes of Health funded Center for Research Resources at the University of Minnesota.</p></sec><sec id="s4f"><title>Production of cDNAs.</title><p>cDNAs of the <italic>unc-52</italic> splicing reporters were made in 25-μl reaction mixtures. The annealing step contained 3 μg total RNA and 25-pmol oligodeoxynucleotide primer complementary to the lacZ construct (5′- GTTGAAGAGTAATTGGACTTA-3′ for <named-content content-type="genus-species" xlink:type="simple">C. elegans</named-content> and 5′- AACTGGTGTCGCTCTCCT-3′ for <named-content content-type="genus-species" xlink:type="simple">C. briggsae</named-content>) in 17-μl final volume. These were heated to 94 °C for 2 min and cooled to room temperature for 10 min. The rest of the reverse transcription reaction components were added to reach a final volume of 25 μl. The final reaction mixtures consisted of 1 mM each of dATP, dCTP, dGTP, and dTTP; 1 U RNA Guard (Promega, Madison, Wisconsin, United States); 1 × AMV RT buffer (Promega); and 10 U AMV reverse transcriptase (Promega). Reactions were incubated at 37 °C for 1.5 h and stored at −20 °C.</p></sec><sec id="s4g"><title>Polymerase chain reaction.</title><p>1.0 μl of the cDNA reaction mixture was used as the template in 25-μl PCR reaction mixtures. 1.0 pmoles of the same oligonucleotide used in the reverse transcription reactions was added to PCR reaction mixtures along with <sup>32</sup>P-labeled 5′ lacZ vector-specific primer (5′-CTGGAGCCCGTCAGTATCGGC-3′ for <named-content content-type="genus-species" xlink:type="simple">C. elegans</named-content> and 5′-ATTCGTTGCTGGGTCCCAGG-3′ for <named-content content-type="genus-species" xlink:type="simple">C. briggsae</named-content>). The reaction mixtures also contained 1 × PCR buffer, 0.25 mM of each of the four dNTPs, and <italic>Taq</italic> DNA polymerase. The 5′ oligo was labeled with (γ-<sup>32</sup>P) ATP by T4 polynucleotide kinase. Reaction mixtures were incubated for 25 cycles at 94 °C for 1.0 min, 59 °C for 1.0 min, and 72 °C for 1.0 min. 2.0 μl of PCR product were digested with the restriction enzyme BamHI. There is a unique BamH1 site in <italic>unc-52</italic> exon 18, and this digestion step allows us to distinguish the different alternatively spliced isoforms more clearly on the gel. Digested PCR products were separated on 40-cm long, 0.4-mm thick, 5% or 6% polyacrylamide urea gels in TBE buffer. Gels were dried onto filter paper. These were then visualized using a Molecular Dynamics PhosphorImager (Sunnyvale, California, United States). Relative splice-site usage was quantified using ImageQuant software as previously described [<xref ref-type="bibr" rid="pcbi-0020086-b037">37</xref>].</p></sec></sec><sec id="s5"><title>Supporting Information</title><supplementary-material id="pcbi-0020086-st001" mimetype="application/msexcel" position="float" xlink:href="info:doi/10.1371/journal.pcbi.0020086.st001" xlink:type="simple"><label>Table S1</label><caption><title>Complete Database of Highly Conserved Intronic Elements Used in Motif Analysis</title><p>Column (A) indicates <named-content content-type="genus-species" xlink:type="simple">C. elegans</named-content> gene name. Columns (B–AI) list the WABA high homology sequences found in <named-content content-type="genus-species" xlink:type="simple">C. elegans</named-content> introns flanking alternative exons of the corresponding gene.</p><p>(51 KB XLS)</p></caption></supplementary-material><supplementary-material id="pcbi-0020086-st002" mimetype="application/msexcel" position="float" xlink:href="info:doi/10.1371/journal.pcbi.0020086.st002" xlink:type="simple"><label>Table S2</label><caption><title>Complete Table Detailing Ranks of Pentamer and Hexamer Motifs in Introns Lacking Evolutionary Conservation Surrounding 307 Alternatively Spliced Exons</title><p>On both worksheets: Column (A) represents rank of motif from search based on obs/exp frequency in introns lacking evolutionary conservation downstream of alternative introns. Column (B) denotes motif and (C) contains the number of times the motif was observed in the dataset. (D) The observed frequency of the motif in the dataset. (E) Contains the expected frequency of motif based on total intron dataset. Column (F) is the ratio of observed frequency to expected frequency. Columns (H–M) are data from the same analysis in the same order for upstream introns.</p><p>(1.2 MB XLS)</p></caption></supplementary-material><supplementary-material id="pcbi-0020086-st003" mimetype="image/tiff" position="float" xlink:href="info:doi/10.1371/journal.pcbi.0020086.st003" xlink:type="simple"><label>Table S3</label><caption><title>Each Row in the Table Represents a Different Spliced Isoform of the <italic>unc-52</italic> Reporter Constructs, and Each Column Denotes the Reporter Being Monitored</title><p>The first six columns show the relative percentage of alternative splice-site usage of the specified reporter in a <italic>mec-8(+)</italic> background as quantified from <sup>32</sup>P RT-PCR<italic>.</italic> The seventh column shows results of the wild-type sequence reporter that has been crossed into <italic>mec-8(e398)</italic> mutant animals.</p><p>(185 KB TIF)</p></caption></supplementary-material></sec></body><back><ack><p>We are grateful to Jim Kent for his work to establish the WABA alignment software and the Intronerator and UCSC Genome Browsers. Many thanks to Jim Kent, Manny Ares, David Haussler, Guoping Gu, and all of the Zahler lab members for helpful discussions. Thanks to Valerie Hunt for technical assistance and Artem Lyubimov for initial construction of the <italic>unc-52</italic> splicing reporter.</p></ack><glossary><title>Abbreviations</title><def-list><def-item><term>EST</term><def><p>expressed sequence tag</p></def></def-item><def-item><term>HMM</term><def><p>hidden Markov model</p></def></def-item><def-item><term>obs/exp</term><def><p>observed over expected</p></def></def-item><def-item><term>pre-mRNA</term><def><p>precursor messenger RNA</p></def></def-item><def-item><term>PTB</term><def><p>polypyrimidine tract binding protein</p></def></def-item><def-item><term>WABA</term><def><p>Wobble Aware Bulk Aligner</p></def></def-item></def-list></glossary><ref-list><title>References</title><ref id="pcbi-0020086-b001"><label>1</label><element-citation publication-type="journal" xlink:type="simple">
					<collab xlink:type="simple">International Human Genome Sequencing Consortium</collab>
					<year>2004</year>
					<article-title>Finishing the euchromatic sequence of the human genome.</article-title>
					<source>Nature</source>
					<volume>431</volume>
					<fpage>931</fpage>
					<lpage>945</lpage>
				</element-citation></ref><ref id="pcbi-0020086-b002"><label>2</label><element-citation publication-type="journal" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Hide</surname><given-names>WA</given-names></name><name name-style="western"><surname>Babenko</surname><given-names>VN</given-names></name><name name-style="western"><surname>van Heusden</surname><given-names>PA</given-names></name><name name-style="western"><surname>Seoighe</surname><given-names>C</given-names></name><name name-style="western"><surname>Kelso</surname><given-names>JF</given-names></name></person-group>
					<year>2001</year>
					<article-title>The contribution of exon-skipping events on Chromosome 22 to protein coding diversity.</article-title>
					<source>Genome Res</source>
					<volume>11</volume>
					<fpage>1848</fpage>
					<lpage>1853</lpage>
				</element-citation></ref><ref id="pcbi-0020086-b003"><label>3</label><element-citation publication-type="journal" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Kan</surname><given-names>Z</given-names></name><name name-style="western"><surname>Rouchka</surname><given-names>EC</given-names></name><name name-style="western"><surname>Gish</surname><given-names>WR</given-names></name><name name-style="western"><surname>States</surname><given-names>DJ</given-names></name></person-group>
					<year>2001</year>
					<article-title>Gene structure prediction and alternative splicing analysis using genomically aligned ESTs.</article-title>
					<source>Genome Res</source>
					<volume>11</volume>
					<fpage>889</fpage>
					<lpage>900</lpage>
				</element-citation></ref><ref id="pcbi-0020086-b004"><label>4</label><element-citation publication-type="journal" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Modrek</surname><given-names>B</given-names></name><name name-style="western"><surname>Resch</surname><given-names>A</given-names></name><name name-style="western"><surname>Grasso</surname><given-names>C</given-names></name><name name-style="western"><surname>Lee</surname><given-names>C</given-names></name></person-group>
					<year>2001</year>
					<article-title>Genome-wide detection of alternative splicing in expressed sequences of human genes.</article-title>
					<source>Nucleic Acids Res</source>
					<volume>29</volume>
					<fpage>2850</fpage>
					<lpage>2859</lpage>
				</element-citation></ref><ref id="pcbi-0020086-b005"><label>5</label><element-citation publication-type="journal" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Croft</surname><given-names>L</given-names></name><name name-style="western"><surname>Schandorff</surname><given-names>S</given-names></name><name name-style="western"><surname>Clark</surname><given-names>F</given-names></name><name name-style="western"><surname>Burrage</surname><given-names>K</given-names></name><name name-style="western"><surname>Arctander</surname><given-names>P</given-names></name><etal/></person-group>
					<year>2000</year>
					<article-title>ISIS, the intron information system, reveals the high frequency of alternative splicing in the human genome.</article-title>
					<source>Nat Genet</source>
					<volume>24</volume>
					<fpage>340</fpage>
					<lpage>341</lpage>
				</element-citation></ref><ref id="pcbi-0020086-b006"><label>6</label><element-citation publication-type="journal" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Singh</surname><given-names>R</given-names></name></person-group>
					<year>2002</year>
					<article-title>RNA-protein interactions that regulate pre-mRNA splicing.</article-title>
					<source>Gene Expr</source>
					<volume>10</volume>
					<fpage>79</fpage>
					<lpage>92</lpage>
				</element-citation></ref><ref id="pcbi-0020086-b007"><label>7</label><element-citation publication-type="journal" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Caceres</surname><given-names>JF</given-names></name><name name-style="western"><surname>Kornblihtt</surname><given-names>AR</given-names></name></person-group>
					<year>2002</year>
					<article-title>Alternative splicing: Multiple control mechanisms and involvement in human disease.</article-title>
					<source>Trends Genet</source>
					<volume>18</volume>
					<fpage>186</fpage>
					<lpage>193</lpage>
				</element-citation></ref><ref id="pcbi-0020086-b008"><label>8</label><element-citation publication-type="journal" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Matlin</surname><given-names>AJ</given-names></name><name name-style="western"><surname>Clark</surname><given-names>F</given-names></name><name name-style="western"><surname>Smith</surname><given-names>CW</given-names></name></person-group>
					<year>2005</year>
					<article-title>Understanding alternative splicing: Towards a cellular code.</article-title>
					<source>Nat Rev Mol Cell Biol</source>
					<volume>6</volume>
					<fpage>386</fpage>
					<lpage>398</lpage>
				</element-citation></ref><ref id="pcbi-0020086-b009"><label>9</label><element-citation publication-type="journal" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Black</surname><given-names>DL</given-names></name></person-group>
					<year>1992</year>
					<article-title>Activation of c-src neuron specific splicing by an unusual RNA element in vivo and in vitro.</article-title>
					<source>Cell</source>
					<volume>69</volume>
					<fpage>795</fpage>
					<lpage>807</lpage>
				</element-citation></ref><ref id="pcbi-0020086-b010"><label>10</label><element-citation publication-type="journal" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Modafferi</surname><given-names>EF</given-names></name><name name-style="western"><surname>Black</surname><given-names>DL</given-names></name></person-group>
					<year>1997</year>
					<article-title>A complex intronic splicing enhancer from the c-src pre-mRNA activates inclusion of a heterologous exon.</article-title>
					<source>Mol Cell Biol</source>
					<volume>17</volume>
					<fpage>6537</fpage>
					<lpage>6545</lpage>
				</element-citation></ref><ref id="pcbi-0020086-b011"><label>11</label><element-citation publication-type="journal" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Markovtsov</surname><given-names>V</given-names></name><name name-style="western"><surname>Nikolic</surname><given-names>JM</given-names></name><name name-style="western"><surname>Goldman</surname><given-names>JA</given-names></name><name name-style="western"><surname>Turck</surname><given-names>CW</given-names></name><name name-style="western"><surname>Chou</surname><given-names>MY</given-names></name><etal/></person-group>
					<year>2000</year>
					<article-title>Cooperative assembly of an hnRNP complex induced by a tissue-specific homolog of polypyrimidine tract binding protein.</article-title>
					<source>Mol Cell Biol</source>
					<volume>20</volume>
					<fpage>7463</fpage>
					<lpage>7479</lpage>
				</element-citation></ref><ref id="pcbi-0020086-b012"><label>12</label><element-citation publication-type="journal" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Underwood</surname><given-names>JG</given-names></name><name name-style="western"><surname>Boutz</surname><given-names>PL</given-names></name><name name-style="western"><surname>Dougherty</surname><given-names>JD</given-names></name><name name-style="western"><surname>Stoilov</surname><given-names>P</given-names></name><name name-style="western"><surname>Black</surname><given-names>DL</given-names></name></person-group>
					<year>2005</year>
					<article-title>Homologs of the <named-content content-type="genus-species" xlink:type="simple">Caenorhabditis elegans</named-content> Fox-1 protein are neuronal splicing regulators in mammals.</article-title>
					<source>Mol Cell Biol</source>
					<volume>25</volume>
					<fpage>10005</fpage>
					<lpage>10016</lpage>
				</element-citation></ref><ref id="pcbi-0020086-b013"><label>13</label><element-citation publication-type="journal" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Jin</surname><given-names>Y</given-names></name><name name-style="western"><surname>Suzuki</surname><given-names>H</given-names></name><name name-style="western"><surname>Maegawa</surname><given-names>S</given-names></name><name name-style="western"><surname>Endo</surname><given-names>H</given-names></name><name name-style="western"><surname>Sugano</surname><given-names>S</given-names></name><etal/></person-group>
					<year>2003</year>
					<article-title>A vertebrate RNA-binding protein Fox-1 regulates tissue-specific splicing via the pentanucleotide GCAUG.</article-title>
					<source>Embo J</source>
					<volume>22</volume>
					<fpage>905</fpage>
					<lpage>912</lpage>
				</element-citation></ref><ref id="pcbi-0020086-b014"><label>14</label><element-citation publication-type="journal" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Huh</surname><given-names>GS</given-names></name><name name-style="western"><surname>Hynes</surname><given-names>RO</given-names></name></person-group>
					<year>1994</year>
					<article-title>Regulation of alternative pre-mRNA splicing by a novel repeated hexanucleotide element.</article-title>
					<source>Gene Dev</source>
					<volume>8</volume>
					<fpage>1561</fpage>
					<lpage>1574</lpage>
				</element-citation></ref><ref id="pcbi-0020086-b015"><label>15</label><element-citation publication-type="journal" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Hedjran</surname><given-names>F</given-names></name><name name-style="western"><surname>Yeakley</surname><given-names>JM</given-names></name><name name-style="western"><surname>Huh</surname><given-names>GS</given-names></name><name name-style="western"><surname>Hynes</surname><given-names>RO</given-names></name><name name-style="western"><surname>Rosenfeld</surname><given-names>MG</given-names></name></person-group>
					<year>1997</year>
					<article-title>Control of alternative pre-mRNA splicing by distributed pentameric repeats.</article-title>
					<source>Proc Natl Acad Sci U S A</source>
					<volume>94</volume>
					<fpage>12343</fpage>
					<lpage>12347</lpage>
				</element-citation></ref><ref id="pcbi-0020086-b016"><label>16</label><element-citation publication-type="journal" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Ryan</surname><given-names>KJ</given-names></name><name name-style="western"><surname>Cooper</surname><given-names>TA</given-names></name></person-group>
					<year>1996</year>
					<article-title>Muscle-specific splicing enhancers regulate inclusion of the cardiac troponin T alternative exon in embryonic skeletal muscle.</article-title>
					<source>Mol Cell Biol</source>
					<volume>16</volume>
					<fpage>4014</fpage>
					<lpage>4023</lpage>
				</element-citation></ref><ref id="pcbi-0020086-b017"><label>17</label><element-citation publication-type="journal" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Charlet</surname><given-names>BN</given-names></name><name name-style="western"><surname>Logan</surname><given-names>P</given-names></name><name name-style="western"><surname>Singh</surname><given-names>G</given-names></name><name name-style="western"><surname>Cooper</surname><given-names>TA</given-names></name></person-group>
					<year>2002</year>
					<article-title>Dynamic antagonism between ETR-3 and PTB regulates cell type-specific alternative splicing.</article-title>
					<source>Molecular Cell</source>
					<volume>9</volume>
					<fpage>649</fpage>
					<lpage>658</lpage>
				</element-citation></ref><ref id="pcbi-0020086-b018"><label>18</label><element-citation publication-type="journal" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Jensen</surname><given-names>KB</given-names></name><name name-style="western"><surname>Musunuru</surname><given-names>K</given-names></name><name name-style="western"><surname>Lewis</surname><given-names>HA</given-names></name><name name-style="western"><surname>Burley</surname><given-names>SK</given-names></name><name name-style="western"><surname>Darnell</surname><given-names>RB</given-names></name></person-group>
					<year>2000</year>
					<article-title>The tetranucleotide UCAY directs the specific recognition of RNA by the Nova K-homology 3 domain.</article-title>
					<source>Proc Natl Acad Sci U S A</source>
					<volume>97</volume>
					<fpage>5740</fpage>
					<lpage>5745</lpage>
				</element-citation></ref><ref id="pcbi-0020086-b019"><label>19</label><element-citation publication-type="journal" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Jensen</surname><given-names>KB</given-names></name><name name-style="western"><surname>Dredge</surname><given-names>BK</given-names></name><name name-style="western"><surname>Stefani</surname><given-names>G</given-names></name><name name-style="western"><surname>Zhong</surname><given-names>R</given-names></name><name name-style="western"><surname>Buckanovich</surname><given-names>RJ</given-names></name><etal/></person-group>
					<year>2000</year>
					<article-title>Nova-1 regulates neuron-specific alternative splicing and is essential for neuronal viability.</article-title>
					<source>Neuron</source>
					<volume>25</volume>
					<fpage>359</fpage>
					<lpage>371</lpage>
				</element-citation></ref><ref id="pcbi-0020086-b020"><label>20</label><element-citation publication-type="journal" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Polydorides</surname><given-names>AD</given-names></name><name name-style="western"><surname>Okano</surname><given-names>HJ</given-names></name><name name-style="western"><surname>Yang</surname><given-names>YY</given-names></name><name name-style="western"><surname>Stefani</surname><given-names>G</given-names></name><name name-style="western"><surname>Darnell</surname><given-names>RB</given-names></name></person-group>
					<year>2000</year>
					<article-title>A brain-enriched polypyrimidine tract-binding protein antagonizes the ability of Nova to regulate neuron-specific alternative splicing.</article-title>
					<source>Proc Natl Acad Sci U S A</source>
					<volume>97</volume>
					<fpage>6350</fpage>
					<lpage>6355</lpage>
				</element-citation></ref><ref id="pcbi-0020086-b021"><label>21</label><element-citation publication-type="journal" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Sorek</surname><given-names>R</given-names></name><name name-style="western"><surname>Ast</surname><given-names>G</given-names></name></person-group>
					<year>2003</year>
					<article-title>Intronic sequences flanking alternatively spliced exons are conserved between human and mouse.</article-title>
					<source>Genome Res</source>
					<volume>13</volume>
					<fpage>1631</fpage>
					<lpage>1637</lpage>
				</element-citation></ref><ref id="pcbi-0020086-b022"><label>22</label><element-citation publication-type="journal" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Yeo</surname><given-names>GW</given-names></name><name name-style="western"><surname>Van Nostrand</surname><given-names>E</given-names></name><name name-style="western"><surname>Holste</surname><given-names>D</given-names></name><name name-style="western"><surname>Poggio</surname><given-names>T</given-names></name><name name-style="western"><surname>Burge</surname><given-names>CB</given-names></name></person-group>
					<year>2005</year>
					<article-title>Identification and analysis of alternative splicing events conserved in human and mouse.</article-title>
					<source>Proc Natl Acad Sci U S A</source>
					<volume>102</volume>
					<fpage>2850</fpage>
					<lpage>2855</lpage>
				</element-citation></ref><ref id="pcbi-0020086-b023"><label>23</label><element-citation publication-type="journal" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Minovitsky</surname><given-names>S</given-names></name><name name-style="western"><surname>Gee</surname><given-names>SL</given-names></name><name name-style="western"><surname>Schokrpur</surname><given-names>S</given-names></name><name name-style="western"><surname>Dubchak</surname><given-names>I</given-names></name><name name-style="western"><surname>Conboy</surname><given-names>JG</given-names></name></person-group>
					<year>2005</year>
					<article-title>The splicing regulatory element, UGCAUG, is phylogenetically and spatially conserved in introns that flank tissue-specific alternative exons.</article-title>
					<source>Nucleic Acids Res</source>
					<volume>33</volume>
					<fpage>714</fpage>
					<lpage>724</lpage>
				</element-citation></ref><ref id="pcbi-0020086-b024"><label>24</label><element-citation publication-type="journal" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Kent</surname><given-names>WJ</given-names></name><name name-style="western"><surname>Zahler</surname><given-names>AM</given-names></name></person-group>
					<year>2000</year>
					<article-title>The Intronerator: Exploring introns and alternative splicing in <named-content content-type="genus-species" xlink:type="simple">Caenorhabditis elegans</named-content>.</article-title>
					<source>Nucleic Acids Res</source>
					<volume>28</volume>
					<fpage>91</fpage>
					<lpage>93</lpage>
				</element-citation></ref><ref id="pcbi-0020086-b025"><label>25</label><element-citation publication-type="journal" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Kent</surname><given-names>WJ</given-names></name><name name-style="western"><surname>Zahler</surname><given-names>AM</given-names></name></person-group>
					<year>2000</year>
					<article-title>Conservation, regulation, synteny, and introns in a large-scale <italic>C. briggsae/C. elegans</italic> genomic alignment.</article-title>
					<source>Genome Res</source>
					<volume>10</volume>
					<fpage>1115</fpage>
					<lpage>1125</lpage>
				</element-citation></ref><ref id="pcbi-0020086-b026"><label>26</label><element-citation publication-type="journal" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Stein</surname><given-names>LD</given-names></name><name name-style="western"><surname>Bao</surname><given-names>Z</given-names></name><name name-style="western"><surname>Blasiar</surname><given-names>D</given-names></name><name name-style="western"><surname>Blumenthal</surname><given-names>T</given-names></name><name name-style="western"><surname>Brent</surname><given-names>MR</given-names></name><etal/></person-group>
					<year>2003</year>
					<article-title>The genome sequence of <italic>Caenorhabditis briggsae:</italic> A platform for comparative genomics.</article-title>
					<source>PLoS Biol</source>
					<volume>1</volume>
					<elocation-id>e45.</elocation-id>
					<comment>DOI: <ext-link ext-link-type="doi" xlink:href="http://dx.doi.org/10.1371/journal.pbio.0000045" xlink:type="simple">10.1371/journal.pbio.0000045</ext-link></comment>
				</element-citation></ref><ref id="pcbi-0020086-b027"><label>27</label><element-citation publication-type="journal" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Fairbrother</surname><given-names>WG</given-names></name><name name-style="western"><surname>Yeh</surname><given-names>RF</given-names></name><name name-style="western"><surname>Sharp</surname><given-names>PA</given-names></name><name name-style="western"><surname>Burge</surname><given-names>CB</given-names></name></person-group>
					<year>2002</year>
					<article-title>Predictive identification of exonic splicing enhancers in human genes.</article-title>
					<source>Science</source>
					<volume>297</volume>
					<fpage>1007</fpage>
					<lpage>1013</lpage>
				</element-citation></ref><ref id="pcbi-0020086-b028"><label>28</label><element-citation publication-type="journal" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Burd</surname><given-names>CG</given-names></name><name name-style="western"><surname>Dreyfuss</surname><given-names>G</given-names></name></person-group>
					<year>1994</year>
					<article-title>RNA-binding specificity of hnRNP A1: Significance of hnRNP A1 high-affinity binding sites in pre-mRNA splicing.</article-title>
					<source>EMBO J</source>
					<volume>13</volume>
					<fpage>1197</fpage>
					<lpage>1204</lpage>
				</element-citation></ref><ref id="pcbi-0020086-b029"><label>29</label><element-citation publication-type="journal" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Tacke</surname><given-names>R</given-names></name><name name-style="western"><surname>Manley</surname><given-names>JL</given-names></name></person-group>
					<year>1995</year>
					<article-title>The human splicing factors ASF/SF2 and SC35 possess distinct, functionally significant RNA-binding specificities.</article-title>
					<source>EMBO J</source>
					<volume>14</volume>
					<fpage>3540</fpage>
					<lpage>3551</lpage>
				</element-citation></ref><ref id="pcbi-0020086-b030"><label>30</label><element-citation publication-type="journal" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Caputi</surname><given-names>M</given-names></name><name name-style="western"><surname>Zahler</surname><given-names>AM</given-names></name></person-group>
					<year>2001</year>
					<article-title>Determination of the RNA-binding specificity of the heterogenous nuclear ribonucleoprotein (hnRNP) H/H′/F/2H9 family.</article-title>
					<source>J Biol Chem</source>
					<volume>276</volume>
					<fpage>43850</fpage>
					<lpage>43859</lpage>
				</element-citation></ref><ref id="pcbi-0020086-b031"><label>31</label><element-citation publication-type="other" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Moore</surname><given-names>MJ</given-names></name><name name-style="western"><surname>Query</surname><given-names>CC</given-names></name><name name-style="western"><surname>Sharp</surname><given-names>PA</given-names></name></person-group>
					<year>1993</year>
					<article-title>Splicing of precursors to mRNA by the spliceosome.</article-title>
					<comment>In:</comment>
					<person-group person-group-type="editor"><name name-style="western"><surname>Gesteland</surname><given-names>RF</given-names></name><name name-style="western"><surname>Atkins</surname><given-names>JF</given-names></name></person-group>
					<source>The RNA world</source>
					<publisher-loc>New York</publisher-loc>
					<publisher-name>Cold Spring Harbor Press</publisher-name>
					<comment>pp.</comment>
					<fpage>303</fpage>
					<lpage>357</lpage>
				</element-citation></ref><ref id="pcbi-0020086-b032"><label>32</label><element-citation publication-type="journal" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Ladd</surname><given-names>AN</given-names></name><name name-style="western"><surname>Charlet</surname><given-names>N</given-names></name><name name-style="western"><surname>Cooper</surname><given-names>TA</given-names></name></person-group>
					<year>2001</year>
					<article-title>The CELF family of RNA-binding proteins is implicated in cell-specific and developmentally regulated alternative splicing.</article-title>
					<source>Mol Cell Biol</source>
					<volume>21</volume>
					<fpage>1285</fpage>
					<lpage>1296</lpage>
				</element-citation></ref><ref id="pcbi-0020086-b033"><label>33</label><element-citation publication-type="other" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Zahler</surname><given-names>AM</given-names></name></person-group>
					<year>2005</year>
					<source>Alternative splicing in <italic>C. elegans</italic>. The <italic><named-content content-type="genus-species" xlink:type="simple">C. elegans</named-content></italic> research community. Wormbook. DOI: 10.1895/wormbook.1.31.1</source>
					<comment>Available: <ext-link ext-link-type="uri" xlink:href="http://www.wormbook.org" xlink:type="simple">http://www.wormbook.org</ext-link>. Accessed 25 September 2005.</comment>
				</element-citation></ref><ref id="pcbi-0020086-b034"><label>34</label><element-citation publication-type="journal" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Zorio</surname><given-names>DA</given-names></name><name name-style="western"><surname>Blumenthal</surname><given-names>T</given-names></name></person-group>
					<year>1999</year>
					<article-title>Both subunits of U2AF recognize the 3′ splice site in <named-content content-type="genus-species" xlink:type="simple">C. elegans</named-content>.</article-title>
					<source>Nature</source>
					<volume>402</volume>
					<fpage>835</fpage>
					<lpage>838</lpage>
				</element-citation></ref><ref id="pcbi-0020086-b035"><label>35</label><element-citation publication-type="journal" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Pettitt</surname><given-names>J</given-names></name><name name-style="western"><surname>Kingston</surname><given-names>IB</given-names></name></person-group>
					<year>1994</year>
					<article-title>Developmentally regulated alternative splicing of a nematode type IV collagen gene.</article-title>
					<source>Dev Biol</source>
					<volume>161</volume>
					<fpage>22</fpage>
					<lpage>29</lpage>
				</element-citation></ref><ref id="pcbi-0020086-b036"><label>36</label><element-citation publication-type="journal" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Sibley</surname><given-names>MH</given-names></name><name name-style="western"><surname>Johnson</surname><given-names>JJ</given-names></name><name name-style="western"><surname>Mello</surname><given-names>CC</given-names></name><name name-style="western"><surname>Kramer</surname><given-names>JM</given-names></name></person-group>
					<year>1993</year>
					<article-title>Genetic identification, sequence, and alternative splicing of the <named-content content-type="genus-species" xlink:type="simple">Caenorhabditis elegans</named-content> alpha 2 (IV) collagen gene.</article-title>
					<source>J Cell Biol</source>
					<volume>123</volume>
					<fpage>255</fpage>
					<lpage>264</lpage>
				</element-citation></ref><ref id="pcbi-0020086-b037"><label>37</label><element-citation publication-type="journal" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Farrer</surname><given-names>T</given-names></name><name name-style="western"><surname>Roller</surname><given-names>AB</given-names></name><name name-style="western"><surname>Kent</surname><given-names>WJ</given-names></name><name name-style="western"><surname>Zahler</surname><given-names>AM</given-names></name></person-group>
					<year>2002</year>
					<article-title>Analysis of the role of <named-content content-type="genus-species" xlink:type="simple">Caenorhabditis elegans</named-content> GC-AG introns in regulated splicing.</article-title>
					<source>Nucleic Acids Res</source>
					<volume>30</volume>
					<fpage>3360</fpage>
					<lpage>3367</lpage>
				</element-citation></ref><ref id="pcbi-0020086-b038"><label>38</label><element-citation publication-type="other" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Blumenthal</surname><given-names>T</given-names></name><name name-style="western"><surname>Steward</surname><given-names>K</given-names></name></person-group>
					<year>1997</year>
					<article-title>RNA processing and gene structure.</article-title>
					<comment>In:</comment>
					<person-group person-group-type="editor"><name name-style="western"><surname>Riddle</surname><given-names>DL</given-names></name><name name-style="western"><surname>Blumenthal</surname><given-names>T</given-names></name><name name-style="western"><surname>Meyer</surname><given-names>BJ</given-names></name><name name-style="western"><surname>Priess</surname><given-names>JR</given-names></name></person-group>
					<source>C. elegans II</source>
					<publisher-loc>Plainview (New York)</publisher-loc>
					<publisher-name>Cold Spring Harbor Laboratory Press</publisher-name>
					<comment>pp.</comment>
					<fpage>117</fpage>
					<lpage>145</lpage>
				</element-citation></ref><ref id="pcbi-0020086-b039"><label>39</label><element-citation publication-type="journal" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Lim</surname><given-names>LP</given-names></name><name name-style="western"><surname>Sharp</surname><given-names>PA</given-names></name></person-group>
					<year>1998</year>
					<article-title>Alternative splicing of the fibronectin EIIIB exon depends on specific TGCATG repeats.</article-title>
					<source>Mol Cell Biol</source>
					<volume>18</volume>
					<fpage>3900</fpage>
					<lpage>3906</lpage>
				</element-citation></ref><ref id="pcbi-0020086-b040"><label>40</label><element-citation publication-type="journal" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Nicoll</surname><given-names>M</given-names></name><name name-style="western"><surname>Akerib</surname><given-names>CC</given-names></name><name name-style="western"><surname>Meyer</surname><given-names>BJ</given-names></name></person-group>
					<year>1997</year>
					<article-title>X-chromosome-counting mechanisms that determine nematode sex.</article-title>
					<source>Nature</source>
					<volume>388</volume>
					<fpage>200</fpage>
					<lpage>204</lpage>
				</element-citation></ref><ref id="pcbi-0020086-b041"><label>41</label><element-citation publication-type="journal" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Buratti</surname><given-names>E</given-names></name><name name-style="western"><surname>Brindisi</surname><given-names>A</given-names></name><name name-style="western"><surname>Pagani</surname><given-names>F</given-names></name><name name-style="western"><surname>Baralle</surname><given-names>FE</given-names></name></person-group>
					<year>2004</year>
					<article-title>Nuclear factor TDP-43 binds to the polymorphic TG repeats in CFTR intron 8 and causes skipping of exon 9: A functional link with disease penetrance.</article-title>
					<source>Am J Hum Genet</source>
					<volume>74</volume>
					<fpage>1322</fpage>
					<lpage>1325</lpage>
				</element-citation></ref><ref id="pcbi-0020086-b042"><label>42</label><element-citation publication-type="journal" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Faustino</surname><given-names>NA</given-names></name><name name-style="western"><surname>Cooper</surname><given-names>TA</given-names></name></person-group>
					<year>2005</year>
					<article-title>Identification of putative new splicing targets for ETR-3 using sequences identified by systematic evolution of ligands by exponential enrichment.</article-title>
					<source>Mol Cell Biol</source>
					<volume>25</volume>
					<fpage>879</fpage>
					<lpage>887</lpage>
				</element-citation></ref><ref id="pcbi-0020086-b043"><label>43</label><element-citation publication-type="journal" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Chou</surname><given-names>MY</given-names></name><name name-style="western"><surname>Underwood</surname><given-names>JG</given-names></name><name name-style="western"><surname>Nikolic</surname><given-names>J</given-names></name><name name-style="western"><surname>Luu</surname><given-names>MH</given-names></name><name name-style="western"><surname>Black</surname><given-names>DL</given-names></name></person-group>
					<year>2000</year>
					<article-title>Multi-site RNA binding and release of polypyrimidine tract binding protein during the regulation of c-src neural-specific splicing.</article-title>
					<source>Mol Cell</source>
					<volume>5</volume>
					<fpage>949</fpage>
					<lpage>957</lpage>
				</element-citation></ref><ref id="pcbi-0020086-b044"><label>44</label><element-citation publication-type="journal" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Anyanful</surname><given-names>A</given-names></name><name name-style="western"><surname>Ono</surname><given-names>K</given-names></name><name name-style="western"><surname>Johnsen</surname><given-names>RC</given-names></name><name name-style="western"><surname>Ly</surname><given-names>H</given-names></name><name name-style="western"><surname>Jensen</surname><given-names>V</given-names></name><etal/></person-group>
					<year>2004</year>
					<article-title>The RNA-binding protein SUP-12 controls muscle-specific splicing of the ADF/cofilin pre-mRNA in <named-content content-type="genus-species" xlink:type="simple">C. elegans</named-content>.</article-title>
					<source>J Cell Biol</source>
					<volume>167</volume>
					<fpage>639</fpage>
					<lpage>647</lpage>
				</element-citation></ref><ref id="pcbi-0020086-b045"><label>45</label><element-citation publication-type="journal" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Rogalski</surname><given-names>TM</given-names></name><name name-style="western"><surname>Gilchrist</surname><given-names>EJ</given-names></name><name name-style="western"><surname>Mullen</surname><given-names>GP</given-names></name><name name-style="western"><surname>Moerman</surname><given-names>DG</given-names></name></person-group>
					<year>1995</year>
					<article-title>Mutations in the <italic>unc-52</italic> gene responsible for body wall muscle defects in adult <named-content content-type="genus-species" xlink:type="simple">Caenorhabditis elegans</named-content> are located in alternatively spliced exons.</article-title>
					<source>Genetics</source>
					<volume>139</volume>
					<fpage>159</fpage>
					<lpage>169</lpage>
				</element-citation></ref><ref id="pcbi-0020086-b046"><label>46</label><element-citation publication-type="journal" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Lundquist</surname><given-names>EA</given-names></name><name name-style="western"><surname>Herman</surname><given-names>RK</given-names></name><name name-style="western"><surname>Rogalski</surname><given-names>TM</given-names></name><name name-style="western"><surname>Mullen</surname><given-names>GP</given-names></name><name name-style="western"><surname>Moerman</surname><given-names>DG</given-names></name><etal/></person-group>
					<year>1996</year>
					<article-title>The <italic>mec-8</italic> gene of <named-content content-type="genus-species" xlink:type="simple">C. elegans</named-content> encodes a protein with two RNA recognition motifs and regulates alternative splicing of <italic>unc-52</italic> transcripts.</article-title>
					<source>Development</source>
					<volume>122</volume>
					<fpage>1601</fpage>
					<lpage>1610</lpage>
				</element-citation></ref><ref id="pcbi-0020086-b047"><label>47</label><element-citation publication-type="journal" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Spike</surname><given-names>CA</given-names></name><name name-style="western"><surname>Davies</surname><given-names>AG</given-names></name><name name-style="western"><surname>Shaw</surname><given-names>JE</given-names></name><name name-style="western"><surname>Herman</surname><given-names>RK</given-names></name></person-group>
					<year>2002</year>
					<article-title>MEC-8 regulates alternative splicing of <italic>unc-52</italic> transcripts in <named-content content-type="genus-species" xlink:type="simple">C. elegans</named-content> hypodermal cells.</article-title>
					<source>Development</source>
					<volume>129</volume>
					<fpage>4999</fpage>
					<lpage>5008</lpage>
				</element-citation></ref><ref id="pcbi-0020086-b048"><label>48</label><element-citation publication-type="journal" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Mullen</surname><given-names>GP</given-names></name><name name-style="western"><surname>Rogalski</surname><given-names>TM</given-names></name><name name-style="western"><surname>Bush</surname><given-names>JA</given-names></name><name name-style="western"><surname>Gorji</surname><given-names>PR</given-names></name><name name-style="western"><surname>Moerman</surname><given-names>DG</given-names></name></person-group>
					<year>1999</year>
					<article-title>Complex patterns of alternative splicing mediate the spatial and temporal distribution of perlecan/UNC-52 in <named-content content-type="genus-species" xlink:type="simple">Caenorhabditis elegans</named-content>.</article-title>
					<source>Mol Biol Cell</source>
					<volume>10</volume>
					<fpage>3205</fpage>
					<lpage>3221</lpage>
				</element-citation></ref><ref id="pcbi-0020086-b049"><label>49</label><element-citation publication-type="journal" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Yeo</surname><given-names>G</given-names></name><name name-style="western"><surname>Hoon</surname><given-names>S</given-names></name><name name-style="western"><surname>Venkatesh</surname><given-names>B</given-names></name><name name-style="western"><surname>Burge</surname><given-names>CB</given-names></name></person-group>
					<year>2004</year>
					<article-title>Variation in sequence and organization of splicing regulatory elements in vertebrate genes.</article-title>
					<source>Proc Natl Acad Sci U S A</source>
					<volume>101</volume>
					<fpage>15700</fpage>
					<lpage>15705</lpage>
				</element-citation></ref><ref id="pcbi-0020086-b050"><label>50</label><element-citation publication-type="journal" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Min</surname><given-names>H</given-names></name><name name-style="western"><surname>Turck</surname><given-names>CW</given-names></name><name name-style="western"><surname>Nikolic</surname><given-names>JM</given-names></name><name name-style="western"><surname>Black</surname><given-names>DL</given-names></name></person-group>
					<year>1997</year>
					<article-title>A new regulatory protein, KSRP, mediates exon inclusion through an intronic splicing enhancer.</article-title>
					<source>Genes Dev</source>
					<volume>11</volume>
					<fpage>1023</fpage>
					<lpage>1036</lpage>
				</element-citation></ref><ref id="pcbi-0020086-b051"><label>51</label><element-citation publication-type="journal" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Ratsch</surname><given-names>G</given-names></name><name name-style="western"><surname>Sonnenburg</surname><given-names>S</given-names></name><name name-style="western"><surname>Scholkopf</surname><given-names>B</given-names></name></person-group>
					<year>2005</year>
					<article-title>RASE: Recognition of alternatively spliced exons in <named-content content-type="genus-species" xlink:type="simple">C. elegans</named-content>.</article-title>
					<source>Bioinformatics</source>
					<comment>21 Suppl</comment>
					<volume>1</volume>
					<fpage>i369</fpage>
					<lpage>377</lpage>
				</element-citation></ref><ref id="pcbi-0020086-b052"><label>52</label><element-citation publication-type="journal" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Sanford</surname><given-names>JR</given-names></name><name name-style="western"><surname>Ellis</surname><given-names>J</given-names></name><name name-style="western"><surname>Caceres</surname><given-names>JF</given-names></name></person-group>
					<year>2005</year>
					<article-title>Multiple roles of arginine/serine-rich splicing factors in RNA processing.</article-title>
					<source>Biochem Soc Trans</source>
					<volume>33</volume>
					<fpage>443</fpage>
					<lpage>446</lpage>
				</element-citation></ref><ref id="pcbi-0020086-b053"><label>53</label><element-citation publication-type="journal" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Siepel</surname><given-names>A</given-names></name><name name-style="western"><surname>Haussler</surname><given-names>D</given-names></name></person-group>
					<year>2004</year>
					<article-title>Combining phylogenetic and hidden Markov models in biosequence analysis.</article-title>
					<source>J Comput Biol</source>
					<volume>11</volume>
					<fpage>413</fpage>
					<lpage>428</lpage>
				</element-citation></ref><ref id="pcbi-0020086-b054"><label>54</label><element-citation publication-type="journal" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Rice</surname><given-names>P</given-names></name><name name-style="western"><surname>Longden</surname><given-names>I</given-names></name><name name-style="western"><surname>Bleasby</surname><given-names>A</given-names></name></person-group>
					<year>2000</year>
					<article-title>EMBOSS: The European Molecular Biology Open Software Suite.</article-title>
					<source>Trends Genet</source>
					<volume>16</volume>
					<fpage>276</fpage>
					<lpage>277</lpage>
				</element-citation></ref><ref id="pcbi-0020086-b055"><label>55</label><element-citation publication-type="journal" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Karolchik</surname><given-names>D</given-names></name><name name-style="western"><surname>Hinrichs</surname><given-names>AS</given-names></name><name name-style="western"><surname>Furey</surname><given-names>TS</given-names></name><name name-style="western"><surname>Roskin</surname><given-names>KM</given-names></name><name name-style="western"><surname>Sugnet</surname><given-names>CW</given-names></name><etal/></person-group>
					<year>2004</year>
					<article-title>The UCSC Table Browser data retrieval tool.</article-title>
					<source>Nucl Acids Res</source>
					<volume>32</volume>
					<fpage>D493</fpage>
					<lpage>D496</lpage>
				</element-citation></ref><ref id="pcbi-0020086-b056"><label>56</label><element-citation publication-type="journal" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Altschul</surname><given-names>SF</given-names></name><name name-style="western"><surname>Madden</surname><given-names>TL</given-names></name><name name-style="western"><surname>Schaffer</surname><given-names>AA</given-names></name><name name-style="western"><surname>Zhang</surname><given-names>J</given-names></name><name name-style="western"><surname>Zhang</surname><given-names>Z</given-names></name><etal/></person-group>
					<year>1997</year>
					<article-title>Gapped BLAST and PSI-BLAST: A new generation of protein database search programs.</article-title>
					<source>Nucl Acids Res</source>
					<volume>25</volume>
					<fpage>3389</fpage>
					<lpage>3402</lpage>
				</element-citation></ref><ref id="pcbi-0020086-b057"><label>57</label><element-citation publication-type="journal" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Kunkel</surname><given-names>TA</given-names></name><name name-style="western"><surname>Roberts</surname><given-names>JD</given-names></name><name name-style="western"><surname>Zakour</surname><given-names>RA</given-names></name></person-group>
					<year>1987</year>
					<article-title>Rapid and efficient site-specific mutagenesis without phenotypic selection.</article-title>
					<source>Methods Enzymol</source>
					<volume>154</volume>
					<fpage>367</fpage>
					<lpage>382</lpage>
				</element-citation></ref><ref id="pcbi-0020086-b058"><label>58</label><element-citation publication-type="journal" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Mello</surname><given-names>C</given-names></name><name name-style="western"><surname>Fire</surname><given-names>A</given-names></name></person-group>
					<year>1995</year>
					<article-title>DNA transformation.</article-title>
					<source>Methods Cell Biol</source>
					<volume>48</volume>
					<fpage>451</fpage>
					<lpage>482</lpage>
				</element-citation></ref><ref id="pcbi-0020086-b059"><label>59</label><element-citation publication-type="journal" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Lewis</surname><given-names>JA</given-names></name><name name-style="western"><surname>Fleming</surname><given-names>JT</given-names></name></person-group>
					<year>1995</year>
					<article-title>Basic culture methods.</article-title>
					<source>Methods Cell Biol</source>
					<volume>48</volume>
					<fpage>3</fpage>
					<lpage>29</lpage>
				</element-citation></ref><ref id="pcbi-0020086-b060"><label>60</label><element-citation publication-type="journal" xlink:type="simple">
					<person-group person-group-type="author"><name name-style="western"><surname>Roller</surname><given-names>AB</given-names></name><name name-style="western"><surname>Hoffman</surname><given-names>DC</given-names></name><name name-style="western"><surname>Zahler</surname><given-names>AM</given-names></name></person-group>
					<year>2000</year>
					<article-title>The allele-specific suppressor <italic>sup-39</italic> alters use of cryptic splice sites in <named-content content-type="genus-species" xlink:type="simple">C. elegans</named-content>.</article-title>
					<source>Genetics</source>
					<volume>154</volume>
					<fpage>1169</fpage>
					<lpage>1179</lpage>
				</element-citation></ref></ref-list></back></article>