<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article
  PUBLIC "-//NLM//DTD Journal Publishing DTD v3.0 20080202//EN" "http://dtd.nlm.nih.gov/publishing/3.0/journalpublishing3.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="3.0" xml:lang="en">
<front>
<journal-meta>
<journal-id journal-id-type="nlm-ta">PLoS ONE</journal-id>
<journal-id journal-id-type="publisher-id">plos</journal-id>
<journal-id journal-id-type="pmc">plosone</journal-id><journal-title-group>
<journal-title>PLoS ONE</journal-title></journal-title-group>
<issn pub-type="epub">1932-6203</issn>
<publisher>
<publisher-name>Public Library of Science</publisher-name>
<publisher-loc>San Francisco, USA</publisher-loc></publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="publisher-id">PONE-D-14-00837</article-id>
<article-id pub-id-type="doi">10.1371/journal.pone.0093827</article-id>
<article-categories><subj-group subj-group-type="heading"><subject>Research Article</subject></subj-group><subj-group subj-group-type="Discipline-v2"><subject>Biology and life sciences</subject><subj-group><subject>Biochemistry</subject><subj-group><subject>Nucleic acids</subject><subject>RNA</subject></subj-group></subj-group><subj-group><subject>Computational biology</subject><subj-group><subject>Comparative genomics</subject></subj-group></subj-group><subj-group><subject>Ecology</subject><subj-group><subject>Community ecology</subject><subj-group><subject>Community structure</subject></subj-group></subj-group><subj-group><subject>Biodiversity</subject><subject>Freshwater ecology</subject><subject>Microbial ecology</subject></subj-group></subj-group><subj-group><subject>Genetics</subject><subj-group><subject>Genomics</subject><subj-group><subject>Metagenomics</subject></subj-group></subj-group></subj-group><subj-group><subject>Marine biology</subject></subj-group><subj-group><subject>Microbiology</subject></subj-group></subj-group><subj-group subj-group-type="Discipline-v2"><subject>Ecology and environmental sciences</subject></subj-group></article-categories>
<title-group>
<article-title>Strengths and Limitations of 16S rRNA Gene Amplicon Sequencing in Revealing Temporal Microbial Community Dynamics</article-title>
<alt-title alt-title-type="running-head">Strengths and Limitations of 16S rRNA Sequencing</alt-title>
</title-group>
<contrib-group>
<contrib contrib-type="author" xlink:type="simple"><name name-style="western"><surname>Poretsky</surname><given-names>Rachel</given-names></name><xref ref-type="aff" rid="aff1"><sup>1</sup></xref><xref ref-type="corresp" rid="cor1"><sup>*</sup></xref><xref ref-type="fn" rid="fn1"><sup>¤</sup></xref></contrib>
<contrib contrib-type="author" xlink:type="simple"><name name-style="western"><surname>Rodriguez-R</surname><given-names>Luis M.</given-names></name><xref ref-type="aff" rid="aff2"><sup>2</sup></xref><xref ref-type="aff" rid="aff3"><sup>3</sup></xref></contrib>
<contrib contrib-type="author" xlink:type="simple"><name name-style="western"><surname>Luo</surname><given-names>Chengwei</given-names></name><xref ref-type="aff" rid="aff2"><sup>2</sup></xref><xref ref-type="aff" rid="aff3"><sup>3</sup></xref></contrib>
<contrib contrib-type="author" xlink:type="simple"><name name-style="western"><surname>Tsementzi</surname><given-names>Despina</given-names></name><xref ref-type="aff" rid="aff1"><sup>1</sup></xref></contrib>
<contrib contrib-type="author" xlink:type="simple"><name name-style="western"><surname>Konstantinidis</surname><given-names>Konstantinos T.</given-names></name><xref ref-type="aff" rid="aff1"><sup>1</sup></xref><xref ref-type="aff" rid="aff2"><sup>2</sup></xref><xref ref-type="aff" rid="aff3"><sup>3</sup></xref></contrib>
</contrib-group>
<aff id="aff1"><label>1</label><addr-line>School of Civil and Environmental Engineering, Georgia Institute of Technology, Atlanta, Georgia, United States of America</addr-line></aff>
<aff id="aff2"><label>2</label><addr-line>School of Biology, Georgia Institute of Technology, Atlanta, Georgia, United States of America</addr-line></aff>
<aff id="aff3"><label>3</label><addr-line>Center for Bioinformatics and Computational Genomics, Georgia Institute of Technology, Atlanta, Georgia, United States of America</addr-line></aff>
<contrib-group>
<contrib contrib-type="editor" xlink:type="simple"><name name-style="western"><surname>Rodriguez-Valera</surname><given-names>Francisco</given-names></name>
<role>Editor</role>
<xref ref-type="aff" rid="edit1"/></contrib>
</contrib-group>
<aff id="edit1"><addr-line>Universidad Miguel Hernandez, Spain</addr-line></aff>
<author-notes>
<corresp id="cor1">* E-mail: <email xlink:type="simple">microbe@uic.edu</email></corresp>
<fn fn-type="conflict"><p>The authors have declared that no competing interests exist.</p></fn>
<fn fn-type="con"><p>Conceived and designed the experiments: RP DT KTK. Performed the experiments: RP DT. Analyzed the data: RP LMR CL. Contributed reagents/materials/analysis tools: RP LMR CL DT KTK. Wrote the paper: RP KTK.</p></fn>
<fn id="fn1" fn-type="current-aff"><label>¤</label><p>Current address: Department of Biological Sciences, University of Illinois at Chicago, Chicago, Illinois, United States of America</p></fn>
</author-notes>
<pub-date pub-type="collection"><year>2014</year></pub-date>
<pub-date pub-type="epub"><day>8</day><month>4</month><year>2014</year></pub-date>
<volume>9</volume>
<issue>4</issue>
<elocation-id>e93827</elocation-id>
<history>
<date date-type="received"><day>8</day><month>1</month><year>2014</year></date>
<date date-type="accepted"><day>19</day><month>2</month><year>2014</year></date>
</history>
<permissions>
<copyright-year>2014</copyright-year>
<copyright-holder>Poretsky et al</copyright-holder><license xlink:type="simple"><license-p>This is an open-access article distributed under the terms of the <ext-link ext-link-type="uri" xlink:href="http://creativecommons.org/licenses/by/4.0/" xlink:type="simple">Creative Commons Attribution License</ext-link>, which permits unrestricted use, distribution, and reproduction in any medium, provided the original author and source are credited.</license-p></license></permissions>
<abstract>
<p>This study explored the short-term planktonic microbial community structure and resilience in Lake Lanier (GA, USA) while simultaneously evaluating the technical aspects of identifying taxa via 16S rRNA gene amplicon and metagenomic sequence data. 16S rRNA gene amplicons generated from four temporally discrete samples were sequenced with 454 GS-FLX-Ti yielding ∼40,000 rRNA gene sequences from each sample and representing ∼300 observed OTUs. Replicates obtained from the same biological sample clustered together but several biases were observed, linked to either the PCR or sequencing-preparation steps. In comparisons with companion whole-community shotgun metagenome datasets, the estimated number of OTUs at each timepoint was concordant, but 1.5 times and ∼10 times as many phyla and genera, respectively, were identified in the metagenomes. Our analyses showed that the 16S rRNA gene captures broad shifts in community diversity over time, but with limited resolution and lower sensitivity compared to metagenomic data. We also identified OTUs that showed marked shifts in abundance over four close timepoints separated by perturbations and tracked these taxa in the metagenome vs. 16S rRNA amplicon data. A strong summer storm had less of an effect on community composition than did seasonal mixing, which revealed a distinct succession of organisms. This study provides insights into freshwater microbial communities and advances the approaches for assessing community diversity and dynamics <italic>in situ</italic>.</p>
</abstract>
<funding-group><funding-statement>This research was supported in part by the U.S. Department of Energy (Award DE-SC0006662) and by the U.S. National Science Foundation (Award 1241046). The funders had no role in study design, data collection and analysis, decision to publish, or preparation of the manuscript.</funding-statement></funding-group><counts><page-count count="12"/></counts></article-meta>
</front>
<body><sec id="s1">
<title>Introduction</title>
<p>A key step in understanding microbial community structure, dynamics, and how organisms might influence or be influenced by their surroundings is to classify DNA sequences taxonomically or phylogenetically. To date, most studies of microbial communities in systems ranging from the open ocean to soil to the human gut have depended on a single gene, the 16S small subunit ribosomal RNA (rRNA) gene <xref ref-type="bibr" rid="pone.0093827-Costello1">[1]</xref>–<xref ref-type="bibr" rid="pone.0093827-Nemergut1">[4]</xref>. Massively parallel sequencing methods are increasingly being applied to the characterization of microbial communities based on amplification of this gene and have led to a better appreciation of extant biodiversity <xref ref-type="bibr" rid="pone.0093827-Sogin1">[5]</xref>; however, the 16S rRNA -based techniques are known to be limited by the short read lengths obtained, sequencing errors <xref ref-type="bibr" rid="pone.0093827-Quince1">[6]</xref>, <xref ref-type="bibr" rid="pone.0093827-Quince2">[7]</xref>, differences arising from the different regions chosen <xref ref-type="bibr" rid="pone.0093827-Youssef1">[8]</xref>, and difficulties in assessing operational taxonomic units (OTUs) <xref ref-type="bibr" rid="pone.0093827-Huse1">[9]</xref>. Furthermore, the use of a single marker gene to assess diversity is challenging, given the prevalence of horizontal gene transfer and the difficulty inherent in defining bacterial species <xref ref-type="bibr" rid="pone.0093827-McDonald1">[10]</xref>–<xref ref-type="bibr" rid="pone.0093827-RosselloMora1">[12]</xref> as well as the limited resolution of the 16S rRNA gene among closely related species. 
Recently, 16S rRNA gene amplicon sequencing was compared to metagenomic data from synthetic communities <xref ref-type="bibr" rid="pone.0093827-Shakya1">[13]</xref>, but to our knowledge, there has been no systematic evaluation of high-throughput 16S rRNA gene sequencing involving multiple sequencing and PCR replicates from natural microbial communities. Here, we coupled detailed analyses of replicate 16S rRNA gene datasets to comparisons with companion community shotgun metagenomics data from the same samples.</p>
<p>Metagenome approaches are commonly used to describe microbial communities in different systems, e.g., <xref ref-type="bibr" rid="pone.0093827-Burke1">[14]</xref>–<xref ref-type="bibr" rid="pone.0093827-RodriguezBrito1">[16]</xref>, without the biases inherent to PCR amplification of a single gene, although it remains a challenge to accurately infer taxonomic origin from metagenomic reads <xref ref-type="bibr" rid="pone.0093827-Bazinet1">[17]</xref>. Whole genome shotgun (WGS) metagenomic approaches provide robust estimates of microbial community composition and diversity without the need to target and amplify a specific gene. However, differences in sequencing platforms, DNA preparation methods, and the complexity of the samples being studied can possibly lead to different or biased observations <xref ref-type="bibr" rid="pone.0093827-Quince1">[6]</xref>, <xref ref-type="bibr" rid="pone.0093827-Aird1">[18]</xref>, <xref ref-type="bibr" rid="pone.0093827-GomezAlvarez1">[19]</xref>. Furthermore, phylogenetic classification of microbes using WGS is seldom coupled to 16S-based classification, and a few recent studies doing so have identified discrepancies between the different classification methods, usually with regard to the level of resolution obtained <xref ref-type="bibr" rid="pone.0093827-Shah1">[20]</xref>, <xref ref-type="bibr" rid="pone.0093827-Steven1">[21]</xref>.</p>
<p>Here, we focused on evaluating the bacterioplankton composition and short-term variability in an important, temperate freshwater lake in the Southeast USA, Lake Lanier. Lake Lanier is the source of drinking water for metropolitan Atlanta and is a popular recreational area, especially during the summer months. Freshwater microbial communities have been shown to change over time in many different systems <xref ref-type="bibr" rid="pone.0093827-Portillo1">[22]</xref>–<xref ref-type="bibr" rid="pone.0093827-Eiler1">[25]</xref>, influenced by a variety of environmental factors such as pH, temperature, and water retention time <xref ref-type="bibr" rid="pone.0093827-Lindstrom1">[26]</xref>–<xref ref-type="bibr" rid="pone.0093827-Methe1">[28]</xref>, but little is known about microbial temporal dynamics or responses to natural perturbations such as strong storm events in southern temperate lakes such as Lake Lanier. Understanding the microbial community composition, variation, and metabolic potential of Lake Lanier will help discern the sensitivity and responsiveness of this community to potential perturbations as well as address the gap of knowledge of freshwater lake communities. We examined the microbial community with 16S rRNA gene and metagenomic sequencing while assessing the reproducibility and potential biases of the 16S-based approach by comparing multiple PCR (i.e., same template DNA with independent 16S rDNA amplifications) and sequencing (i.e., same DNA sequenced independently) replicate datasets from four different timepoints separated by two different potential perturbations: a summer storm event and the beginning of the fall turnover. 
We further compared this 16S-based information to that from functional genes and 16S rRNA gene fragments recovered in companion metagenomic datasets to determine the extent to which an amplicon approach influences our ecological inferences and to evaluate the strengths and limitations of these common community characterization approaches. In addition to providing information about the technical variability of the 16S rRNA gene amplicon approach, we also gained new insights into the microbial ecology of the system, specifically about how certain physicochemical changes might influence bacterioplankton communities as well as how community composition changes over time. This work is also part of a larger, long-term effort to characterize the microbial community of Lake Lanier <xref ref-type="bibr" rid="pone.0093827-Oh1">[29]</xref>.</p>
</sec><sec id="s2" sec-type="methods">
<title>Methods</title>
<sec id="s2a">
<title>Sample Description</title>
<p>Lake Lanier is a seasonally stratified lake situated about 80 km northeast of Atlanta, GA at the headwaters of the Apalachicola-Chattahoochee-Flint River basin. When full, the reservoir covers nearly 156 km<sup>2</sup> and holds approximately 2.4×10<sup>9</sup> m<sup>3</sup> of water. It is used for drinking water, hydroelectric power generation, flood control, run-off management, and recreation. Samples were collected from below the Browns Bridge at Lake Lanier (34°N 15′ 43″, 83°W 57′ 7″) at four time points in 2009: three centered around an August 27 storm event (August 26, AUG1; August 28, AUG2; and September 7, SEPT) and one during the fall mixing event in November (November 8, NOV). No specific permissions were required for this sampling location, nor did our field study involve endangered or protected species. At each sampling point, a Water Quality Meter (Horiba) was used to measure water temperature, pH, conductivity, turbidity, dissolved oxygen, and total dissolved solids (Table S1 in <xref ref-type="supplementary-material" rid="pone.0093827.s001">File S1</xref>, Fig. S1 in <xref ref-type="supplementary-material" rid="pone.0093827.s001">File S1</xref>). A horizontal sampler (Wildco Instruments) was used to collect samples of planktonic microbial communities at 5 m, within the epilimnion, which is fairly uniform in temperature and fully oxygenated during summer stratification. Metagenomes from these same samples were analyzed previously <xref ref-type="bibr" rid="pone.0093827-Oh1">[29]</xref>.</p>
</sec><sec id="s2b">
<title>DNA Extraction</title>
<p>A total of 10 L of water was pre-filtered through ∼1.6 μm GF/A filters (Whatman) and cells were collected on 0.22 μm Sterivex filters (Millipore) using a peristaltic pump. Sterivex filters were stored at −80°C until DNA extraction. DNA was extracted as described in <xref ref-type="bibr" rid="pone.0093827-Oh1">[29]</xref>. Briefly, filters were treated with lysis buffer (50 mM Tris-HCl, 40 mM EDTA, and 0.75 M sucrose) and incubated with 1 mg/ml lysozyme at 37°C for 30 min. Samples were subsequently incubated with 1% SDS, 10 mg/ml proteinase K, and 150 mg/ml RNAse for 2 h rotating at 55°C. DNA was extracted from the lysate with phenol and chloroform, precipitated with ethanol and eluted in TE buffer. DNA yield was about 1.5 μg per liter of water filtered. For the metagenome, ∼5 μg of the total DNA aliquot was sequenced using the Illumina GA-II sequencers at the Emory University Genomics Facility, providing paired-end reads with an average length of 100 bp (Table S4 in <xref ref-type="supplementary-material" rid="pone.0093827.s001">File S1</xref>). 16S rRNA gene amplicon pyrosequencing (see below) was run on the GS-FLX 454 Titanium platform, also at the Emory University Genomics Facility.</p>
</sec><sec id="s2c">
<title>16S Amplicon Library Preparation and Sequencing</title>
<p>Lake Lanier 16S rRNA gene amplicons were PCR-amplified from the same community DNA samples sequenced for metagenomic analysis using barcoded primers for the V1–V3 regions (Table S2 in <xref ref-type="supplementary-material" rid="pone.0093827.s001">File S1</xref>). Each 20 μl PCR mixture was comprised of 0.15 μl AccuPrime Taq DNA Polymerase High Fidelity (Invitrogen), 2 μl 10X AccuPrime PCR Buffer II, 13.85 μl nuclease-free water, 1 μl of 2 mM “B” adaptor-labeled 27F primer, 1 μl of 2 mM “A” adaptor-labeled and barcoded 534R primer, and 2 μl undiluted template DNA. PCR conditions consisted of 2 min incubation at 95°C followed by 25 cycles of 95°C, 20 sec; 50°C, 30 sec; and 72°C, 5 min. Three independent PCRs were carried out for each primer pair listed in Table S2 in <xref ref-type="supplementary-material" rid="pone.0093827.s001">File S1</xref>, the products of which were pooled for each sample. To further assess reproducibility and potential technical artifacts, we sequenced two separate amplicon pools from AUG1 (A and B) and three from NOV (A, B, and C; Table S3 in <xref ref-type="supplementary-material" rid="pone.0093827.s001">File S1</xref>). As an additional control sample, a mixture of DNA from four organisms grown in pure culture: <italic>Escherichia coli</italic> strain H1-sample ANK, <italic>E. coli</italic> str. K-12 substr. DH10B, and two environmental isolates: an <italic>Enterococcus</italic> sp. and a <italic>Shewanella</italic> sp., was also subjected to 16S amplification and sequenced together with the Lake samples. PCR products were cleaned using Agencourt AMPure beads (Beckman Genomics). All seven samples were then pooled according to the Roche protocol into a mixture containing a final concentration of ∼10<sup>7</sup> molecules/μl from each sample. 
The pooled amplicons were sequenced in duplicate (i.e., two halves of a plate) on the GS-FLX 454 Titanium instrument providing an average read length of 333.2 bp (Table S3 in <xref ref-type="supplementary-material" rid="pone.0093827.s001">File S1</xref>).</p>
</sec><sec id="s2d">
<title>16S rRNA Gene Sequence Analysis</title>
<p>Each sample was separated from the run based on its barcode sequence using the Splitkeys.pl script from the AmpliconNoise package, version 1.2. The reads of each sample were then independently denoised to reduce sequencing and PCR single base substitutions and then chimera-checked using the PyroNoiseM + SeqNoise and Perseus shell scripts, respectively, in the AmpliconNoise package <xref ref-type="bibr" rid="pone.0093827-Quince1">[6]</xref>, <xref ref-type="bibr" rid="pone.0093827-Quince2">[7]</xref>. A denoising shell script included a filter requiring a minimum flowgram length of 360 bp (including key and primer). To reintegrate all the samples for downstream comparisons, a combined fasta file of the denoised, chimera-checked sequences was created and the AmpliconNoise Qiime.pl script was used to make both a 3% and 1% OTU mapping file (i.e., OTUs were picked at both 97% and 99% identity). The QIIME software package, version 1.2.0 <xref ref-type="bibr" rid="pone.0093827-Caporaso1">[30]</xref> was then used for 16S rRNA analysis, skipping OTU construction and beginning with the split_libraries.py (with -l 50 -H 50) and pick_rep_set.py scripts using the pre-processed sequences. For many analyses, a subset of sequences obtained by randomly subsampling each dataset to the same depth (that of the smallest dataset) was used. OTUs that were identified in only one of the 14 datasets or that occurred as singletons were excluded from the analysis. Within QIIME, taxonomy was assigned with the RDP classifier based on a July 2011 version of the Greengenes reference OTU database <xref ref-type="bibr" rid="pone.0093827-DeSantis1">[31]</xref> with the addition of a freshwater sequence database and taxonomy framework described in <xref ref-type="bibr" rid="pone.0093827-Newton1">[32]</xref>.</p>
</sec><sec id="s2e">
<title>Assembly and Phylogenetic Assignment of Metagenomic Reads</title>
<p>Metagenomic sequences from the same four timepoints were analyzed by creating a combined assembly from all four datasets after filtering the data for quality based on the Phred average per sliding window with Q≥20 and not allowing any N’s. The reads were assembled into contigs as described previously (<xref ref-type="bibr" rid="pone.0093827-Oh1">[29]</xref>; Table S4 in <xref ref-type="supplementary-material" rid="pone.0093827.s001">File S1</xref>) using SOAPdenovo <xref ref-type="bibr" rid="pone.0093827-Li1">[33]</xref> and Velvet <xref ref-type="bibr" rid="pone.0093827-Zerbino1">[34]</xref> for pre-assembly, followed by assembly into longer contigs with Newbler 2.0. This hybrid protocol provided significantly longer contigs, with accuracy comparable with or higher than that of the contigs of Velvet or SOAPdenovo <xref ref-type="bibr" rid="pone.0093827-Luo1">[35]</xref>. The resulting contigs were annotated using MetaGeneMark <xref ref-type="bibr" rid="pone.0093827-Zhu1">[36]</xref>. The predicted genes were subsequently searched against a database of all sequenced bacterial and archaeal genomes and their best match was used to infer the phylogenetic origin of contig sequences using the MyTaxa scheme developed in our lab (<xref ref-type="bibr" rid="pone.0093827-Luo2">[37]</xref>; <ext-link ext-link-type="uri" xlink:href="http://enve-omics.ce.gatech.edu/mytaxa/" xlink:type="simple">http://enve-omics.ce.gatech.edu/mytaxa/</ext-link>).</p>
<sec id="s2e1">
<title>Nucleotide sequence accession numbers</title>
<p>16S datasets from the Lake Lanier samples were deposited in the Sequence Read Archive under the same projects as the previously submitted WGS datasets <xref ref-type="bibr" rid="pone.0093827-Oh1">[29]</xref>: AUG1 (SRA029309.1), AUG2 (SRA029314.1), SEPT (SRA029315.1), and NOV (SRA029316.1).</p>
</sec></sec></sec><sec id="s3">
<title>Results</title>
<sec id="s3a">
<title>16S rRNA Gene Amplicon Sequencing Reproducibility</title>
<p>We used the control mixture made up of 16S rRNA gene sequences from four organisms grown in isolation in the laboratory, to validate the denoising parameters and efficacy of OTU recovery and taxonomic assignments of amplicon sequencing. Following denoising and taxonomic binning of the sequences in this sample, four major (&gt;1% of total sequences) 97% OTUs were identified in each of the two lane runs. The OTUs were identified using RDP taxonomy within QIIME at the order level as members of the <italic>Enterobacteriales</italic>, corresponding to the two <italic>E. coli</italic> strains of four control organisms used and accounting for about 50% of the reads, <italic>Lactobacillales</italic>, corresponding to the <italic>Enterococcus</italic> isolate used and accounting for about 20% of total, and <italic>Alteromonadales</italic>, corresponding to the <italic>Shewanella</italic> isolate and accounting for about 20% of the total. Thirteen additional OTUs with either singletons or few representative sequences (&lt;0.1% of the total sequences) were also identified, but were likely the result of sequencing errors due to their low abundance and poor matches to the known, control sequences. These OTUs had taxonomic affiliations that matched the known control sequences at the phylum level, but most (9 of 13) could not be taxonomically assigned beyond that. Furthermore, the highly populated OTUs were the same between the two runs of the same sample, whereas the OTUs with a small number of sequences were not. We therefore determined that a reasonable filter would exclude OTUs with fewer than ten reads that were not found in both sequencing runs from the same sample, i.e., in both lanes 1 and 2. This filter, similar to what is used by others (e.g., <xref ref-type="bibr" rid="pone.0093827-Caporaso2">[38]</xref>), was subsequently applied to our lake 16S rRNA gene datasets. Singletons were not removed for comparison with metagenomic sequences (see below).</p>
<p>The 14 datasets acquired from four temporally-distinct sampling events were processed using the standard QIIME protocol to bin reads into OTUs and then sub-sample each dataset to an even depth of 17,821 sequences, i.e., the number of sequences in the smallest dataset, in order to account for heterogeneity in the sequencing effort (Table S3 in <xref ref-type="supplementary-material" rid="pone.0093827.s001">File S1</xref>). As expected, slightly more OTUs were identified at the 99% level than the 97% level, but many of the additional 99% OTUs occurred as singletons (Fig. S2 in <xref ref-type="supplementary-material" rid="pone.0093827.s001">File S1</xref>). Each sample had ∼500 different OTUs at the 97% level and a total of 4,684 OTUs were identified. Only slight differences were detected in the numbers of OTUs recovered in independently sequenced datasets of the same DNA (Lane 1 vs. 2; e.g., 571 and 520 OTUs for AUG1-1 and AUG1-2, respectively) or PCR replicates of the same water sample (replicates A and B, e.g., 545 and 487 OTUs for AUG1 A and AUG1 B, respectively), with the exception of NOV C which had notably fewer OTUs than NOV A-B (364 vs. 706 OTUs, respectively). Prior to the application of the aforementioned singleton filter, most (∼75%) of the OTUs were represented by only one sequence or were present in only one dataset, indicating that 16S-based sequencing approaches can overestimate OTU diversity within a taxonomic group in a sample and/or capture different members of the rare fraction. Excluding these OTUs resulted in a total of 1,067 OTUs present in at least one of the four samples and ∼250 OTUs specific to each dataset. Only ∼2% of the OTUs were present in all 14 datasets and ∼6% were found in all four timepoints, but these OTUs comprised ∼30% of the total reads.</p>
<p>Accordingly, observed species richness varied between samples. Rarefaction curves showed some of this variation among replicate samples (same DNA, independent PCR amplifications), particularly between NOV A/B (most diverse) and NOV C (least diverse) (<xref ref-type="fig" rid="pone-0093827-g001">Fig. 1A</xref>). The discrepancy in estimated diversity levels between the three November samples was surprising, given that the starting DNA for all three samples was the same. Nevertheless, the three NOV replicates were not significantly different from each other in terms of OTU composition, as evaluated by one-way ANOSIM <xref ref-type="bibr" rid="pone.0093827-Clarke1">[39]</xref>. All datasets shared more than half of their OTUs with both their corresponding technical sequencing replicate (i.e., lane 1 and lane 2) and their corresponding PCR replicate (e.g., A vs. B). Furthermore, when the datasets were filtered to remove singletons, the three NOV samples were highly similar to each other in terms of OTU composition relative to the samples from the other three timepoints (Fig. S3 in <xref ref-type="supplementary-material" rid="pone.0093827.s001">File S1</xref>). Good’s nonparametric coverage estimator <xref ref-type="bibr" rid="pone.0093827-Good1">[40]</xref> was similar among NOV A/B (98.2 and 98.5, respectively) and slightly higher for NOV C (99.2). Because the original, non-rarefied NOV C datasets contained the fewest sequenced reads of all the 14 datasets (Table S3 in <xref ref-type="supplementary-material" rid="pone.0093827.s001">File S1</xref>), the difference between NOV C and NOV A/B could be related to the sizes of the original datasets (Table S3 in <xref ref-type="supplementary-material" rid="pone.0093827.s001">File S1</xref>), and the number of singletons captured in the datasets (resulting from sequencing or PCR amplification artifacts) as opposed to the presence of entirely different OTUs.</p>
<fig id="pone-0093827-g001" position="float"><object-id pub-id-type="doi">10.1371/journal.pone.0093827.g001</object-id><label>Figure 1</label><caption>
<title>Diversity estimates for the four Lake Lanier timepoints.</title>
<p>A) Alpha diversity based on observed species (97% OTUs) from 16S amplicons for each of the nine samples. Error bars represent the variation observed among duplicate sequencing runs. B) Redundancy curves of the metagenomes of the four timepoints (see Methods for details). The curves show that NOV is a more diverse sample, e.g., with the same sequencing effort it results in a lower coverage.</p>
</caption><graphic mimetype="image" xlink:href="info:doi/10.1371/journal.pone.0093827.g001" position="float" xlink:type="simple"/></fig>
<p>There was no significant difference (G test of independence) in the presence/absence of OTUs at the 97% level between either the sequencing replicates or the seven datasets representing the various replicates from the four timepoints. However, there was distinct partitioning of OTUs between samples in terms of relative abundance of shared OTUs, with few differences between sequencing replicates (Fig. S3 in <xref ref-type="supplementary-material" rid="pone.0093827.s001">File S1</xref>). Additionally, OTU composition of AUG1, AUG2, and SEPT clustered uniquely from the NOV samples (Fig. S3 in <xref ref-type="supplementary-material" rid="pone.0093827.s001">File S1</xref>). This was verified when biological replicates were combined and the four timepoints were compared, revealing that the NOV OTU composition, phylogeny (evaluated with weighted UniFrac distance), and abundance were significantly different from the other three timepoints (One-way ANOSIM, p&lt;0.01). In general, abundant taxa were common between the four timepoints.</p>
</sec><sec id="s3b">
<title>16S rRNA Gene-based Community Composition, Diversity, and Dynamics between Four Timepoints</title>
<p>Most major bacterial phyla were present in Lake Lanier and there was a high representation of common freshwater taxa <xref ref-type="bibr" rid="pone.0093827-Newton1">[32]</xref> such as <italic>Actinobacteria</italic>, <italic>Cyanobacteria</italic>, <italic>Verrucomicrobia</italic> and <italic>Proteobacteria</italic> (particularly <italic>Betaproteobacteria</italic>). In fact, <italic>Proteobacteria</italic> and <italic>Actinobacteria</italic> were the most frequently observed, with nearly 20–40% of the total sequences identified as members of these phyla at each timepoint (<xref ref-type="fig" rid="pone-0093827-g002">Fig. 2</xref>, top). About 10% of the OTUs from all lake datasets matched previously sequenced organisms with high sequence identity (&gt;95%), e.g., <italic>Synechococcus sp.</italic> and <italic>Polynucleobacter necessarius</italic>, a betaproteobacterium frequently detected in freshwater <xref ref-type="bibr" rid="pone.0093827-Hahn1">[41]</xref>. More divergent sequences (e.g., 80–85% sequence identity) were also observed, indicative of uncharacterized taxa more distantly related to well-characterized lineages, although it is also possible that some of these divergent sequences could arise from sequencing errors (see below). Nearly 35% of the OTUs were highly (&gt;95% identity) similar to known freshwater 16S rRNA sequences, including 118 OTUs with reads 100% identical to freshwater tribes (a taxonomic level below clade defined in <xref ref-type="bibr" rid="pone.0093827-Newton1">[32]</xref>) belonging to <italic>Actinobacteria, Alpha-, Beta- and Gamma-proteobacteria, Bacteroidetes,</italic> and <italic>Verrucomicrobia</italic>.</p>
<fig id="pone-0093827-g002" position="float"><object-id pub-id-type="doi">10.1371/journal.pone.0093827.g002</object-id><label>Figure 2</label><caption>
<title>Community composition shifts over time as revealed by 16S data.</title>
<p>Taxonomic binning of 16S amplicon sequences for each of the 14 individual datasets at the phylum (top) and genus (middle) levels were based on the July 2011 version of the Greengenes database <xref ref-type="bibr" rid="pone.0093827-DeSantis1">[31]</xref>. Freshwater lineages (bottom) were based on a freshwater database according to the taxonomy framework described in Newton et al., 2011. Datasets are ordered left to right by date, technical sequencing replicate (lane 1 and lane 2), and DNA replicate (A, B and C). Taxa identified as major drivers of the differences between timepoints (SIMPER analysis) are labeled (see figure key).</p>
</caption><graphic mimetype="image" xlink:href="info:doi/10.1371/journal.pone.0093827.g002" position="float" xlink:type="simple"/></fig>
<p>The OTUs in each of the combined datasets from the four timepoints were binned into phyla, genera, and described freshwater lineages to better characterize the temporal shifts in a taxonomic context. Of 17,821 sequences in each library, ∼90% could be assigned to a known phylum and between 32–47%, depending on the dataset, to a known genus in the Greengenes database. In addition to the differences in the 97% OTU composition noted above, the NOV sample was significantly different from the others in terms of phyla, genera, and clade (ANOSIM with Bray-Curtis metric, p&lt;0.01; <xref ref-type="fig" rid="pone-0093827-g002">Fig. 2</xref>). The differences, however, were due more to variations in relative abundances of specific phyla or genera than to differences in the presence or absence of taxonomic groups at these levels (as assessed by the G-test of independence), although phylogenetic differences were found at a finer-scale resolution (as assessed by UPGMA analysis and tribe-level comparisons). Thus, the same major phyla and genera were typically found in all four timepoints, but the abundances of these groups varied, as did individuals comprising these groups. Similarity Percentage (SIMPER) analysis <xref ref-type="bibr" rid="pone.0093827-Clarke1">[39]</xref> identified specific taxa as primary drivers of the differences between samples (<xref ref-type="fig" rid="pone-0093827-g002">Fig. 2</xref>). Much of the difference (6%) between AUG1 and NOV was attributed to OTUs that could not be classified at the phylum level (“Other Bacteria” in <xref ref-type="fig" rid="pone-0093827-g002">Fig. 2</xref>). Generally, NOV had a lower relative abundance of <italic>Verrucomicrobia</italic> and a higher relative abundance of <italic>Bacteroidetes</italic> compared to the first three samples. <italic>Cyanobacteria</italic> abundance increased following the storm event (AUG2) but returned to AUG1 levels (∼8% of the total phyla) in NOV.</p>
<p>While variation at the genus level was more difficult to assess due to the challenge of assigning genera with high confidence, we were able to identify a number of known genera and their freshwater taxonomic affiliations (based on the lineages described in <xref ref-type="bibr" rid="pone.0093827-Newton1">[32]</xref>) with significantly different relative abundances between the four timepoints (<xref ref-type="fig" rid="pone-0093827-g002">Fig. 2</xref>). For example, <italic>Thiomonas</italic> comprised 16–23% of the genera in AUG1–SEPT, but less than 5% of the genera in NOV. <italic>Pelagibacter</italic> increased in relative abundance from ∼6% in AUG1–SEPT to ∼16% in NOV. This genus corresponded to LD12 tribe (alfV-A) <xref ref-type="bibr" rid="pone.0093827-Newton1">[32]</xref>, the freshwater sibling to the marine SAR11 group (<xref ref-type="fig" rid="pone-0093827-g002">Fig. 2</xref>, bottom), which also increased in abundance in NOV. Other genera, such as <italic>Prochlorococcus</italic>-like sequences, varied between the four timepoints; these sequences were most abundant in AUG2 (15%) following the strong summer storm and least abundant in AUG1 (8%). Interestingly, <italic>Prochlorococcus</italic> is a ubiquitous marine organism <xref ref-type="bibr" rid="pone.0093827-Partensky1">[42]</xref>, but <italic>Prochlorococcus</italic>-like organisms have seldom been identified in freshwater systems <xref ref-type="bibr" rid="pone.0093827-Corzo1">[43]</xref>, <xref ref-type="bibr" rid="pone.0093827-Stenuite1">[44]</xref>. We suspect, however, that these sequences were misclassified when using the RDP taxonomy, as evidenced by the high representation of <italic>Synechococcus</italic> among both the 16S rRNA gene amplicons re-analyzed using NCBI taxonomy and the metagenome contigs in all four timepoints (see below), as well as the known abundance of <italic>Synechococcus</italic> in freshwater lakes <xref ref-type="bibr" rid="pone.0093827-Newton1">[32]</xref>. 
These <italic>Prochlorococcus</italic>-like sequences were also assigned to the <italic>Cyanothece</italic> related freshwater CyanI-A1. This illustrates one of the difficulties in using 16S rRNA gene sequences to examine populations at the genus level or lower.</p>
<p>Among the <italic>Actinomycetales</italic> that could not be assigned to a known genus, we examined the freshwater lineages that they associated with. The acI lineage <xref ref-type="bibr" rid="pone.0093827-Newton1">[32]</xref> dominated all four sampling points, typically representing 20–30% of the identified lineages. Among the tribes affiliated with this lineage, acI-A6 and acI-C2 dominated all samples, but showed different abundance profiles: acI-A6 was roughly stable over time, accounting for 15–20% of the identified lineages while acI-C2 peaked after the storm at AUG2 to about twice the levels seen at the other timepoints. Other acI tribes such as acI-B1 were more abundant in the NOV sample and acI-A1 was most abundant in AUG1. The second most abundant <italic>Actinobacteria</italic> lineage, acIV, also showed variation in the abundance profiles of the associated clades, with some increasing in abundance in AUG2 and NOV (acIV-A), and others being nearly absent in AUG1–SEPT but peaking in NOV (acIV-B and acIV-C). Overall, substantial variation was seen among individual clades and tribes comprising the identified lineages. Because there are so few defined lake species and genera, these phylogenetic classifications cannot be gleaned from the genus-level assignments and individual OTUs do not always provide detailed taxonomic information. Thus, comparisons to well-described, relevant 16S rRNA gene databases, such as the freshwater database used here, are useful when available.</p>
</sec><sec id="s3c">
<title>Comparisons to Corresponding Metagenomes</title>
<p>We compared the 16S rRNA gene findings to those from companion metagenomes, first by estimating the diversity of each metagenomic dataset using a new method developed in our group (<xref ref-type="bibr" rid="pone.0093827-RodriguezR1">[45]</xref>; <ext-link ext-link-type="uri" xlink:href="http://enve-omics.ce.gatech.edu/nonpareil/" xlink:type="simple">http://enve-omics.ce.gatech.edu/nonpareil/</ext-link>) that determines the relative complexity of a metagenomic dataset using the extent of redundancy of its reads. From these estimates, the AUG1, AUG2 and SEPT assembled contig sequences had on average 2–5X coverage, while the NOV coverage was ∼0.5X and required significantly higher sequencing effort in order to achieve nearly complete community coverage (<xref ref-type="fig" rid="pone-0093827-g001">Fig. 1B</xref>). These findings agreed well with our 16S rRNA gene observations of increased diversity in sample NOV A relative to the other timepoints and different from NOV B and C (<xref ref-type="fig" rid="pone-0093827-g001">Fig. 1A</xref>). Thus, the metagenomic analysis indicated that the NOV A 16S datasets were likely the most representative of the three NOV replicates.</p>
<p>A combined assembly from the four metagenomic datasets was then used to obtain reference contigs, representing distinct populations, and follow their abundance over time. Unlike the 16S amplicon-based OTUs, more than 90% of which were unique to one or more timepoints, 79% of the 217,149 contigs longer than 500 bp were detected at all four timepoints. Despite the differences in estimated diversity between the four metagenomic samples (read redundancy, <xref ref-type="fig" rid="pone-0093827-g001">Fig. 1B</xref>), the differences in terms of the composition and abundance of different contigs were not significant (ANOSIM with Bray-Curtis metric, p&lt;0.01). These findings indicated that, unlike individual reads (read redundancy), which can represent low-abundance in addition to high-abundance community members, long contigs, which typically represent abundant community members, were found with roughly similar coverage levels in the four timepoints. Additional diversity that may have been present among shorter contigs in the metagenome (&lt;500 bp) was not assessed but likely differed between the samples, similar to the read data above.</p>
<p>The organisms identified from 16S rRNA gene sequencing were compared to those identified from the metagenomes. The OTUs in each amplicon dataset were reanalyzed using NCBI taxonomy both with and without singleton and other sequence-removal filters (which reduced the number of identified OTUs by ∼10%) for consistency between the 16S and whole-genome analyses. To determine the taxonomic origin of short-read metagenomic sequences, we used MyTaxa, an advanced taxonomic classifier developed in our group that combines homology- and phylogenetic-based approaches to assign putative taxonomic origin to assembled contigs <xref ref-type="bibr" rid="pone.0093827-Luo2">[37]</xref>. Contig sequencing depth (reads/length) was used as a proxy for taxon abundance. With this approach, 1.5 times and ∼10 times as many phyla and genera, respectively, were identified within the metagenomic contigs as within the 16S amplicons (based on OTUs found in the database), regardless of whether or not the singleton filter was applied to the amplicon sequences. Chao1 diversity estimates based on phylum- and genus-level assignments were therefore different between the metagenomic and 16S amplicon datasets (<xref ref-type="fig" rid="pone-0093827-g003">Fig. 3</xref>).</p>
<fig id="pone-0093827-g003" position="float"><object-id pub-id-type="doi">10.1371/journal.pone.0093827.g003</object-id><label>Figure 3</label><caption>
<title>Sequence diversity of the samples used in this study.</title>
<p>Chao1 diversity estimates of datasets based on phylum (A) and genus (B) level taxonomic classification are shown for all four metagenomic timepoints and seven selected 16S amplicon datasets.</p>
</caption><graphic mimetype="image" xlink:href="info:doi/10.1371/journal.pone.0093827.g003" position="float" xlink:type="simple"/></fig>
<p>The taxonomic composition of each 16S rRNA gene library was generally similar to its corresponding metagenome at the phylum level, although some phyla were more represented in the metagenome analysis than the 16S amplicon analysis, including <italic>Firmicutes</italic> and <italic>Planctomycetes</italic>, while others such as <italic>Cyanobacteria</italic> were more abundant among the 16S rRNA gene amplicons (Fig. S4 in <xref ref-type="supplementary-material" rid="pone.0093827.s001">File S1</xref>). A few phyla were only found in the metagenomic contigs, albeit in low abundances (&lt;0.2% of the total number of phylum-assigned contigs), and included the <italic>Dictyoglomi, Fusobacteria, Synergistetes,</italic> and <italic>Deinococcus-Thermus</italic>. At the genus level, however, there was a large amount of variation between the metagenomic contigs and the 16S rRNA sequences. Some genera showed similar trends and relative abundances over time (e.g., <italic>Legionella</italic>; <xref ref-type="fig" rid="pone-0093827-g004">Fig. 4</xref>) while others showed substantial differences (e.g., <italic>Burkholderia</italic> and <italic>Synechococcus</italic>; <xref ref-type="fig" rid="pone-0093827-g004">Fig. 4</xref>). <italic>Thiomonas</italic> accounted for ∼45% of the 16S amplicons identified at the genus level in AUG1 (and 23% of all OTUs using RDP taxonomy, <xref ref-type="fig" rid="pone-0093827-g002">Fig. 2</xref>), but only ∼0.3% of the metagenome contigs identified at that level. Although the amplicon approach appears to overestimate the abundance of this group (see below), the high abundance of this genus is probably not wholly a PCR artifact, as almost 10% of the partial 16S rRNA gene sequences recovered in the metagenome (see below) were 100% identical to the 16S rRNA gene amplicon sequences assigned to <italic>Thiomonas</italic>. 
Part of the discrepancy between the contig and 16S rRNA gene amplicon assignments could instead be due to the fact that there were only two complete <italic>Thiomonas</italic> reference genomes in the database but 243 distinct <italic>Thiomonas</italic> OTUs in the Greengenes OTU database at the time of analysis.</p>
<fig id="pone-0093827-g004" position="float"><object-id pub-id-type="doi">10.1371/journal.pone.0093827.g004</object-id><label>Figure 4</label><caption>
<title>Individual genera abundance shifts over time based on 16S and metagenomes.</title>
<p>Genus-level taxonomic trends for a subset of genera identified within the metagenomic contigs (A) and 16S rRNA amplicon (B) datasets, based on NCBI taxonomy, are shown. The lines represent the general temporal trends of two genera, <italic>Synechococcus</italic> and <italic>Legionella</italic>, in each dataset.</p>
</caption><graphic mimetype="image" xlink:href="info:doi/10.1371/journal.pone.0093827.g004" position="float" xlink:type="simple"/></fig>
<p>As noted above, the genus level may frequently mask important levels of intra-genus population differentiation and heterogeneity, which typically remain inaccessible to short-read, 16S rRNA gene-based analyses that target a single variable region of the 16S rRNA gene <xref ref-type="bibr" rid="pone.0093827-Acinas1">[46]</xref>, <xref ref-type="bibr" rid="pone.0093827-Konstantinidis2">[47]</xref>. This was evident following a more detailed investigation of three different genera, <italic>Synechococcus, Burkholderia,</italic> and <italic>Legionella,</italic> whose relative abundance profiles over time varied between the 16S rRNA gene amplicons and the metagenome. Each of these genera was represented in the 16S amplicon data by several different OTUs (<italic>Synechococcus,</italic> 80; <italic>Burkholderia,</italic> 18; and <italic>Legionella,</italic> 56) and hundreds to thousands of different contigs in the metagenomic datasets. The contigs assigned to each genus with our MyTaxa algorithm were clustered using the Pearson correlation metric in order to collapse the contigs into populations with similar abundance profiles over the four timepoints, likely representing similar populations <xref ref-type="bibr" rid="pone.0093827-Strous1">[48]</xref>. Often, the two methods were congruent, but this analysis revealed variations not captured when the data were assessed at the genus level. For example, <italic>Synechococcus</italic> was dominated by a single 16S rRNA gene OTU for the first three timepoints, which was replaced by two different OTUs in the NOV sample that were either undetected or present in low quantities at earlier timepoints, keeping the total abundance of <italic>Synechococcus</italic> in the four samples relatively constant (Fig. S5 in <xref ref-type="supplementary-material" rid="pone.0093827.s001">File S1</xref>). 
Although similar trends were observed among the metagenome contigs, the contigs that increased in abundance in the NOV sample relative to the other three were present at such low levels that the overall percentage of <italic>Synechococcus</italic> in the NOV sample was low, making the overall patterns observed for this genus different between the two methods. It should also be noted that, in contrast to <italic>Thiomonas</italic>, there are many <italic>Synechococcus</italic> reference genomes. Populations (metagenomes) or OTUs (16S rRNA gene data) within the other two genera examined generally displayed a similar trend as well, i.e., several abundant taxa were observed in the AUG1 to SEPT samples that were apparently replaced by other taxa in NOV (Fig. S5 in <xref ref-type="supplementary-material" rid="pone.0093827.s001">File S1</xref>). Overall, the metagenomic contigs and the 16S rRNA gene sequence data generally agreed with each other, but the relative abundances of the individual taxa within the genera contributed to seemingly large differences.</p>
<p>We also compared partial 16S sequences recovered in a shotgun 454 metagenome generated from the AUG1 sample <xref ref-type="bibr" rid="pone.0093827-Oh1">[29]</xref> to the PCR-based identification of 16S rRNA gene amplicon sequences. Among the 558 partial 16S sequences captured in the AUG1 454 metagenome, there were 302 different OTUs, approximately half as many as in the PCR-based dataset, which had more than 30,000 individual 16S rRNA gene amplicon sequences (Fig. S2 in <xref ref-type="supplementary-material" rid="pone.0093827.s001">File S1</xref>). However, subsampling the 16S rRNA gene amplicon sequences to the same depth as the 16S rRNA gene reads from the metagenome, i.e., 558, yielded only about 80 different OTUs in each 16S rDNA amplicon dataset, indicating that the metagenome provided more information on community composition at the per-read level, but the number of reads obtained from the 16S rDNA amplicon sequencing approach offset this inequality. Some phyla such as TM7 were captured in the PCR-based datasets, albeit in low abundance (&lt;0.1%), but were not found among the shotgun-derived 16S sequences, probably because of the lower number of sequences, while others such as <italic>Chlamydiae</italic> were only found within the shotgun 16S rRNA gene sequences, perhaps because of primer/PCR biases in the amplicon approach. The relative number of OTUs attributed to <italic>Actinobacteria</italic> and <italic>Verrucomicrobia</italic> was higher among the shotgun sequences than the PCR-based sequences and corresponded well with the lineages identified from comparison to the freshwater 16S database (above), indicating that the shotgun library is sometimes able to capture more taxonomic diversity than 16S amplicons. Our observations corroborate those seen by others that the 16S rRNA gene sequences derived from metagenomic datasets vs. 
PCR amplification are roughly similar at broad taxonomic classifications (e.g., <xref ref-type="bibr" rid="pone.0093827-Kalyuzhnaya1">[49]</xref>), but that the number of OTUs identified by 16S rRNA gene sequencing is larger simply by virtue of the number of sequences obtained and that shotgun approaches capture greater diversity due to the lack of PCR primer specificity <xref ref-type="bibr" rid="pone.0093827-Sharpton1">[50]</xref>.</p>
<p>Finally, to gain further insight into individual populations, full-length 16S sequences were reconstructed separately from each of the AUG1–SEPT metagenomes <xref ref-type="bibr" rid="pone.0093827-Miller1">[51]</xref> and were compared to the 16S rDNA amplicon OTUs in terms of sequence similarity and abundance patterns over the timepoints. One full-length reconstructed OTU most likely corresponding to 16S amplicon “OTU 2” (represented by sequence GKJT1QE01CC3RV) was identified as a member of the order <italic>Burkholderiales</italic>, had no known close relative at the genus level, and comprised 16–20% of the 16S rRNA genes among the fragments captured in the three metagenomes. This sequence was named “FJ820419” for its closest relative in the Silva 16S database. OTU 2 and FJ820419 were assigned to different families within the <italic>Burkholderiales</italic>: OTU 2 to <italic>Alcaligenaceae</italic> and FJ820419 to <italic>Burkholderiaceae</italic>. Although they both had &gt;98% identity to a known freshwater <italic>Betaproteobacteria</italic> named LakTan18, neither could be assigned to taxa lower than the family level; the closest genus match of OTU 2, with ∼94% identity, was to either <italic>Thiomonas</italic> or other uncultured <italic>Burkholderiales</italic>. In fact, OTU 2 was the biggest contributor to the <italic>Thiomonas</italic> sequences identified among the 16S rDNA amplicon OTUs. Potential biases in the amplification of the 16S rRNA gene and the short length of the 16S amplicon reads as well as the predictive nature of the full-length 16S rRNA gene sequence reconstruction from the metagenomes confounded our ability to accurately link the two methods to a single source organism. Nevertheless, the relative abundances of FJ820419 in the four timepoints gauged by recruitment of reads to the full-length FJ820419 sequence were comparable to the abundances of OTU 2 in each amplicon dataset (e.g., 22% vs. 28%; Fig. 
S6 in <xref ref-type="supplementary-material" rid="pone.0093827.s001">File S1</xref>), providing further evidence that the metagenome and 16S rDNA amplicon sequencing can sometimes identify the same populations, but the taxonomic assignments are not always consistent.</p>
</sec></sec><sec id="s4">
<title>Discussion</title>
<sec id="s4a">
<title>Sequencing Replicates are more Consistent than Sample Preparation Replicates</title>
<p>While investigating temporal dynamics and response to potential disturbances in a freshwater, mesotrophic lake community, we employed numerous methodological and experimental replicates, providing a means to comprehensively evaluate specific limitations of some of the commonly used methods for microbial community characterization. Although denoising and chimera checking can reduce the number of potentially spurious sequences arising from both PCR and sequencing errors <xref ref-type="bibr" rid="pone.0093827-Quince2">[7]</xref>, such processing cannot eliminate all biases, as evidenced by the identification of thirteen different OTUs in a control DNA sample generated from only four different organisms. The filter that we used here, i.e., removing singletons and OTUs present in only one of our replicate datasets, has the disadvantage of confounding our ability to estimate diversity and identify rare members of the community. In agreement with other recent studies <xref ref-type="bibr" rid="pone.0093827-Shakya1">[13]</xref>, <xref ref-type="bibr" rid="pone.0093827-Bokulich1">[52]</xref>, it is clear that the inclusion of “synthetic communities” is highly advantageous for 16S amplicon sequencing in order to determine biases of sequencing runs, optimal filtering, and assess samples properly. Further, the use of replicate samples enabled us to better pinpoint both advantages and limitations of the 16S rDNA amplicon sequencing approach. We observed differences in the number of OTUs and, therefore, the projected diversity, in replicate datasets obtained from the same template DNA but from different pools of PCR amplicons. Because replicate sequencing runs (i.e., lane 1 vs. 
lane 2) were similar and the differences between the NOV triplicates correlated with differences in the read yield and singletons observed in each dataset, it appears that the discrepancies in diversity estimates are likely introduced either at the PCR and library preparation steps or sequencing steps, which are virtually impossible to control even when all libraries are constructed in the same manner. Specifically, among the three NOV samples, the smallest dataset (NOV C) had the fewest number of singletons and the lowest estimated diversity and the resulting biases were not fully eliminated by sub-sampling to an even sequencing depth prior to analysis. It is difficult to discern whether the differences between NOV A/B and NOV C arise from errors at the PCR step or from the lower yield of reads (and whatever underlying cause resulted in fewer reads at the sequencing step), but it is clear that replicate, at least triplicate, biological samples should be prepared for 16S rDNA amplicon sequencing from any sample, even if multiple PCRs are pooled for a single sample. Replicate libraries from each pooled PCR sample should be independently sequenced as well, which is increasingly feasible given the advances and cost effectiveness of new sequencing technologies. Nevertheless, the differences between sample replicates (both lane 1 vs. lane 2 as well as “A, B, and C” PCR replicates) were small relative to the differences between the four timepoints, at least in terms of community composition (e.g., Fig. S3 in <xref ref-type="supplementary-material" rid="pone.0093827.s001">File S1</xref>). Additionally, although differences in diversity estimates between NOV A, B, and C were evident (<xref ref-type="fig" rid="pone-0093827-g001">Fig. 1A</xref>), the NOV samples were clearly more similar to each other in terms of OTU composition and distinct from the AUG and SEPT samples (Fig. S3 in <xref ref-type="supplementary-material" rid="pone.0093827.s001">File S1</xref>). 
Therefore, the types of replicates included in a study should be carefully considered in the context of the comparisons being made as well as the sequencing platform being used <xref ref-type="bibr" rid="pone.0093827-Claesson1">[53]</xref>.</p>
</sec><sec id="s4b">
<title>The 16S rRNA Gene Identifies Broad Levels of Community Composition While Metagenomics Captures a Higher Level of Diversity</title>
<p>The assignment of taxonomic origin to metagenomic sequences continues to be a hurdle and the confidence with which 16S rRNA gene sequences can be assigned to deep taxonomic levels such as genus can be low. Classification of both protein-encoding and 16S sequences is also limited by the databases used for sequence comparisons; although there are several high quality, comprehensive and curated 16S databases compared to genomic databases, they are still limited, as evidenced by the paucity of 16S rRNA gene reads that could confidently be assigned to a genus and the increased resolution obtained by comparison to a relevant, well-curated freshwater database. Many databases are biased in their compositions; e.g., ∼30% of the Greengenes database are <italic>Proteobacteria,</italic> which comprise ∼5% of the database of complete microbial genomes used to assign taxonomic affiliations to metagenomic contigs. We showed that when the genome database is limited, the metagenome data can miss taxa due to sequences being unassigned, while in cases where there are ample reference genomes and gene sequences, genus-level assignments of the 16S rRNA gene amplicons can be less reliable than those of the contigs, likely due to the region of the 16S rRNA gene chosen <xref ref-type="bibr" rid="pone.0093827-Wang1">[54]</xref>, <xref ref-type="bibr" rid="pone.0093827-Werner1">[55]</xref> and the high conservation of the 16S rRNA gene, which can mask important levels of micro-heterogeneity. By assigning taxonomic origin to metagenomic sequences, we were able to get a more detailed sense of the community structure than by 16S rRNA gene sequencing alone, but the confidence with which we can make these assignments remains a challenge. As the databases expand, so does our ability to more accurately assign taxonomy to reads.</p>
<p>Comparing the metagenomic and 16S rRNA amplicon sequences revealed some notable patterns. Many more phyla and genera were identified among the metagenomic than the amplicon sequences, a likely consequence of both the databases used and biases in PCR amplification and amplicon sequencing. The latter biases can produce differences in estimated diversity levels depending on the sequencing platform, the discriminatory power of the region of the 16S rRNA molecule targeted <xref ref-type="bibr" rid="pone.0093827-Claesson1">[53]</xref>, and the fact that some taxa such as <italic>Planctomycetes,</italic> which were seen in higher abundance in the metagenomes (Fig. S4 in <xref ref-type="supplementary-material" rid="pone.0093827.s001">File S1</xref>), are detected less efficiently, or not at all, by some 16S rRNA primer sets <xref ref-type="bibr" rid="pone.0093827-Klindworth1">[56]</xref>. Groups such as <italic>Proteobacteria,</italic> which are represented well in the 16S and genome databases, showed similar abundances between the two approaches. Binning either the contigs or the 16S rDNA amplicons into taxonomic groups at finer-scale resolution (i.e., genus level or species level) provided vastly different pictures of community composition for many, but not all, taxa. We also demonstrated that evaluating genus-level trends masks the variation and diversity of individual “species” or OTUs/genotypes within any genus, which can be partially overcome by binning both metagenomic contigs and 16S rRNA gene sequences into OTU-like units based on recruitment of reads to contigs and percent identities, respectively.</p>
<p>It is clear from our analysis that different patterns arise for different groups of organisms depending on the analysis method used. Metagenomic contigs, 16S rRNA gene sequences encoded in metagenomic data, and 16S rDNA amplicon sequences were sometimes concurrent, especially for taxa that were both abundant in the sample and well-represented in 16S rRNA and genome databases, while other times they provided a vastly different picture of microbial community composition and dynamics. For example, <italic>Synechococcus</italic> populations, one of the most abundant genera detected by both approaches, were tracked with higher resolution, both in terms of number of distinct OTUs present as well as OTU abundance patterns over time, by metagenomics (Fig. S5 in <xref ref-type="supplementary-material" rid="pone.0093827.s001">File S1</xref>). The 16S rDNA amplicon approach clearly has the potential to artificially increase the perceived diversity of a sample more so than the metagenome due to errors or artifacts, as evidenced by our examination of a mixture of known 16S rRNA gene sequences. As long as sufficient reference genomes exist for identification, the metagenome performs well in describing the taxonomic composition of a sample. In addition, metagenomics offers the potential to investigate 16S rRNA gene fragments recovered in metagenomic reads without amplification as well as robust taxonomic assignment of contigs, description of genomic populations based on contig dynamics, and even the reconstruction of full-length 16S rRNA gene sequences.</p>
</sec><sec id="s4c">
<title>Temporal Changes in Microbial Community Composition</title>
<p>In evaluating microbial communities, it is informative to not only quantify the relative abundances of different taxa, but also to track these abundances over time and following potential perturbations such as heavy rainfall or lake turnover. We are particularly interested in such dynamics in Lake Lanier due to its regional significance and the general lack of information on microbial communities in southern temperate lakes. Taking the above limitations in assigning taxonomic affiliations to both 16S rDNA amplicon and metagenomic sequences into account, we observed members of several organisms that showed different patterns of abundance across the four samples taken on a short-term timescale. The microbial communities from Lake Lanier experience broad shifts in community diversity over the course of several months, but the community changed little over the course of 3 days, despite the occurrence of a strong summer storm between the first two sampling timepoints. The resistance of the microbial community to the pulse disturbance of high precipitation was somewhat surprising, given that many microbial communities are sensitive to ecosystem-level disturbances <xref ref-type="bibr" rid="pone.0093827-Allison1">[57]</xref>. However, our observations combined with the fact that there was no discernable difference in the basic water chemistry before and after the storm (Table S1 in <xref ref-type="supplementary-material" rid="pone.0093827.s001">File S1</xref>) indicate that either such a rainfall event was not a chemical or thermal disturbance or that the system recovered more rapidly than our sampling scheme could detect. In contrast, the community changed more substantially between August and November, correlating to <italic>in situ</italic> conditions in the lake such as the transition from stratified to well-mixed (Fig. 
S1 in <xref ref-type="supplementary-material" rid="pone.0093827.s001">File S1</xref>; Table S1 in <xref ref-type="supplementary-material" rid="pone.0093827.s001">File S1</xref>), consistent with previous observations that bacterioplankton often experience seasonal shifts in both lakes <xref ref-type="bibr" rid="pone.0093827-Kent2">[58]</xref>–<xref ref-type="bibr" rid="pone.0093827-Shade1">[60]</xref> and marine environments <xref ref-type="bibr" rid="pone.0093827-Gilbert1">[2]</xref>. Thus, short-term, pulse disturbances related to a meteorological event sometimes have less of an effect on the microbial communities than anticipated while long-term disturbances that occur during lake turnover can cause significant shifts in microbial community composition. The general trends for the microbial community diversity observed from metagenomic reads and 16S rDNA amplicon reads were comparable: both approaches showed similar diversity levels in AUG1, AUG2, and SEPT and that the NOV sample was relatively more diverse. Mixing events have previously been identified as disturbances that can dramatically shift microbial community composition <xref ref-type="bibr" rid="pone.0093827-Shade2">[61]</xref>, <xref ref-type="bibr" rid="pone.0093827-Shade3">[62]</xref>. When mixing events were performed in experimental manipulations, changes in community composition were presumed to be due to the introduction of nutrients from the hypolimnion <xref ref-type="bibr" rid="pone.0093827-Shade2">[61]</xref>. Similar to our observations in the NOV timepoint, epilimnion samples in experimental manipulations were also shown to increase in richness following lake mixing <xref ref-type="bibr" rid="pone.0093827-Shade3">[62]</xref>. 
Using a combination of metagenomics to track contigs and 16S rRNA gene sequencing to track OTUs between the four temporally separated samples from Lake Lanier, we were also able to identify some general patterns in bacterioplankton community composition, although the specific dynamics sometimes differed between the two methods, as noted above. The changes in community composition in Lake Lanier between the first three timepoints and the fall mixing sometimes echoed shifts in individual taxa seen in very different northern lakes that experience ice cover; for example, both LD12, the freshwater <italic>Pelagibacter</italic> relative, and a member of the acIV lineage increased in abundance in NOV in Lake Lanier and also peaked in autumn in a Swedish lake <xref ref-type="bibr" rid="pone.0093827-Eiler1">[25]</xref>. In North Sparkling Bog in the northern US, there was a slight increase in <italic>Gammaproteobacteria</italic> post-mixing, similar to that observed in Lake Lanier <xref ref-type="bibr" rid="pone.0093827-Shade3">[62]</xref>. Despite these similarities, we observed many taxa whose abundances over time did not correspond with those in these northern lakes, indicating that bacterioplankton in southern temperate lakes such as Lake Lanier might behave differently in response to similar seasonal changes than their relatives in northern lakes.</p>
<p>This study provides insights into the Lake Lanier planktonic microbial community and advances the approaches for assessing microbial community diversity and dynamics <italic>in situ</italic>. A combined approach using both metagenomics and 16S rRNA gene sequences can help provide a complete picture, but sequencing controls and replicates are advised, especially when trying to infer diversity levels. Using 16S rRNA gene fragments recovered in a shotgun metagenome has the benefit of removing the initial PCR amplicon biases and providing a means to do both functional genomics and 16S analysis with the same sequence dataset. Here, we demonstrated that Lake Lanier microbial communities are resistant to a short-term rainfall disturbance in the summer, but shift in composition and diversity during the fall mixing, although these shifts do not always correspond to those seen in other, well-studied freshwater lakes. Continued, long-term seasonal characterizations of Lake Lanier will help validate the patterns observed here.</p>
</sec></sec><sec id="s5">
<title>Supporting Information</title>
<supplementary-material id="pone.0093827.s001" mimetype="application/pdf" xlink:href="info:doi/10.1371/journal.pone.0093827.s001" position="float" xlink:type="simple"><label>File S1</label><caption>
<p><bold>The file includes Figures S1 to S6 and Tables S1 to S4.</bold> Figure S1 Dissolved oxygen and temperature profiles for July–December 2009 at the Brown’s Bridge location of Lake Lanier. Figure S2 Number of OTUs identified in each dataset. Figure S3 Similarity of datasets based on shared OTUs. Figure S4 Differences in phylum abundance based on 16S and metagenomes. Figure S5 Differences in abundance of individual genera based on 16S and metagenomes. Figure S6 Abundance of an individual <italic>Burkholderia</italic>-like population based on 16S amplicon vs. 16S metagenomic reads. Table S1 Characteristics of Lake Lanier at Brown’s Bridge for several dates in 2009. Table S2 V1, V3 specific primers used for amplification of the 16S rRNA gene. Table S3 16S rRNA gene amplicon library statistics. Table S4 Metagenome library statistics.</p>
<p>(PDF)</p>
</caption></supplementary-material></sec></body>
<back>
<ack>
<p>We thank R. Fuller for sharing Lake Lanier metadata collected under contract with the Upper Chattahoochee Basin. We also thank Timothy Read and Chad Haase of the Emory University Genomics Facility for sequencing the samples.</p>
</ack>
<ref-list>
<title>References</title>
<ref id="pone.0093827-Costello1"><label>1</label>
<mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Costello</surname><given-names>EK</given-names></name>, <name name-style="western"><surname>Lauber</surname><given-names>CL</given-names></name>, <name name-style="western"><surname>Hamady</surname><given-names>M</given-names></name>, <name name-style="western"><surname>Fierer</surname><given-names>N</given-names></name>, <name name-style="western"><surname>Gordon</surname><given-names>JI</given-names></name>, <etal>et al</etal>. (<year>2009</year>) <article-title>Bacterial community variation in human body habitats across space and time</article-title>. <source>Science</source> <volume>326</volume>: <fpage>1694</fpage>–<lpage>1697</lpage>.</mixed-citation>
</ref>
<ref id="pone.0093827-Gilbert1"><label>2</label>
<mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Gilbert</surname><given-names>JA</given-names></name>, <name name-style="western"><surname>Steele</surname><given-names>JA</given-names></name>, <name name-style="western"><surname>Caporaso</surname><given-names>JG</given-names></name>, <name name-style="western"><surname>Steinbruck</surname><given-names>L</given-names></name>, <name name-style="western"><surname>Reeder</surname><given-names>J</given-names></name>, <etal>et al</etal>. (<year>2012</year>) <article-title>Defining seasonal marine microbial community dynamics</article-title>. <source>ISME J</source> <volume>6</volume>: <fpage>298</fpage>–<lpage>308</lpage>.</mixed-citation>
</ref>
<ref id="pone.0093827-Kent1"><label>3</label>
<mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Kent</surname><given-names>AD</given-names></name>, <name name-style="western"><surname>Jones</surname><given-names>SE</given-names></name>, <name name-style="western"><surname>Yannarell</surname><given-names>AC</given-names></name>, <name name-style="western"><surname>Graham</surname><given-names>JM</given-names></name>, <name name-style="western"><surname>Lauster</surname><given-names>GH</given-names></name>, <etal>et al</etal>. (<year>2004</year>) <article-title>Annual patterns in bacterioplankton community variability in a humic lake</article-title>. <source>Microb Ecol</source> <volume>48</volume>: <fpage>550</fpage>–<lpage>560</lpage>.</mixed-citation>
</ref>
<ref id="pone.0093827-Nemergut1"><label>4</label>
<mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Nemergut</surname><given-names>DR</given-names></name>, <name name-style="western"><surname>Costello</surname><given-names>EK</given-names></name>, <name name-style="western"><surname>Hamady</surname><given-names>M</given-names></name>, <name name-style="western"><surname>Lozupone</surname><given-names>C</given-names></name>, <name name-style="western"><surname>Jiang</surname><given-names>L</given-names></name>, <etal>et al</etal>. (<year>2011</year>) <article-title>Global patterns in the biogeography of bacterial taxa</article-title>. <source>Environ Microbiol</source> <volume>13</volume>: <fpage>135</fpage>–<lpage>144</lpage>.</mixed-citation>
</ref>
<ref id="pone.0093827-Sogin1"><label>5</label>
<mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Sogin</surname><given-names>ML</given-names></name>, <name name-style="western"><surname>Morrison</surname><given-names>HG</given-names></name>, <name name-style="western"><surname>Huber</surname><given-names>JA</given-names></name>, <name name-style="western"><surname>Mark Welch</surname><given-names>D</given-names></name>, <name name-style="western"><surname>Huse</surname><given-names>SM</given-names></name>, <etal>et al</etal>. (<year>2006</year>) <article-title>Microbial diversity in the deep sea and the underexplored “rare biosphere”</article-title>. <source>Proc Natl Acad Sci U S A</source> <volume>103</volume>: <fpage>12115</fpage>–<lpage>12120</lpage>.</mixed-citation>
</ref>
<ref id="pone.0093827-Quince1"><label>6</label>
<mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Quince</surname><given-names>C</given-names></name>, <name name-style="western"><surname>Lanzen</surname><given-names>A</given-names></name>, <name name-style="western"><surname>Curtis</surname><given-names>TP</given-names></name>, <name name-style="western"><surname>Davenport</surname><given-names>RJ</given-names></name>, <name name-style="western"><surname>Hall</surname><given-names>N</given-names></name>, <etal>et al</etal>. (<year>2009</year>) <article-title>Accurate determination of microbial diversity from 454 pyrosequencing data</article-title>. <source>Nat Methods</source> <volume>6</volume>: <fpage>639</fpage>–<lpage>641</lpage>.</mixed-citation>
</ref>
<ref id="pone.0093827-Quince2"><label>7</label>
<mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Quince</surname><given-names>C</given-names></name>, <name name-style="western"><surname>Lanzen</surname><given-names>A</given-names></name>, <name name-style="western"><surname>Davenport</surname><given-names>RJ</given-names></name>, <name name-style="western"><surname>Turnbaugh</surname><given-names>PJ</given-names></name> (<year>2011</year>) <article-title>Removing Noise From Pyrosequenced Amplicons</article-title>. <source>BMC Bioinformatics</source> <volume>12</volume>.</mixed-citation>
</ref>
<ref id="pone.0093827-Youssef1"><label>8</label>
<mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Youssef</surname><given-names>N</given-names></name>, <name name-style="western"><surname>Sheik</surname><given-names>CS</given-names></name>, <name name-style="western"><surname>Krumholz</surname><given-names>LR</given-names></name>, <name name-style="western"><surname>Najar</surname><given-names>FZ</given-names></name>, <name name-style="western"><surname>Roe</surname><given-names>BA</given-names></name>, <etal>et al</etal>. (<year>2009</year>) <article-title>Comparison of species richness estimates obtained using nearly complete fragments and simulated pyrosequencing-generated fragments in 16S rRNA gene-based environmental surveys</article-title>. <source>Appl Environ Microbiol</source> <volume>75</volume>: <fpage>5227</fpage>–<lpage>5236</lpage>.</mixed-citation>
</ref>
<ref id="pone.0093827-Huse1"><label>9</label>
<mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Huse</surname><given-names>SM</given-names></name>, <name name-style="western"><surname>Welch</surname><given-names>DM</given-names></name>, <name name-style="western"><surname>Morrison</surname><given-names>HG</given-names></name>, <name name-style="western"><surname>Sogin</surname><given-names>ML</given-names></name> (<year>2010</year>) <article-title>Ironing out the wrinkles in the rare biosphere through improved OTU clustering</article-title>. <source>Environ Microbiol</source> <volume>12</volume>: <fpage>1889</fpage>–<lpage>1898</lpage>.</mixed-citation>
</ref>
<ref id="pone.0093827-McDonald1"><label>10</label>
<mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>McDonald</surname><given-names>IR</given-names></name>, <name name-style="western"><surname>Kampfer</surname><given-names>P</given-names></name>, <name name-style="western"><surname>Topp</surname><given-names>E</given-names></name>, <name name-style="western"><surname>Warner</surname><given-names>KL</given-names></name>, <name name-style="western"><surname>Cox</surname><given-names>MJ</given-names></name>, <etal>et al</etal>. (<year>2005</year>) <article-title><italic>Aminobacter ciceronei</italic> sp. nov. and <italic>Aminobacter lissarensis</italic> sp. nov., isolated from various terrestrial environments</article-title>. <source>Int J Syst Evol Microbiol</source> <volume>55</volume>: <fpage>1827</fpage>–<lpage>1832</lpage>.</mixed-citation>
</ref>
<ref id="pone.0093827-Konstantinidis1"><label>11</label>
<mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Konstantinidis</surname><given-names>KT</given-names></name>, <name name-style="western"><surname>Ramette</surname><given-names>A</given-names></name>, <name name-style="western"><surname>Tiedje</surname><given-names>JM</given-names></name> (<year>2006</year>) <article-title>The bacterial species definition in the genomic era</article-title>. <source>Philos Trans R Soc B Biol Sci</source> <volume>361</volume>: <fpage>1929</fpage>–<lpage>1940</lpage>.</mixed-citation>
</ref>
<ref id="pone.0093827-RosselloMora1"><label>12</label>
<mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Rossello-Mora</surname><given-names>R</given-names></name>, <name name-style="western"><surname>Amann</surname><given-names>R</given-names></name> (<year>2001</year>) <article-title>The species concept for prokaryotes</article-title>. <source>FEMS Microbiol Rev</source> <volume>25</volume>: <fpage>39</fpage>–<lpage>67</lpage>.</mixed-citation>
</ref>
<ref id="pone.0093827-Shakya1"><label>13</label>
<mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Shakya</surname><given-names>M</given-names></name>, <name name-style="western"><surname>Quince</surname><given-names>C</given-names></name>, <name name-style="western"><surname>Campbell</surname><given-names>JH</given-names></name>, <name name-style="western"><surname>Yang</surname><given-names>ZK</given-names></name>, <name name-style="western"><surname>Schadt</surname><given-names>CW</given-names></name>, <etal>et al</etal>. (<year>2013</year>) <article-title>Comparative metagenomic and rRNA microbial diversity characterization using Archaeal and Bacterial synthetic communities</article-title>. <source>Environ Microbiol</source> <volume>15</volume>: <fpage>1882</fpage>–<lpage>1899</lpage>.</mixed-citation>
</ref>
<ref id="pone.0093827-Burke1"><label>14</label>
<mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Burke</surname><given-names>C</given-names></name>, <name name-style="western"><surname>Steinberg</surname><given-names>P</given-names></name>, <name name-style="western"><surname>Rusch</surname><given-names>D</given-names></name>, <name name-style="western"><surname>Kjelleberg</surname><given-names>S</given-names></name>, <name name-style="western"><surname>Thomas</surname><given-names>T</given-names></name> (<year>2011</year>) <article-title>Bacterial community assembly based on functional genes rather than species</article-title>. <source>Proc Natl Acad Sci U S A</source> <volume>108</volume>: <fpage>14288</fpage>–<lpage>14293</lpage>.</mixed-citation>
</ref>
<ref id="pone.0093827-Gilbert2"><label>15</label>
<mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Gilbert</surname><given-names>JA</given-names></name>, <name name-style="western"><surname>Field</surname><given-names>D</given-names></name>, <name name-style="western"><surname>Swift</surname><given-names>P</given-names></name>, <name name-style="western"><surname>Thomas</surname><given-names>S</given-names></name>, <name name-style="western"><surname>Cummings</surname><given-names>D</given-names></name>, <etal>et al</etal>. (<year>2010</year>) <article-title>The taxonomic and functional diversity of microbes at a temperate coastal site: a ‘multi-omic’ study of seasonal and diel temporal variation</article-title>. <source>PLoS One</source> <volume>5</volume>: <fpage>e15545</fpage>.</mixed-citation>
</ref>
<ref id="pone.0093827-RodriguezBrito1"><label>16</label>
<mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Rodriguez-Brito</surname><given-names>B</given-names></name>, <name name-style="western"><surname>Li</surname><given-names>LL</given-names></name>, <name name-style="western"><surname>Wegley</surname><given-names>L</given-names></name>, <name name-style="western"><surname>Furlan</surname><given-names>M</given-names></name>, <name name-style="western"><surname>Angly</surname><given-names>F</given-names></name>, <etal>et al</etal>. (<year>2010</year>) <article-title>Viral and microbial community dynamics in four aquatic environments</article-title>. <source>ISME J</source> <volume>4</volume>: <fpage>739</fpage>–<lpage>751</lpage>.</mixed-citation>
</ref>
<ref id="pone.0093827-Bazinet1"><label>17</label>
<mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Bazinet</surname><given-names>AL</given-names></name>, <name name-style="western"><surname>Cummings</surname><given-names>MP</given-names></name> (<year>2012</year>) <article-title>A comparative evaluation of sequence classification programs</article-title>. <source>BMC Bioinformatics</source> <volume>13</volume>: <fpage>92</fpage>.</mixed-citation>
</ref>
<ref id="pone.0093827-Aird1"><label>18</label>
<mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Aird</surname><given-names>D</given-names></name>, <name name-style="western"><surname>Ross</surname><given-names>MG</given-names></name>, <name name-style="western"><surname>Chen</surname><given-names>WS</given-names></name>, <name name-style="western"><surname>Danielsson</surname><given-names>M</given-names></name>, <name name-style="western"><surname>Fennell</surname><given-names>T</given-names></name>, <etal>et al</etal>. (<year>2011</year>) <article-title>Analyzing and minimizing PCR amplification bias in Illumina sequencing libraries</article-title>. <source>Genome Biol</source> <comment><bold>12</bold> doi:<ext-link ext-link-type="uri" xlink:href="http://dx.doi.org/10.1186/gb-2011-12-2-r18" xlink:type="simple">10.1186/gb-2011-12-2-r18</ext-link></comment></mixed-citation>
</ref>
<ref id="pone.0093827-GomezAlvarez1"><label>19</label>
<mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Gomez-Alvarez</surname><given-names>V</given-names></name>, <name name-style="western"><surname>Teal</surname><given-names>TK</given-names></name>, <name name-style="western"><surname>Schmidt</surname><given-names>TM</given-names></name> (<year>2009</year>) <article-title>Systematic artifacts in metagenomes from complex microbial communities</article-title>. <source>ISME J</source> <volume>3</volume>: <fpage>1314</fpage>–<lpage>1317</lpage>.</mixed-citation>
</ref>
<ref id="pone.0093827-Shah1"><label>20</label>
<mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Shah</surname><given-names>N</given-names></name>, <name name-style="western"><surname>Tang</surname><given-names>H</given-names></name>, <name name-style="western"><surname>Doak</surname><given-names>TG</given-names></name>, <name name-style="western"><surname>Ye</surname><given-names>Y</given-names></name> (<year>2011</year>) <article-title>Comparing bacterial communities inferred from 16S rRNA gene sequencing and shotgun metagenomics</article-title>. <source>Pac Symp Biocomput</source>: <fpage>165</fpage>–<lpage>176</lpage>.</mixed-citation>
</ref>
<ref id="pone.0093827-Steven1"><label>21</label>
<mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Steven</surname><given-names>B</given-names></name>, <name name-style="western"><surname>Gallegos-Graves</surname><given-names>L</given-names></name>, <name name-style="western"><surname>Starkenburg</surname><given-names>SR</given-names></name>, <name name-style="western"><surname>Chain</surname><given-names>PS</given-names></name>, <name name-style="western"><surname>Kuske</surname><given-names>CR</given-names></name> (<year>2012</year>) <article-title>Targeted and shotgun metagenomic approaches provide different descriptions of dryland soil microbial communities in a manipulated field study</article-title>. <source>Environ Microbiol Rep</source> <volume>4</volume>: <fpage>248</fpage>–<lpage>256</lpage>.</mixed-citation>
</ref>
<ref id="pone.0093827-Portillo1"><label>22</label>
<mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Portillo</surname><given-names>MC</given-names></name>, <name name-style="western"><surname>Anderson</surname><given-names>SP</given-names></name>, <name name-style="western"><surname>Fierer</surname><given-names>N</given-names></name> (<year>2012</year>) <article-title>Temporal variability in the diversity and composition of stream bacterioplankton communities</article-title>. <source>Environ Microbiol</source> <volume>14</volume>: <fpage>2417</fpage>–<lpage>2428</lpage>.</mixed-citation>
</ref>
<ref id="pone.0093827-Yannarell1"><label>23</label>
<mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Yannarell</surname><given-names>AC</given-names></name>, <name name-style="western"><surname>Kent</surname><given-names>AD</given-names></name>, <name name-style="western"><surname>Lauster</surname><given-names>GH</given-names></name>, <name name-style="western"><surname>Kratz</surname><given-names>TK</given-names></name>, <name name-style="western"><surname>Triplett</surname><given-names>EW</given-names></name> (<year>2003</year>) <article-title>Temporal patterns in bacterial communities in three temperate lakes of different trophic status</article-title>. <source>Microb Ecol</source> <volume>46</volume>: <fpage>391</fpage>–<lpage>405</lpage>.</mixed-citation>
</ref>
<ref id="pone.0093827-Zwisler1"><label>24</label>
<mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Zwisler</surname><given-names>W</given-names></name>, <name name-style="western"><surname>Selje</surname><given-names>N</given-names></name>, <name name-style="western"><surname>Simon</surname><given-names>M</given-names></name> (<year>2003</year>) <article-title>Seasonal patterns of the bacterioplankton community composition in a large mesotrophic lake</article-title>. <source>Aquat Microb Ecol</source> <volume>31</volume>: <fpage>211</fpage>–<lpage>225</lpage>.</mixed-citation>
</ref>
<ref id="pone.0093827-Eiler1"><label>25</label>
<mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Eiler</surname><given-names>A</given-names></name>, <name name-style="western"><surname>Heinrich</surname><given-names>F</given-names></name>, <name name-style="western"><surname>Bertilsson</surname><given-names>S</given-names></name> (<year>2012</year>) <article-title>Coherent dynamics and association networks among lake bacterioplankton taxa</article-title>. <source>ISME J</source> <volume>6</volume>: <fpage>330</fpage>–<lpage>342</lpage>.</mixed-citation>
</ref>
<ref id="pone.0093827-Lindstrom1"><label>26</label>
<mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Lindstrom</surname><given-names>ES</given-names></name>, <name name-style="western"><surname>Kamst-Van Agterveld</surname><given-names>MP</given-names></name>, <name name-style="western"><surname>Zwart</surname><given-names>G</given-names></name> (<year>2005</year>) <article-title>Distribution of typical freshwater bacterial groups is associated with pH, temperature, and lake water retention time</article-title>. <source>Appl Environ Microbiol</source> <volume>71</volume>: <fpage>8201</fpage>–<lpage>8206</lpage>.</mixed-citation>
</ref>
<ref id="pone.0093827-Crump1"><label>27</label>
<mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Crump</surname><given-names>RC</given-names></name>, <name name-style="western"><surname>Adams</surname><given-names>HE</given-names></name>, <name name-style="western"><surname>Hobbie</surname><given-names>JE</given-names></name>, <name name-style="western"><surname>Kling</surname><given-names>GW</given-names></name> (<year>2007</year>) <article-title>Biogeography of bacterioplankton in lakes and streams of an Arctic tundra catchment</article-title>. <source>Ecology</source> <volume>88</volume>: <fpage>1365</fpage>–<lpage>1378</lpage>.</mixed-citation>
</ref>
<ref id="pone.0093827-Methe1"><label>28</label>
<mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Methe</surname><given-names>BA</given-names></name>, <name name-style="western"><surname>Zehr</surname><given-names>JP</given-names></name> (<year>1999</year>) <article-title>Diversity of bacterial communities in Adirondack lakes: do species assemblages reflect lake water chemistry?</article-title> <source>Hydrobiologia</source> <volume>401</volume>: <fpage>77</fpage>–<lpage>96</lpage>.</mixed-citation>
</ref>
<ref id="pone.0093827-Oh1"><label>29</label>
<mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Oh</surname><given-names>S</given-names></name>, <name name-style="western"><surname>Caro-Quintero</surname><given-names>A</given-names></name>, <name name-style="western"><surname>Tsementzi</surname><given-names>D</given-names></name>, <name name-style="western"><surname>Deleon-Rodriguez</surname><given-names>N</given-names></name>, <name name-style="western"><surname>Luo</surname><given-names>C</given-names></name>, <etal>et al</etal>. (<year>2011</year>) <article-title>Metagenomic insights into the evolution, function, and complexity of the planktonic microbial community of Lake Lanier, a temperate freshwater ecosystem</article-title>. <source>Appl Environ Microbiol</source> <volume>77</volume>: <fpage>6000</fpage>–<lpage>6011</lpage>.</mixed-citation>
</ref>
<ref id="pone.0093827-Caporaso1"><label>30</label>
<mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Caporaso</surname><given-names>JG</given-names></name>, <name name-style="western"><surname>Kuczynski</surname><given-names>J</given-names></name>, <name name-style="western"><surname>Stombaugh</surname><given-names>J</given-names></name>, <name name-style="western"><surname>Bittinger</surname><given-names>K</given-names></name>, <name name-style="western"><surname>Bushman</surname><given-names>FD</given-names></name>, <etal>et al</etal>. (<year>2010</year>) <article-title>QIIME allows analysis of high-throughput community sequencing data</article-title>. <source>Nat Methods</source> <volume>7</volume>: <fpage>335</fpage>–<lpage>336</lpage>.</mixed-citation>
</ref>
<ref id="pone.0093827-DeSantis1"><label>31</label>
<mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>DeSantis</surname><given-names>TZ</given-names></name>, <name name-style="western"><surname>Hugenholtz</surname><given-names>P</given-names></name>, <name name-style="western"><surname>Larsen</surname><given-names>N</given-names></name>, <name name-style="western"><surname>Rojas</surname><given-names>M</given-names></name>, <name name-style="western"><surname>Brodie</surname><given-names>EL</given-names></name>, <etal>et al</etal>. (<year>2006</year>) <article-title>Greengenes, a chimera-checked 16S rRNA gene database and workbench compatible with ARB</article-title>. <source>Appl Environ Microbiol</source> <volume>72</volume>: <fpage>5069</fpage>–<lpage>5072</lpage>.</mixed-citation>
</ref>
<ref id="pone.0093827-Newton1"><label>32</label>
<mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Newton</surname><given-names>RJ</given-names></name>, <name name-style="western"><surname>Jones</surname><given-names>SE</given-names></name>, <name name-style="western"><surname>Eiler</surname><given-names>A</given-names></name>, <name name-style="western"><surname>McMahon</surname><given-names>KD</given-names></name>, <name name-style="western"><surname>Bertilsson</surname><given-names>S</given-names></name> (<year>2011</year>) <article-title>A Guide to the Natural History of Freshwater Lake Bacteria</article-title>. <source>Microbiol Mol Biol Rev</source> <volume>75</volume>: <fpage>14</fpage>–<lpage>49</lpage>.</mixed-citation>
</ref>
<ref id="pone.0093827-Li1"><label>33</label>
<mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Li</surname><given-names>R</given-names></name>, <name name-style="western"><surname>Zhu</surname><given-names>H</given-names></name>, <name name-style="western"><surname>Ruan</surname><given-names>J</given-names></name>, <name name-style="western"><surname>Qian</surname><given-names>W</given-names></name>, <name name-style="western"><surname>Fang</surname><given-names>X</given-names></name>, <etal>et al</etal>. (<year>2010</year>) <article-title>De novo assembly of human genomes with massively parallel short read sequencing</article-title>. <source>Genome Res</source> <volume>20</volume>: <fpage>265</fpage>–<lpage>272</lpage>.</mixed-citation>
</ref>
<ref id="pone.0093827-Zerbino1"><label>34</label>
<mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Zerbino</surname><given-names>DR</given-names></name>, <name name-style="western"><surname>Birney</surname><given-names>E</given-names></name> (<year>2008</year>) <article-title>Velvet: algorithms for de novo short read assembly using de Bruijn graphs</article-title>. <source>Genome Res</source> <volume>18</volume>: <fpage>821</fpage>–<lpage>829</lpage>.</mixed-citation>
</ref>
<ref id="pone.0093827-Luo1"><label>35</label>
<mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Luo</surname><given-names>C</given-names></name>, <name name-style="western"><surname>Tsementzi</surname><given-names>D</given-names></name>, <name name-style="western"><surname>Kyrpides</surname><given-names>NC</given-names></name>, <name name-style="western"><surname>Konstantinidis</surname><given-names>KT</given-names></name> (<year>2012</year>) <article-title>Individual genome assembly from complex community short-read metagenomic datasets</article-title>. <source>ISME J</source> <volume>6</volume>: <fpage>898</fpage>–<lpage>901</lpage>.</mixed-citation>
</ref>
<ref id="pone.0093827-Zhu1"><label>36</label>
<mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Zhu</surname><given-names>W</given-names></name>, <name name-style="western"><surname>Lomsadze</surname><given-names>A</given-names></name>, <name name-style="western"><surname>Borodovsky</surname><given-names>M</given-names></name> (<year>2010</year>) <article-title><italic>Ab initio</italic> gene identification in metagenomic sequences</article-title>. <source>Nucleic Acids Res</source> <volume>38</volume>: <fpage>e132</fpage>.</mixed-citation>
</ref>
<ref id="pone.0093827-Luo2"><label>37</label>
<mixed-citation publication-type="other" xlink:type="simple">Luo C, Konstantinidis KT (<italic>Under revision</italic>) MyTaxa: an advanced taxonomic classifier for genomic and metagenomic sequences. Nucleic Acids Res.</mixed-citation>
</ref>
<ref id="pone.0093827-Caporaso2"><label>38</label>
<mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Caporaso</surname><given-names>JG</given-names></name>, <name name-style="western"><surname>Lauber</surname><given-names>CL</given-names></name>, <name name-style="western"><surname>Walters</surname><given-names>WA</given-names></name>, <name name-style="western"><surname>Berg-Lyons</surname><given-names>D</given-names></name>, <name name-style="western"><surname>Huntley</surname><given-names>J</given-names></name>, <etal>et al</etal>. (<year>2012</year>) <article-title>Ultra-high-throughput microbial community analysis on the Illumina HiSeq and MiSeq platforms</article-title>. <source>ISME J</source> <volume>6</volume>: <fpage>1621</fpage>–<lpage>1624</lpage>.</mixed-citation>
</ref>
<ref id="pone.0093827-Clarke1"><label>39</label>
<mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Clarke</surname><given-names>KR</given-names></name> (<year>1993</year>) <article-title>Non-parametric multivariate analyses of changes in community structure</article-title>. <source>Aust J Ecol</source> <volume>18</volume>: <fpage>117</fpage>–<lpage>143</lpage>.</mixed-citation>
</ref>
<ref id="pone.0093827-Good1"><label>40</label>
<mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Good</surname><given-names>IJ</given-names></name>, <name name-style="western"><surname>Toulmin</surname><given-names>GH</given-names></name> (<year>1956</year>) <article-title>The Number of New Species, and the Increase in Population Coverage, When a Sample Is Increased</article-title>. <source>Biometrika</source> <volume>43</volume>: <fpage>45</fpage>–<lpage>63</lpage>.</mixed-citation>
</ref>
<ref id="pone.0093827-Hahn1"><label>41</label>
<mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Hahn</surname><given-names>MW</given-names></name> (<year>2003</year>) <article-title>Isolation of strains belonging to the cosmopolitan <italic>Polynucleobacter necessarius</italic> cluster from freshwater habitats located in three climatic zones</article-title>. <source>Appl Environ Microbiol</source> <volume>69</volume>: <fpage>5248</fpage>–<lpage>5254</lpage>.</mixed-citation>
</ref>
<ref id="pone.0093827-Partensky1"><label>42</label>
<mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Partensky</surname><given-names>F</given-names></name>, <name name-style="western"><surname>Hess</surname><given-names>WR</given-names></name>, <name name-style="western"><surname>Vaulot</surname><given-names>D</given-names></name> (<year>1999</year>) <article-title><italic>Prochlorococcus</italic>, a marine photosynthetic prokaryote of global significance</article-title>. <source>Microbiol Mol Biol Rev</source> <volume>63</volume>: <fpage>106</fpage>–<lpage>127</lpage>.</mixed-citation>
</ref>
<ref id="pone.0093827-Corzo1"><label>43</label>
<mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Corzo</surname><given-names>A</given-names></name>, <name name-style="western"><surname>Jimenez-Gomez</surname><given-names>F</given-names></name>, <name name-style="western"><surname>Gordillo</surname><given-names>FJL</given-names></name>, <name name-style="western"><surname>Garcia-Ruiz</surname><given-names>R</given-names></name>, <name name-style="western"><surname>Niell</surname><given-names>FX</given-names></name> (<year>1999</year>) <article-title><italic>Synechococcus</italic> and <italic>Prochlorococcus</italic>-like populations detected by flow cytometry in a eutrophic reservoir in summer</article-title>. <source>J Plankton Res</source> <volume>21</volume>: <fpage>1575</fpage>–<lpage>1581</lpage>.</mixed-citation>
</ref>
<ref id="pone.0093827-Stenuite1"><label>44</label>
<mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Stenuite</surname><given-names>S</given-names></name>, <name name-style="western"><surname>Tarbe</surname><given-names>A-L</given-names></name>, <name name-style="western"><surname>Sarmento</surname><given-names>H</given-names></name>, <name name-style="western"><surname>Unrein</surname><given-names>F</given-names></name>, <name name-style="western"><surname>Pirlot</surname><given-names>S</given-names></name>, <etal>et al</etal>. (<year>2009</year>) <article-title>Photosynthetic picoplankton in Lake Tanganyika: biomass distribution patterns with depth, season and basin</article-title>. <source>J Plankton Res</source> <volume>31</volume>: <fpage>1531</fpage>–<lpage>1544</lpage>.</mixed-citation>
</ref>
<ref id="pone.0093827-RodriguezR1"><label>45</label>
<mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Rodriguez-R</surname><given-names>L</given-names></name>, <name name-style="western"><surname>Konstantinidis</surname><given-names>K</given-names></name> (<year>2013</year>) <article-title>Nonpareil: A redundancy-based approach to assess the level of coverage in metagenomic datasets</article-title>. <source>Bioinformatics</source> <comment>doi:<ext-link ext-link-type="uri" xlink:href="http://dx.doi.org/10.1093/bioinformatics/btt584" xlink:type="simple">10.1093/bioinformatics/btt584</ext-link></comment></mixed-citation>
</ref>
<ref id="pone.0093827-Acinas1"><label>46</label>
<mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Acinas</surname><given-names>SG</given-names></name>, <name name-style="western"><surname>Marcelino</surname><given-names>LA</given-names></name>, <name name-style="western"><surname>Klepac-Ceraj</surname><given-names>V</given-names></name>, <name name-style="western"><surname>Polz</surname><given-names>MF</given-names></name> (<year>2004</year>) <article-title>Divergence and redundancy of 16S rRNA sequences in genomes with multiple rrn operons</article-title>. <source>J Bacteriol</source> <volume>186</volume>: <fpage>2629</fpage>–<lpage>2635</lpage>.</mixed-citation>
</ref>
<ref id="pone.0093827-Konstantinidis2"><label>47</label>
<mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Konstantinidis</surname><given-names>KT</given-names></name>, <name name-style="western"><surname>Tiedje</surname><given-names>JM</given-names></name> (<year>2007</year>) <article-title>Prokaryotic taxonomy and phylogeny in the genomic era: advancements and challenges ahead</article-title>. <source>Curr Opin Microbiol</source> <volume>10</volume>: <fpage>504</fpage>–<lpage>509</lpage>.</mixed-citation>
</ref>
<ref id="pone.0093827-Strous1"><label>48</label>
<mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Strous</surname><given-names>M</given-names></name>, <name name-style="western"><surname>Kraft</surname><given-names>B</given-names></name>, <name name-style="western"><surname>Bisdorf</surname><given-names>R</given-names></name>, <name name-style="western"><surname>Tegetmeyer</surname><given-names>HE</given-names></name> (<year>2012</year>) <article-title>The binning of metagenomic contigs for microbial physiology of mixed cultures</article-title>. <source>Front Microbiol</source> <volume>3</volume>: <fpage>410</fpage>.</mixed-citation>
</ref>
<ref id="pone.0093827-Kalyuzhnaya1"><label>49</label>
<mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Kalyuzhnaya</surname><given-names>MG</given-names></name>, <name name-style="western"><surname>Lapidus</surname><given-names>A</given-names></name>, <name name-style="western"><surname>Ivanova</surname><given-names>N</given-names></name>, <name name-style="western"><surname>Copeland</surname><given-names>AC</given-names></name>, <name name-style="western"><surname>McHardy</surname><given-names>AC</given-names></name>, <etal>et al</etal>. (<year>2008</year>) <article-title>High-resolution metagenomics targets specific functional types in complex microbial communities</article-title>. <source>Nat Biotechnol</source> <volume>26</volume>: <fpage>1029</fpage>–<lpage>1034</lpage>.</mixed-citation>
</ref>
<ref id="pone.0093827-Sharpton1"><label>50</label>
<mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Sharpton</surname><given-names>TJ</given-names></name>, <name name-style="western"><surname>Riesenfeld</surname><given-names>SJ</given-names></name>, <name name-style="western"><surname>Kembel</surname><given-names>SW</given-names></name>, <name name-style="western"><surname>Ladau</surname><given-names>J</given-names></name>, <name name-style="western"><surname>O’Dwyer</surname><given-names>JP</given-names></name>, <etal>et al</etal>. (<year>2011</year>) <article-title>PhylOTU: a high-throughput procedure quantifies microbial community diversity and resolves novel taxa from metagenomic data</article-title>. <source>PLoS Comput Biol</source> <volume>7</volume>: <fpage>e1001061</fpage>.</mixed-citation>
</ref>
<ref id="pone.0093827-Miller1"><label>51</label>
<mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Miller</surname><given-names>CS</given-names></name>, <name name-style="western"><surname>Baker</surname><given-names>BJ</given-names></name>, <name name-style="western"><surname>Thomas</surname><given-names>BC</given-names></name>, <name name-style="western"><surname>Singer</surname><given-names>SW</given-names></name>, <name name-style="western"><surname>Banfield</surname><given-names>JF</given-names></name> (<year>2011</year>) <article-title>EMIRGE: reconstruction of full-length ribosomal genes from microbial community short read sequencing data</article-title>. <source>Genome Biol</source> <volume>12</volume>: <fpage>R44</fpage>.</mixed-citation>
</ref>
<ref id="pone.0093827-Bokulich1"><label>52</label>
<mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Bokulich</surname><given-names>NA</given-names></name>, <name name-style="western"><surname>Subramanian</surname><given-names>S</given-names></name>, <name name-style="western"><surname>Faith</surname><given-names>JJ</given-names></name>, <name name-style="western"><surname>Gevers</surname><given-names>D</given-names></name>, <name name-style="western"><surname>Gordon</surname><given-names>JI</given-names></name>, <etal>et al</etal>. (<year>2013</year>) <article-title>Quality-filtering vastly improves diversity estimates from Illumina amplicon sequencing</article-title>. <source>Nat Methods</source> <volume>10</volume>: <fpage>57</fpage>–<lpage>59</lpage>.</mixed-citation>
</ref>
<ref id="pone.0093827-Claesson1"><label>53</label>
<mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Claesson</surname><given-names>MJ</given-names></name>, <name name-style="western"><surname>Wang</surname><given-names>Q</given-names></name>, <name name-style="western"><surname>O’Sullivan</surname><given-names>O</given-names></name>, <name name-style="western"><surname>Greene-Diniz</surname><given-names>R</given-names></name>, <name name-style="western"><surname>Cole</surname><given-names>JR</given-names></name>, <etal>et al</etal>. (<year>2010</year>) <article-title>Comparison of two next-generation sequencing technologies for resolving highly complex microbiota composition using tandem variable 16S rRNA gene regions</article-title>. <source>Nucleic Acids Res</source> <volume>38</volume>: <fpage>e200</fpage>.</mixed-citation>
</ref>
<ref id="pone.0093827-Wang1"><label>54</label>
<mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Wang</surname><given-names>Q</given-names></name>, <name name-style="western"><surname>Garrity</surname><given-names>GM</given-names></name>, <name name-style="western"><surname>Tiedje</surname><given-names>JM</given-names></name>, <name name-style="western"><surname>Cole</surname><given-names>JR</given-names></name> (<year>2007</year>) <article-title>Naive Bayesian classifier for rapid assignment of rRNA sequences into the new bacterial taxonomy</article-title>. <source>Appl Environ Microbiol</source> <volume>73</volume>: <fpage>5261</fpage>–<lpage>5267</lpage>.</mixed-citation>
</ref>
<ref id="pone.0093827-Werner1"><label>55</label>
<mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Werner</surname><given-names>JJ</given-names></name>, <name name-style="western"><surname>Koren</surname><given-names>O</given-names></name>, <name name-style="western"><surname>Hugenholtz</surname><given-names>P</given-names></name>, <name name-style="western"><surname>DeSantis</surname><given-names>TZ</given-names></name>, <name name-style="western"><surname>Walters</surname><given-names>WA</given-names></name>, <etal>et al</etal>. (<year>2012</year>) <article-title>Impact of training sets on classification of high-throughput bacterial 16S rRNA gene surveys</article-title>. <source>ISME J</source> <volume>6</volume>: <fpage>94</fpage>–<lpage>103</lpage>.</mixed-citation>
</ref>
<ref id="pone.0093827-Klindworth1"><label>56</label>
<mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Klindworth</surname><given-names>A</given-names></name>, <name name-style="western"><surname>Pruesse</surname><given-names>E</given-names></name>, <name name-style="western"><surname>Schweer</surname><given-names>T</given-names></name>, <name name-style="western"><surname>Peplies</surname><given-names>J</given-names></name>, <name name-style="western"><surname>Quast</surname><given-names>C</given-names></name>, <etal>et al</etal>. (<year>2013</year>) <article-title>Evaluation of general 16S ribosomal RNA gene PCR primers for classical and next-generation sequencing-based diversity studies</article-title>. <source>Nucleic Acids Res</source> <volume>41</volume>: <fpage>e1</fpage> <comment>doi:<ext-link ext-link-type="uri" xlink:href="http://dx.doi.org/10.1093/nar/gks808" xlink:type="simple">10.1093/nar/gks808</ext-link></comment></mixed-citation>
</ref>
<ref id="pone.0093827-Allison1"><label>57</label>
<mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Allison</surname><given-names>SD</given-names></name>, <name name-style="western"><surname>Martiny</surname><given-names>JBH</given-names></name> (<year>2008</year>) <article-title>Resistance, resilience, and redundancy in microbial communities</article-title>. <source>Proc Natl Acad Sci U S A</source> <volume>105</volume>: <fpage>11512</fpage>–<lpage>11519</lpage>.</mixed-citation>
</ref>
<ref id="pone.0093827-Kent2"><label>58</label>
<mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Kent</surname><given-names>AD</given-names></name>, <name name-style="western"><surname>Yannarell</surname><given-names>AC</given-names></name>, <name name-style="western"><surname>Rusak</surname><given-names>JA</given-names></name>, <name name-style="western"><surname>Triplett</surname><given-names>EW</given-names></name>, <name name-style="western"><surname>McMahon</surname><given-names>KD</given-names></name> (<year>2007</year>) <article-title>Synchrony in aquatic microbial community dynamics</article-title>. <source>ISME J</source> <volume>1</volume>: <fpage>38</fpage>–<lpage>47</lpage>.</mixed-citation>
</ref>
<ref id="pone.0093827-Newton2"><label>59</label>
<mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Newton</surname><given-names>RJ</given-names></name>, <name name-style="western"><surname>McMahon</surname><given-names>KD</given-names></name> (<year>2011</year>) <article-title>Seasonal differences in bacterial community composition following nutrient additions in a eutrophic lake</article-title>. <source>Environ Microbiol</source> <volume>13</volume>: <fpage>887</fpage>–<lpage>899</lpage>.</mixed-citation>
</ref>
<ref id="pone.0093827-Shade1"><label>60</label>
<mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Shade</surname><given-names>A</given-names></name>, <name name-style="western"><surname>Kent</surname><given-names>AD</given-names></name>, <name name-style="western"><surname>Jones</surname><given-names>SE</given-names></name>, <name name-style="western"><surname>Newton</surname><given-names>RJ</given-names></name>, <name name-style="western"><surname>Triplett</surname><given-names>EW</given-names></name>, <etal>et al</etal>. (<year>2007</year>) <article-title>Interannual dynamics and phenology of bacterial communities in a eutrophic lake</article-title>. <source>Limnol Oceanogr</source> <volume>52</volume>: <fpage>487</fpage>–<lpage>494</lpage>.</mixed-citation>
</ref>
<ref id="pone.0093827-Shade2"><label>61</label>
<mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Shade</surname><given-names>A</given-names></name>, <name name-style="western"><surname>Read</surname><given-names>JS</given-names></name>, <name name-style="western"><surname>Welkie</surname><given-names>DG</given-names></name>, <name name-style="western"><surname>Kratz</surname><given-names>TK</given-names></name>, <name name-style="western"><surname>Wu</surname><given-names>CH</given-names></name>, <etal>et al</etal>. (<year>2011</year>) <article-title>Resistance, resilience and recovery: aquatic bacterial dynamics after water column disturbance</article-title>. <source>Environ Microbiol</source> <volume>13</volume>: <fpage>2752</fpage>–<lpage>2767</lpage>.</mixed-citation>
</ref>
<ref id="pone.0093827-Shade3"><label>62</label>
<mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Shade</surname><given-names>A</given-names></name>, <name name-style="western"><surname>Read</surname><given-names>JS</given-names></name>, <name name-style="western"><surname>Youngblut</surname><given-names>ND</given-names></name>, <name name-style="western"><surname>Fierer</surname><given-names>N</given-names></name>, <name name-style="western"><surname>Knight</surname><given-names>R</given-names></name>, <etal>et al</etal>. (<year>2012</year>) <article-title>Lake microbial communities are resilient after a whole-ecosystem disturbance</article-title>. <source>ISME J</source> <volume>6</volume>: <fpage>2153</fpage>–<lpage>2167</lpage>.</mixed-citation>
</ref>
</ref-list></back>
</article>