<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article
  PUBLIC "-//NLM//DTD Journal Publishing DTD v3.0 20080202//EN" "http://dtd.nlm.nih.gov/publishing/3.0/journalpublishing3.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" article-type="research-article" dtd-version="3.0" xml:lang="en">
  <front>
    <journal-meta><journal-id journal-id-type="nlm-ta">PLoS ONE</journal-id><journal-id journal-id-type="publisher-id">plos</journal-id><journal-id journal-id-type="pmc">plosone</journal-id><issn pub-type="epub">1932-6203</issn><publisher>
        <publisher-name>Public Library of Science</publisher-name>
        <publisher-loc>San Francisco, USA</publisher-loc>
      </publisher></journal-meta>
    <article-meta><article-id pub-id-type="publisher-id">PONE-D-12-12523</article-id><article-id pub-id-type="doi">10.1371/journal.pone.0047132</article-id><article-categories>
        <subj-group subj-group-type="heading">
          <subject>Research Article</subject>
        </subj-group>
        <subj-group subj-group-type="Discipline-v2">
          <subject>Biology</subject>
          <subj-group>
            <subject>Biochemistry</subject>
            <subj-group>
              <subject>Proteins</subject>
              <subj-group>
                <subject>Chromoproteins</subject>
                <subject>Protein structure</subject>
                <subject>Recombinant proteins</subject>
              </subj-group>
            </subj-group>
          </subj-group>
          <subj-group>
            <subject>Biophysics</subject>
            <subj-group>
              <subject>Protein chemistry</subject>
            </subj-group>
          </subj-group>
          <subj-group>
            <subject>Proteomics</subject>
            <subj-group>
              <subject>Protein engineering</subject>
            </subj-group>
          </subj-group>
        </subj-group>
        <subj-group subj-group-type="Discipline">
          <subject>Biophysics</subject>
          <subject>Biochemistry</subject>
        </subj-group>
      </article-categories><title-group><article-title>Crystal Structure of Enhanced Green Fluorescent Protein to 1.35 Å Resolution Reveals Alternative Conformations for Glu222</article-title><alt-title alt-title-type="running-head">EGFP Structure</alt-title></title-group><contrib-group>
        <contrib contrib-type="author" xlink:type="simple">
          <name name-style="western">
            <surname>Arpino</surname>
            <given-names>James A. J.</given-names>
          </name>
          <xref ref-type="aff" rid="aff1">
            <sup>1</sup>
          </xref>
          <xref ref-type="fn" rid="fn1">
            <sup>¤</sup>
          </xref>
        </contrib>
        <contrib contrib-type="author" xlink:type="simple">
          <name name-style="western">
            <surname>Rizkallah</surname>
            <given-names>Pierre J.</given-names>
          </name>
          <xref ref-type="aff" rid="aff2">
            <sup>2</sup>
          </xref>
        </contrib>
        <contrib contrib-type="author" xlink:type="simple">
          <name name-style="western">
            <surname>Jones</surname>
            <given-names>D. Dafydd</given-names>
          </name>
          <xref ref-type="aff" rid="aff1">
            <sup>1</sup>
          </xref>
          <xref ref-type="corresp" rid="cor1">
            <sup>*</sup>
          </xref>
        </contrib>
      </contrib-group><aff id="aff1">
        <label>1</label>
        <addr-line>School of Biosciences, Cardiff University, Cardiff, United Kingdom</addr-line>
      </aff><aff id="aff2">
        <label>2</label>
        <addr-line>School of Medicine, Cardiff University, Cardiff, United Kingdom</addr-line>
      </aff><contrib-group>
        <contrib contrib-type="editor" xlink:type="simple">
          <name name-style="western">
            <surname>Budisa</surname>
            <given-names>Nediljko</given-names>
          </name>
          <role>Editor</role>
          <xref ref-type="aff" rid="edit1"/>
        </contrib>
      </contrib-group><aff id="edit1">
        <addr-line>Berlin Institute of Technology, Germany</addr-line>
      </aff><author-notes>
        <corresp id="cor1">* E-mail: <email xlink:type="simple">jonesdd@cf.ac.uk</email></corresp>
        <fn fn-type="conflict">
          <p>The work was supported by a contribution from Merck KGaA through a BBBSRC sponsored CASE studentship. This does not alter the authors' adherence to all the PLOS ONE policies on sharing data and materials.</p>
        </fn>
        <fn fn-type="con">
          <p>Conceived and designed the experiments: JAJA DDJ. Performed the experiments: JAJA PJR. Analyzed the data: JAJA PJR DDJ. Contributed reagents/materials/analysis tools: JAJA PJR. Wrote the paper: JAJA DDJ.</p>
        </fn>
        <fn fn-type="current-aff" id="fn1">
          <label>¤</label>
          <p>Current address: Centre for Synthetic Biology and Innovation, Imperial College London, London, United Kingdom</p>
        </fn>
      </author-notes><pub-date pub-type="collection">
        <year>2012</year>
      </pub-date><pub-date pub-type="epub">
        <day>16</day>
        <month>10</month>
        <year>2012</year>
      </pub-date><volume>7</volume><issue>10</issue><elocation-id>e47132</elocation-id><history>
        <date date-type="received">
          <day>2</day>
          <month>5</month>
          <year>2012</year>
        </date>
        <date date-type="accepted">
          <day>11</day>
          <month>9</month>
          <year>2012</year>
        </date>
      </history><permissions>
        
        <copyright-holder>Arpino et al</copyright-holder>
        <license xlink:type="simple">
          <license-p>This is an open-access article distributed under the terms of the Creative Commons Attribution License, which permits unrestricted use, distribution, and reproduction in any medium, provided the original author and source are credited.</license-p>
        </license>
      </permissions><abstract>
        <p>Enhanced Green Fluorescent Protein (EGFP) is one of the most widely used engineered variants of the original wild-type Green Fluorescent Protein. Here, we report the high resolution (1.35 Å) structure of EGFP crystallised in its untagged sequence form that reveals the combined impact of the F64L and S65T, that give rise to improved folding and spectral characteristics. The overall structure of EGFP is very similar to wt GFP, forming the classical β-barrel fold with the chromophore containing helix running through the core of the structure. Replacement of Phe64 with Leu in EGFP results in subtle rearrangement of hydrophobic core packing close to the chromophore including the reduction in surface exposure of two hydrophobic residues. Replacement of Ser65 with Thr has a significant impact on the local hydrogen bond network in the vicinity of the chromophore. Detailed analysis of electron density reveals that several residues close to the chromophore occupy at least two distinct conformations. This includes Glu222 that defines the charged state on the chromophore, with the two conformations having slightly different effects on the hydrogen bond network surrounding the chromophore. Hence, the reported high-resolution structure of EGFP has provided a long overdue molecular description of one of the most important fluorescent protein variants currently in general use.</p>
      </abstract><funding-group>
        <funding-statement>JAJA was supported by a BBSRC CASE studentship in collaboration with Merck KGaA. The funders had no role in study design, data collection and analysis, decision to publish, or preparation of the manuscript.</funding-statement>
      </funding-group><counts>
        <page-count count="8"/>
      </counts></article-meta>
  </front>
  <body>
    <sec id="s1">
      <title>Introduction</title>
      <p>Since it's discovery <xref ref-type="bibr" rid="pone.0047132-Shimomura1">[1]</xref> and subsequent use as a genetic protein tag <xref ref-type="bibr" rid="pone.0047132-Chalfie1">[2]</xref>, Green Fluorescent Protein (GFP) from <italic>Aequorea victoria</italic> has become one of the most important and powerful tools in cell biology <xref ref-type="bibr" rid="pone.0047132-Tsien1">[3]</xref>, <xref ref-type="bibr" rid="pone.0047132-Zhang1">[4]</xref>. Its intrinsic fluorescence without the requirement of any additional co-factors or substrates allowed for the first time genetically encoded defined tagging and monitoring of any target protein in the cell. GFP and other since discovered fluorescent proteins from different organisms <xref ref-type="bibr" rid="pone.0047132-Pakhomov1">[5]</xref> are fluorescent due to covalent rearrangement of contiguous amino acids <xref ref-type="bibr" rid="pone.0047132-Tsien1">[3]</xref>. In the case of wt GFP Ser65, Tyr66 and Gly67 main-chain atoms cyclise after the protein folds to form, in the presence of O<sub>2</sub>, the highly conjugated planar <italic>p</italic>-hydroxybenzylideneimidazolinone chromophore <xref ref-type="bibr" rid="pone.0047132-Zhang2">[6]</xref>. The crystal structure of wild-type GFP (wt GFP) <xref ref-type="bibr" rid="pone.0047132-Yang1">[7]</xref>, <xref ref-type="bibr" rid="pone.0047132-Ormo1">[8]</xref> revealed that the chromophore is packed within the core of the GFP β-barrel structure protecting it from quenching through water dipoles, paramagnetic oxygen or <italic>cis-trans</italic> isomerisation. The spectral properties of the GFP chromophore are further tuned through non-covalent interactions with neighboring residues <xref ref-type="bibr" rid="pone.0047132-Tsien1">[3]</xref>.</p>
      <p>The original wt GFP had several major drawbacks that reduced its effectiveness as a tool for cell imaging <xref ref-type="bibr" rid="pone.0047132-Tsien1">[3]</xref>. Its folding efficiency and thus fluorescent signal drops dramatically at physiologically relevant temperatures such as 37°C, its maturation rate is very slow and it had a strong tendency to aggregate. Two separate excitation peaks were also observed due to the coexistence of neutral (λ<sub>ex</sub>∼395 nm) and phenolate (λ<sub>ex</sub>∼490 nm) forms of the chromophore <xref ref-type="bibr" rid="pone.0047132-Heim1">[9]</xref>. Excitation at ∼490 nm was preferred as its lower energy is less damaging to the cell. However, the 490 nm excitation wavelength was only a minor contributor to fluorescence (∼15% compared to excitation at ∼395 nm). Protein engineering has solved many of the problems associated with wt GFP so facilitating its rapid and wide spread use <xref ref-type="bibr" rid="pone.0047132-Tsien1">[3]</xref>–<xref ref-type="bibr" rid="pone.0047132-Pakhomov1">[5]</xref>, <xref ref-type="bibr" rid="pone.0047132-LippincottSchwartz1">[10]</xref>. One of the first and most important engineered versions of wt GFP was enhanced GFP (EGFP) <xref ref-type="bibr" rid="pone.0047132-Cormack1">[11]</xref>, <xref ref-type="bibr" rid="pone.0047132-Yang2">[12]</xref>. EGFP has greater folding efficiency (increased fluorescence due to a higher proportion of correctly folded protein) at 37°C, has a single excitation peak at ∼490 nm and has been codon optimized for expression in mammalian hosts. Two mutations that generate EGFP, F64L and S65T, contribute to these improved properties. S65T is considered essential for suppressing the 395 nm excitation peak through modulation of the ionized state of nearby Glu222, whilst the F64L mutation is responsible for improved folding efficiency at 37°C. In wt GFP, Ser65 donates a hydrogen bond to the carboxyl group of Glu222 and promotes the deprotonated form. Electrostatic repulsion prevents both the Glu222 and the chromophore occupying the same anionic state.</p>
      <p>EGFP is still one of the most widely utilized of all the GFP variants but its native sequence structure in the absence of any tag has not been determined to high resolution so as to fully understand the impact and context of the F64L and S65T mutations. The only available structure of EGFP-like protein available in the PDB was determined only very recently at the slightly lower resolution of 1.5 Å, and with an N-terminal protein purification affinity [His] tag present <xref ref-type="bibr" rid="pone.0047132-Royant1">[13]</xref>, accession code 2Y0G. Here we report the crystal structure of the native EGFP without any purification tags present to 1.35 Å resolution. Analysis of the structure suggests that the mutations have subtle yet important effects on the side chain packing and hydrogen bond network surrounding the chromophore. The high resolution data has identified several residues close to the chromophore that exist in multiple conformations. These include Glu222, which defines the charge character of the chromophore, Leu18 and Leu44. Our work independently confirms the presence of alternate conformations previously observed for Glu222 but with significant differences in side chain placement in the additional conformer. The observation of alternate conformers for Leu18 and Leu44 has not been previously reported to our knowledge.</p>
    </sec>
    <sec id="s2">
      <title>Results and Discussion</title>
      <sec id="s2a">
        <title>General characterisation of EGFP</title>
        <p>EGFP was purified in its native sequence form, encompassing residues 1-Met-Val-Ser to Leu-Tyr-Lys-238 without any affinity purification tag attached at the N- or C-termini. The spectral characteristics of the pure protein were similar to those already reported for EGFP <xref ref-type="bibr" rid="pone.0047132-Patterson1">[14]</xref>, with λ<sub>ex</sub> and λ<sub>em</sub> of 488 nm and 511 nm, respectively, ε of 55 mM<sup>−1</sup> cm<sup>−1</sup>, a quantum efficiency of 0.6 and brightness of 33 mM<sup>−1</sup> cm<sup>−1</sup>. Size exclusion chromatography (Methods S1) confirmed EGFP was predominantly monomeric (<xref ref-type="supplementary-material" rid="pone.0047132.s001">Figure S1</xref>).</p>
      </sec>
      <sec id="s2b">
        <title>Crystal structure of EGFP</title>
        <p>The crystal structure of EGFP showing residues Lys3 to Leu231 was determined as described in the Methods and Materials. Crystals grew in the space group P2<sub>1</sub>2<sub>1</sub>2<sub>1</sub> and contained a single molecule in the asymmetric unit. The structure was determined to a resolution of 1.35 Å and refined to an R and R<sub>free</sub> of 12.8% and 16.8%, respectively (<xref ref-type="table" rid="pone-0047132-t001">Table 1</xref>). The final refinement statistics and model geometry fall within the expected range (<xref ref-type="table" rid="pone-0047132-t001">Table 1</xref>).</p>
        <table-wrap id="pone-0047132-t001" orientation="portrait" position="float"><object-id pub-id-type="doi">10.1371/journal.pone.0047132.t001</object-id><label>Table 1</label><caption>
            <title>Cystallographic statistics.</title>
          </caption><alternatives>
            <graphic id="pone-0047132-t001-1" mimetype="image" orientation="portrait" position="float" xlink:href="info:doi/10.1371/journal.pone.0047132.t001" xlink:type="simple"/>
            <table>
              <colgroup span="1">
                <col align="left" span="1"/>
                <col align="center" span="1"/>
              </colgroup>
              <thead>
                <tr>
                  <td align="left" colspan="2" rowspan="1">Data reduction statistics</td>
                </tr>
                <tr>
                  <td align="left" colspan="1" rowspan="1">Beamline</td>
                  <td align="left" colspan="1" rowspan="1">Diamond I02</td>
                </tr>
              </thead>
              <tbody>
                <tr>
                  <td align="left" colspan="1" rowspan="1">Wavelength (Å)</td>
                  <td align="left" colspan="1" rowspan="1">
                    <italic>0.97988</italic>
                  </td>
                </tr>
                <tr>
                  <td align="left" colspan="1" rowspan="1">Space group</td>
                  <td align="left" colspan="1" rowspan="1"><italic>P</italic>2(1)2(1)2(1)</td>
                </tr>
                <tr>
                  <td align="left" colspan="1" rowspan="1">a (Å)</td>
                  <td align="left" colspan="1" rowspan="1">51.1</td>
                </tr>
                <tr>
                  <td align="left" colspan="1" rowspan="1">b (Å)</td>
                  <td align="left" colspan="1" rowspan="1">62.2</td>
                </tr>
                <tr>
                  <td align="left" colspan="1" rowspan="1">c (Å)</td>
                  <td align="left" colspan="1" rowspan="1">69.6</td>
                </tr>
                <tr>
                  <td align="left" colspan="1" rowspan="1">Resolution range (Å)</td>
                  <td align="left" colspan="1" rowspan="1">46.42 - 1.35</td>
                </tr>
                <tr>
                  <td align="left" colspan="1" rowspan="1">Total reflections measured</td>
                  <td align="left" colspan="1" rowspan="1">225405</td>
                </tr>
                <tr>
                  <td align="left" colspan="1" rowspan="1">Unique reflections</td>
                  <td align="left" colspan="1" rowspan="1">49477</td>
                </tr>
                <tr>
                  <td align="left" colspan="1" rowspan="1">Completeness (%) (last shell)</td>
                  <td align="left" colspan="1" rowspan="1">99.8 (99.5)</td>
                </tr>
                <tr>
                  <td align="left" colspan="1" rowspan="1">I/σ (last shell)</td>
                  <td align="left" colspan="1" rowspan="1">5.0 (2.0)</td>
                </tr>
                <tr>
                  <td align="left" colspan="1" rowspan="1">R(merge)<xref ref-type="table-fn" rid="nt101">a</xref> (%) (last shell)</td>
                  <td align="left" colspan="1" rowspan="1">9.3 (38.6)</td>
                </tr>
                <tr>
                  <td align="left" colspan="1" rowspan="1">B(iso) from Wilson (Å<sup>2</sup>)</td>
                  <td align="left" colspan="1" rowspan="1">10.6</td>
                </tr>
              </tbody>
            </table>
            <table>
              <colgroup span="1">
                <col align="left" span="1"/>
                <col align="center" span="1"/>
              </colgroup>
              <thead>
                <tr>
                  <td align="left" colspan="2" rowspan="1">Refinement statistics</td>
                </tr>
              </thead>
              <tbody>
                <tr>
                  <td align="left" colspan="1" rowspan="1">Protein atoms excluding H</td>
                  <td align="left" colspan="1" rowspan="1">2385</td>
                </tr>
                <tr>
                  <td align="left" colspan="1" rowspan="1">Solvent molecules</td>
                  <td align="left" colspan="1" rowspan="1">393</td>
                </tr>
                <tr>
                  <td align="left" colspan="1" rowspan="1">R-factor<xref ref-type="table-fn" rid="nt102">b</xref> (%)</td>
                  <td align="left" colspan="1" rowspan="1">12.8</td>
                </tr>
                <tr>
                  <td align="left" colspan="1" rowspan="1">R-free<xref ref-type="table-fn" rid="nt103">c</xref> (%)</td>
                  <td align="left" colspan="1" rowspan="1">16.8</td>
                </tr>
                <tr>
                  <td align="left" colspan="1" rowspan="1">Rmsd bond lengths (Å)</td>
                  <td align="left" colspan="1" rowspan="1">0.017</td>
                </tr>
              </tbody>
            </table>
            <table>
              <colgroup span="1">
                <col align="left" span="1"/>
                <col align="center" span="1"/>
              </colgroup>
              <thead>
                <tr>
                  <td align="left" colspan="2" rowspan="1">Ramachandran plot statistics</td>
                </tr>
              </thead>
              <tbody>
                <tr>
                  <td align="left" colspan="1" rowspan="1">Rmsd angles (°)</td>
                  <td align="left" colspan="1" rowspan="1">2.0</td>
                </tr>
                <tr>
                  <td align="left" colspan="1" rowspan="1">Core region (%)</td>
                  <td align="left" colspan="1" rowspan="1">92.7</td>
                </tr>
                <tr>
                  <td align="left" colspan="1" rowspan="1">Allowed region (%)</td>
                  <td align="left" colspan="1" rowspan="1">7.3</td>
                </tr>
                <tr>
                  <td align="left" colspan="1" rowspan="1">Additionally allowed region (%)</td>
                  <td align="left" colspan="1" rowspan="1">0.0</td>
                </tr>
                <tr>
                  <td align="left" colspan="1" rowspan="1">Disallowed region (%)</td>
                  <td align="left" colspan="1" rowspan="1">0.0</td>
                </tr>
              </tbody>
            </table>
          </alternatives><table-wrap-foot>
            <fn id="nt101">
              <label>a</label>
              <p><inline-formula><inline-graphic xlink:href="info:doi/10.1371/journal.pone.0047132.e001" xlink:type="simple"/></inline-formula>.</p>
            </fn>
            <fn id="nt102">
              <label>b</label>
              <p><inline-formula><inline-graphic xlink:href="info:doi/10.1371/journal.pone.0047132.e002" xlink:type="simple"/></inline-formula>.</p>
            </fn>
            <fn id="nt103">
              <label>c</label>
              <p><italic>R<sub>free</sub></italic> is calculated from a set of 5% randomly selected reflections that were excluded from refinement.</p>
            </fn>
          </table-wrap-foot></table-wrap>
        <p>The crystal structure of EGFP displays the traditional β-barrel structure with the chromophore located in the core of the protein (<xref ref-type="fig" rid="pone-0047132-g001">Figure 1A</xref>). Secondary structure assignment using DSSP revealed that 11 strands make up the β-barrel core, corresponding to 47% of protein secondary structure. Only 13% is helical, with the core helix containing the chromophore being a mixture of the 3<sub>10</sub> and α conformations. Whilst secondary structure assignment using DSSP identified the 3<sub>10</sub> helix in the core of the protein (Pro56 – Leu60) it failed to identify residues Val61 – Leu64 as being α-helical in nature. Structural analysis of the residues in the central helix identify an i to i+3 hydrogen bonding pattern between residues Pro56 to Leu60 corresponding to a 3<sub>10</sub> helix, despite proline being considered as a typical helix breaker, whilst an i to i+4 hydrogen bonding pattern is seen from residues Leu60 to Leu64 corresponding to an α-helix (<xref ref-type="fig" rid="pone-0047132-g001">Figure 1A</xref>). The remaining 40% of the structure is comprised of coil mostly from loops located at the two ends of the β-barrel structure (<xref ref-type="fig" rid="pone-0047132-g001">Figure 1A</xref>). A full list of secondary structure assignments can be found in <xref ref-type="supplementary-material" rid="pone.0047132.s006">Table S1</xref>.</p>
        <fig id="pone-0047132-g001" orientation="portrait" position="float">
          <object-id pub-id-type="doi">10.1371/journal.pone.0047132.g001</object-id>
          <label>Figure 1</label>
          <caption>
            <title>Structure of EGFP.</title>
            <p>(A) Ribbon representation of EGFP highlighting β-strands in green, helices in red and loops in pale green. <bold>Inset</bold>, Stick representation of the central helix forming residues (main chain only) in the 3<sub>10</sub> conformation (dark red) and in the α conformation (yellow). Residue Leu60 (orange) is involved in hydrogen bonding in the 3<sub>10</sub> portion of the helix (grey dashed lines) and the α portion of the helix (black dashed lines). (B) B-Factor putty representation of EGFP with chromophore shown as sticks. The B-factor color scale is shown to the right. The regions with high B-factors (shown as bulges) are: K3 to G10 (N-terminus); G115 to D116; K131 to G134; A154 to I161; P187 to P196; K209 to E213; G228 to L231 (C-terminus).</p>
          </caption>
          <graphic mimetype="image" orientation="portrait" position="float" xlink:href="info:doi/10.1371/journal.pone.0047132.g001" xlink:type="simple"/>
        </fig>
        <p>A B-factor ‘putty’ (or ‘sausage’) representation of EGFP (<xref ref-type="fig" rid="pone-0047132-g001">Figure 1B</xref>) highlights increased B-factor values for residues at the N- and C-termini and in several loops connecting ordered secondary structures. This may be an indication of increased mobility in these regions and could be considered as possible target sites for future protein engineering endeavors. Overall the B-factor values observed for the higher resolution EGFP, 4EUL, are slightly lower in comparison to those observed for the previously determined lower resolution structure, 2Y0G, providing increased confidence in the placement of side chains in the structure determined here. This has implications in terms of the certainty of alternate side chain conformations observed for EGFP (<italic>vide infra</italic>).</p>
        <p>Despite the mature chromophore requiring protection from the external environment to maintain fluorescence several structured water molecules are also found within the core of the protein (<xref ref-type="fig" rid="pone-0047132-g002">Figure 2</xref>), some of which are critical to the fluorescent properties. Whilst all of these waters superimpose with waters from the lower resolution EGFP structure 2Y0G, two of the waters (W<sub>5</sub> and W<sub>6</sub>) are absent in both structures for wt GFP (1GFL) and for S65T GFP (1EMA).</p>
        <fig id="pone-0047132-g002" orientation="portrait" position="float">
          <object-id pub-id-type="doi">10.1371/journal.pone.0047132.g002</object-id>
          <label>Figure 2</label>
          <caption>
            <title>Chromophore local environment.</title>
            <p>Stereo view of the chromophore local environment with 2F<sub>o</sub>-F<sub>c</sub> electron density map contoured to 1σ, highlighting the presence of several conserved water molecules and hydrogen bonding interactions (blue dashed lines). Whilst waters W<sub>1</sub> to W<sub>4</sub> are present in both wt GFP and S65T GFP W<sub>5</sub> and W<sub>6</sub> are absent. W<sub>1</sub> to W<sub>6</sub> are all present in the lower resolution EGFP structure 2Y0G. W<sub>1</sub> to W<sub>6</sub> refer to solvent molecules 413, 442, 564, 421, 494 and 547 respectively in structure 4EUL.</p>
          </caption>
          <graphic mimetype="image" orientation="portrait" position="float" xlink:href="info:doi/10.1371/journal.pone.0047132.g002" xlink:type="simple"/>
        </fig>
      </sec>
      <sec id="s2c">
        <title>Comparison of EGFP structures with wild-type GFP and S65T GFP structures</title>
        <p>Superpositioning of the structure obtained for EGFP with that of wt GFP (PDB entry 1GFL <xref ref-type="bibr" rid="pone.0047132-Yang1">[7]</xref>) and a S65T GFP mutant (PDB entry 1EMA <xref ref-type="bibr" rid="pone.0047132-Ormo1">[8]</xref>) shows that the overall structures are very similar (<xref ref-type="fig" rid="pone-0047132-g003">Figure 3A</xref>); the RMSD over the backbone and all atoms of EGFP and wt GFP is 0.40 Å and 1.03 Å respectively, whilst the RMSD over backbone and all atoms of EGFP and S65T GFP are 0.29 Å and 0.85 Å, respectively. This indicates that the F64L and S65T mutations do not have a significant effect on the overall protein structure but have more subtle effects. Secondary structure analysis revealed the boundaries between the different elements in wt GFP and EGFP (<xref ref-type="supplementary-material" rid="pone.0047132.s006">Table S1</xref>) are very similar.</p>
        <fig id="pone-0047132-g003" orientation="portrait" position="float">
          <object-id pub-id-type="doi">10.1371/journal.pone.0047132.g003</object-id>
          <label>Figure 3</label>
          <caption>
            <title>Structural comparison of wt GFP, S65T GFP and EGFP.</title>
            <p>(A) overlay of EGFP (green), wt GFP (grey) and S65T GFP (cyan). (B) Stereo view of the influence of the S65T mutation on local hydrogen bond network. EGFP, wt GFP and S65T GFP coloured as in A. Hydrogen bonds associated with EGFP, wt GFP and S65T GFP are yellow, red and blue dashed lines respectively.</p>
          </caption>
          <graphic mimetype="image" orientation="portrait" position="float" xlink:href="info:doi/10.1371/journal.pone.0047132.g003" xlink:type="simple"/>
        </fig>
        <p>Superposition of the present model, 4EUL, with the lower resolution 2Y0G structure with an extended N-terminal His-tag (MAHHHHHHGHHH) sequence, reveals a RMSD of 0.59 Å when all common atoms are considered, including side chains. This indicates that both structures are largely identical. Thus, the presence of the longer than normal His tag sequence element in 2Y0G does not appear to greatly influence the overall structure. Both suffer from disordered termini. Whilst there are a number of identical residues in both versions of the EGFP structure that have been refined with multiple conformers, there are several that are only present in one or the other structure. These will be discussed in more detail below.</p>
      </sec>
      <sec id="s2d">
        <title>Influence of F64L on EGFP structure</title>
        <p>Given the high resolution of the EGFP structure, the exact placement of side chains can be defined with high confidence. The F64L mutation confers increased folding efficiency to GFP at 37°C but the structural consequences of this mutation in the context of the S65T mutation have not been fully investigated. The most obvious effect of the F64L mutation comprises the exchange of the bulky and buried phenylalanine side chain for a smaller leucine side chain in the central chromophore containing helical structure (<xref ref-type="fig" rid="pone-0047132-g004">Figure 4A</xref>). The substitution causes β-strand 2 to pack tighter with the core. The largest observed variation between wt GFP and EGFP was centred on residue Val29, with deviation of 1.37 Å across all atoms (<xref ref-type="fig" rid="pone-0047132-g004">Figure 4A</xref>). Val29 shifts closer to the chromophore upon the additional space being made available by loss of the aromatic Phe64 side chain. Residue Leu18 also shifts positions with the electron density only fully satisfied by modelling two alternate side chain conformations (<xref ref-type="fig" rid="pone-0047132-g004">Figure 4B</xref>), both of which differ from the side chain conformation of wt GFP Leu18 (<xref ref-type="fig" rid="pone-0047132-g004">Figure 4A</xref>). To satisfy the electron density the two conformations were modelled with an occupancy of 0.7 for conformer A and 0.3 for conformer B (<xref ref-type="fig" rid="pone-0047132-g004">Figure 4</xref>). Conformer A and B of Leu18 have observed RMSDs of 0.53 Å and 1.22 Å between wt GFP and EGFP across all atoms respectively. Both conformers exhibit a rotation of the Leu18 isobutyl side chain away from the edge of the β-barrel towards the core of the protein (<xref ref-type="fig" rid="pone-0047132-g004">Figure 4A</xref>). Whilst the lower resolution 2Y0G structure also shows rotation of the Leu18 isobutyl side chain away from the edge of the β-barrel it was not modelled by two conformers as seen in the present structure (<xref ref-type="supplementary-material" rid="pone.0047132.s005">Figure S5</xref>).</p>
        <fig id="pone-0047132-g004" orientation="portrait" position="float">
          <object-id pub-id-type="doi">10.1371/journal.pone.0047132.g004</object-id>
          <label>Figure 4</label>
          <caption>
            <title>Effect of F64L mutation on EGFP structure.</title>
            <p>(A) Structural effects of the F64L mutation on the positions of L18, F27, V29, W57 and L64. EGFP and wt GFP coloured as in A. (B) 2F<sub>o</sub>-F<sub>c</sub> electron density map, contoured to 1σ, of the L18 double conformation. Each conformer is coloured green (fit to 70% occupancy) and yellow (fit to 30% occupancy).</p>
          </caption>
          <graphic mimetype="image" orientation="portrait" position="float" xlink:href="info:doi/10.1371/journal.pone.0047132.g004" xlink:type="simple"/>
        </fig>
        <p>There is also a slight shift of residue Trp57 away from the surface of the protein towards Leu64, resulting in an RMSD over the side chain atoms of 0.39 Å (<xref ref-type="fig" rid="pone-0047132-g004">Figure 4A</xref>), decreasing its solvent accessible surface area in EGFP (12.8 Å<sup>2</sup>) with respect to wt GFP (15.2 Å<sup>2</sup>). Trp57 lies in the proline rich PVPWP pentapeptide sequence found in a variety of different proteins and, along with Val55 has been reported to be essential for function as mutation to other residues render EGFP non-fluorescent <xref ref-type="bibr" rid="pone.0047132-Budisa1">[15]</xref>, <xref ref-type="bibr" rid="pone.0047132-Steiner1">[16]</xref>. The bulky side chain of Phe27 also moves towards the core of the protein with an RMSD over the side chain atoms of 0.41 Å resulting in a decreased solvent accessible surface area in EGFP (1.7 Å<sup>2</sup>) with respect to wt GFP (2.6 Å<sup>2</sup>) (<xref ref-type="fig" rid="pone-0047132-g004">Figure 4A</xref>). The repositioning of these residues could potentially influence the folding of EGFP at 37°C through better packing of the hydrophobic residues surrounding the central helix and of the central helix itself, and by reducing surface exposure of hydrophobic residues.</p>
      </sec>
      <sec id="s2e">
        <title>Influence of S65T on EGFP structure</title>
        <p>The S65T mutation has proved to be a more general mutation that can be transplanted to other green fluorescent protein variants to alter their spectral properties through removal of the 395 nm and promotion of the ∼490 nm excitation λ<sub>ex</sub> <xref ref-type="bibr" rid="pone.0047132-Heim2">[17]</xref>, <xref ref-type="bibr" rid="pone.0047132-Brejc1">[18]</xref>, increase the rate of oxidation during chromophore maturation and increase the brightness of the fluorescent proteins <xref ref-type="bibr" rid="pone.0047132-Heim2">[17]</xref>. Analysis of the local environment around the chromophore can explain the molecular basis for the observed spectral properties. Replacement of Ser65 with Thr results in the hydroxyl group of Thr65 in EGFP occupying a different position from the corresponding hydroxyl group of Ser65 in wt GFP (<xref ref-type="fig" rid="pone-0047132-g003">Figure 3</xref>), probably as a result of steric effects due to the additional methyl group of Thr65. The Thr65 side chain in the EGFP structure determined here is in the same orientation as in the previously determined S65T-GFP structures <xref ref-type="bibr" rid="pone.0047132-Brejc1">[18]</xref> (<xref ref-type="fig" rid="pone-0047132-g003">Figure 3B</xref>).</p>
        <p>In contrast to other S65T-GFP structures the electron density of the Glu222 carboxylate side chain in EGFP suggests that it occupies two distinct conformations (<xref ref-type="fig" rid="pone-0047132-g005">Figure 5A</xref>). The electron density difference map produced after molecular replacement and structural refinement displays a tridentate density for Glu222 (<xref ref-type="fig" rid="pone-0047132-g005">Figure 5A</xref>), which was successfully modeled as two conformations of the carboxylate, with substantial difference in the placement of atoms along the side-chain (<xref ref-type="fig" rid="pone-0047132-g005">Figure 5B</xref>). The rationale behind the Glu222 double conformer in EGFP is described in <xref ref-type="supplementary-material" rid="pone.0047132.s002">Figure S2</xref>. The occupancy of conformers A and B were set to 70% and 30%, respectively, in order to satisfy the electron density for this residue. The Glu222 conformer A matches very closely to the position of Glu222 seen in the S65T GFP mutant but differs significantly from that observed for wt GFP (<xref ref-type="fig" rid="pone-0047132-g005">Figure 5B</xref>). This highlights the role of residue 65 in defining the positioning of Glu222. However, conformer B represents a new and different side-chain positioning for this residue, leaving the carboxylate group orientated in a similar direction (but not superimposable) with the Glu222 carboxylate group from wt GFP (<xref ref-type="fig" rid="pone-0047132-g005">Figure 5B</xref>). Tridentate density for Glu222 has only been observed to our knowledge once before in a GFP-derived variant, the recently determined His-tagged EGFP structure 2Y0G <xref ref-type="bibr" rid="pone.0047132-Royant1">[13]</xref>. While conformer A in both these independently determined structures are very similar, conformer B shows obvious differences. With regards to Y20G, the tridentate electron density was refined to show changes largely related to the carboxyl group and not the side-chain as a whole (<xref ref-type="supplementary-material" rid="pone.0047132.s003">Figure S3</xref>), as observed here for 4EUL (<xref ref-type="fig" rid="pone-0047132-g005">Figure 5B</xref> and <xref ref-type="supplementary-material" rid="pone.0047132.s003">Figure S3</xref>). The hydroxyl group of Thr65 now donates a hydrogen bond to the backbone carbonyl of V61 instead of Glu222 (<xref ref-type="fig" rid="pone-0047132-g003">Figure 3B</xref>). However, the hydrogen bonding network related to the carboxylate of Glu222 depends on the conformation sampled, as outlined in <xref ref-type="fig" rid="pone-0047132-g005">Figure 5</xref>. Thus, we have provided important independent proof that Glu222 can exist in two alternate conformations, albeit with slight discrepancies concerning the alternate B conformation, and with the higher resolution structure can position the atoms of the alternate conformer of Glu222 with higher confidence.</p>
        <fig id="pone-0047132-g005" orientation="portrait" position="float">
          <object-id pub-id-type="doi">10.1371/journal.pone.0047132.g005</object-id>
          <label>Figure 5</label>
          <caption>
            <title>Effect of S65T mutation on Glu222 conformation and hydrogen bonding network.</title>
            <p>(A) 2F<sub>o</sub>-F<sub>c</sub> electron density map for the chromophore and E222 (sticks) contoured to 1σ. Tridentate density for E222 modelled to two side chain conformations fit to 70% (E222a) and 30% (E222b) occupancy. (B) Superposition of E222 sidechain conformer A (E222a; green) and B (E222b; yellow) with the E222 side chain from wt GFP (1GFL; grey) and S65T GFP (1EMA; cyan). (C &amp; D) The hydrogen bond network for each E222 conformer is indicated as dashed blue lines. The O<sub>δ1</sub> alternatively donates a hydrogen bond to T65 OH (E222a; C) or S205 OH (E222b; D).</p>
          </caption>
          <graphic mimetype="image" orientation="portrait" position="float" xlink:href="info:doi/10.1371/journal.pone.0047132.g005" xlink:type="simple"/>
        </fig>
        <p>The reason for promotion of the anionic chromophore over the neutral form is thought to be a result of disruption of hydrogen bonding with charged Glu222 on mutation of Ser65 to Thr <xref ref-type="bibr" rid="pone.0047132-Tsien1">[3]</xref>, <xref ref-type="bibr" rid="pone.0047132-Brejc1">[18]</xref>, <xref ref-type="bibr" rid="pone.0047132-Shu1">[19]</xref>. This in turn prevents ionization within the core of the Glu222 carboxylate group so removing an electrostatic clash with the anionic form of the ground state chromophore. In both conformations Glu222 O<sub>δ1</sub> is hydrogen bonded to two conserved water molecules. With respect to Glu222 O<sub>δ2</sub>, in one conformation it donates a hydrogen bond to the hydroxyl group of Thr65 (<xref ref-type="fig" rid="pone-0047132-g005">Figure 5C</xref>) and in the alternate conformation it donates a hydrogen bond to the hydroxyl group of Ser205 (<xref ref-type="fig" rid="pone-0047132-g005">Figure 5D</xref>). In order for Glu222 to donate hydrogen bonds its carboxylate group must be protonated and therefore neutral. This allows charge stabilization on the deprotonated phenol group of the chromophore by hydrogen-bonding interactions from His148, Thr203 and a conserved water molecule coordinated between the backbone carbonyl group of Asn146 and the side chain hydroxyl group of Ser205 (<xref ref-type="fig" rid="pone-0047132-g005">Figure 5C &amp; 5D</xref>). The neutral charge on Glu222 also removes any potential electrostatic clashes between the negative charges on Glu222 and the chromophore, thus allowing the chromophore to be deprotonated in the ground state. This explains why EGFP has a single excitation peak corresponding to the deprotonated state.</p>
        <p>However, given the heterogeneity in the local environment of the chromophore due to the alternate conformations of Glu222 it would be expected that this may be reflected by spectral heterogeneity. This is not the case as is evident from single exponential fluorescence lifetime decays (<xref ref-type="fig" rid="pone-0047132-g006">Figure 6</xref>); the measured fluorescence lifetime was 2.54 ns, similar to that reported previously for EGFP <xref ref-type="bibr" rid="pone.0047132-Stepanenko1">[20]</xref>. Therefore, small alterations in Glu222 conformation are unlikely to have profound effects on the electrostatic environment surrounding the chromophore and thus the fluorescence properties. The two side chain conformations observed for Glu222 could be a crystallographic artifact and both may not be populated in solution. This is unlikely given that the residue is buried within the interior of the protein and alternate conformations for this residue have been observed in a lower resolution structure of the His-tagged EGFP protein <xref ref-type="bibr" rid="pone.0047132-Royant1">[13]</xref>. Alternatively both conformations may exist but could be in a rapid dynamic equilibrium and transiently exchanging between the two conformations. A third possibility could be that upon folding the Glu222 side chain is trapped in one conformation or the other. Further structural analysis by NMR could potentially identify and measure Glu222 side-chain exchange rates in solution to confirm the two conformations observed in the crystal structure.</p>
        <fig id="pone-0047132-g006" orientation="portrait" position="float">
          <object-id pub-id-type="doi">10.1371/journal.pone.0047132.g006</object-id>
          <label>Figure 6</label>
          <caption>
            <title>Fluorescence lifetime analysis of EGFP.</title>
            <p>Photon counts (black dots) measured over 20 ns were fit to a single exponential decay function (green line) with the instrument response function shown as red dots. Residuals for the single exponential decay fit to the data are plotted below the decay curve.</p>
          </caption>
          <graphic mimetype="image" orientation="portrait" position="float" xlink:href="info:doi/10.1371/journal.pone.0047132.g006" xlink:type="simple"/>
        </fig>
      </sec>
      <sec id="s2f">
        <title>Other residues exhibiting multiple conformers</title>
        <p>In addition to Leu18 and Glu222 that lie close in space to the chromophore (<xref ref-type="fig" rid="pone-0047132-g007">Figure 7</xref>), electron density maps indicated other residues occupied multiple conformations including Ser30, Thr43, Leu44, Gln80, Thr97, Lys101, Asp102, Lys113, Asp117, Glu124, Met153, Glu172, Tyr182, Gln184 and Thr186 (<xref ref-type="supplementary-material" rid="pone.0047132.s004">Figure S4</xref>). Whilst the majority of these residues are surface exposed and potentially have the ability to sample multiple conformations freely, residues Leu18 and Leu44 are buried in the core of the protein in close proximity to Glu222 and the chromophore (<xref ref-type="fig" rid="pone-0047132-g007">Figure 7</xref>). Both Leu18 and Leu44 are modeled by single conformations in the lower resolution 2Y0G (<xref ref-type="supplementary-material" rid="pone.0047132.s005">Figure S5</xref>). The electron density for all three residues was best fitted when one conformer occupancy was set to 70% and the other conformer occupancy set to 30%. The implications of the dual conformers in terms of fluorescence characteristics, including whether one represents a fluorescent and the other a non-fluorescent state, are not currently known.</p>
        <fig id="pone-0047132-g007" orientation="portrait" position="float">
          <object-id pub-id-type="doi">10.1371/journal.pone.0047132.g007</object-id>
          <label>Figure 7</label>
          <caption>
            <title>Buried residues with multiple conformers close to the chromophore.</title>
            <p>Cartoon representation of EGFP (green) showing the chromophore (Cro; orange sticks) in close proximity to residues L18, L44 and E222 all of which have been modeled to two conformers; conformer A (green sticks) or conformer B (yellow sticks) were modeled to an occupancy of 70% or 30% respectively.</p>
          </caption>
          <graphic mimetype="image" orientation="portrait" position="float" xlink:href="info:doi/10.1371/journal.pone.0047132.g007" xlink:type="simple"/>
        </fig>
        <p>Comparison of 4EUL with the lower resolution 2Y0G structure identified a number of common double conformers observed between the two structures (S30, T43, K101, D102, D117, E124, E172, Q184, T186 and E222). Additional solvent exposed residues were modeled as double conformers in 2Y0G that were not observed in 4EUL (I47, K79, K107, N164, D190 and D197). Likewise a number of double conformers were modeled in 4EUL that were not observed in 2Y0G (L18, L44, Q80, T97, K113, M153). Leu18, Leu44 and Glu222 aside, given the solvent exposed nature of these residues and the difference in crystallisation conditions (4EUL: 0.1M MES/NaOH, pH 6.5, 200 mM calcium acetate, 20% (w/v) PEG8000. 2Y0G: 50 mM HEPES, pH 8.2, 24% (w/v), 50 mM magnesium chloride, PEG4000, 10 mM β-mercaptoethanol) the difference in double conformers modeled between the two structures are potentially crystallographic artifacts arising due to fixing of particular conformation populations in the crystal during random rotations around the side chain σ-dihedral bonds.</p>
        <p>In conclusion, we have determined the structure of the native sequence to 1.35 Å resolution of the widely used and commercially important enhanced Green Fluorescent Protein. While the core structure and fold of EGFP is very similar to the wild-type GFP, the introduction of the F64L and S65T have subtle yet important effects on the properties of EGFP. These include altered core packing arrangements close to the chromophore and altering hydrogen bonding and charged states of residues close to the chromophore. These changes in turn give rise to the important properties of EGFP that make such a useful tool compared to the wt GFP: better fluorescence excitation characteristics and improved folding at 37°C. Comparison of the EGFP structure determined here (4EUL) with that of an extended N-terminal His-tagged version recently determined at slightly lower resolution (2Y0G) shows that the structures are very similar so the artificial affinity tag is having little overall effect on structure. However, the present higher resolution structure with slightly lower overall B-factor values increases confidence of side chain placement during the model refinement, which becomes crucial when alternate conformations are observed. Our work independently confirms the recent observation of an alternate conformation of Glu222 but here the side chain placement of the alternate conformer is different to that in the lower resolution structure. In addition, alternate conformations were observed for two residues close to the chromophore that were absent from the lower resolution structure suggesting that the presence of alternate conformations go beyond that of just Glu222. Thus, the observed multiple conformations for residues close to the chromophore, including the chromophore charge defining residue Glu222 is intriguing and may be having a yet unknown impact on the fluorescent properties of EGFP.</p>
      </sec>
    </sec>
    <sec id="s3" sec-type="materials|methods">
      <title>Materials and Methods</title>
      <sec id="s3a">
        <title>Protein production and purification</title>
        <p>The production and subsequent purification of EGFP was performed as follows. LB Broth (15 ml) supplemented with 100 µg/ml ampicillin was inoculated with a single colony of <italic>Escherichia coli</italic> BL21 (DE3) Gold containing the plasmid pNOM-XP3-<italic>egfp</italic> to generate a starter culture and incubated overnight at 37°C. A 1/200 dilution of the starter culture was used to inoculate 1 l LB broth supplemented with 100 µg/ml ampicillin and grown at 37°C until an optical density of A<sub>600</sub> = 0.4 was achieved. Protein expression was induced by the addition of 1 mM IPTG. The culture was incubated for 24 hrs at 37°C. The 1 l culture was then harvested by centrifugation (3000× g for 20 mins) and the pellet resuspended in 20 ml 50 mM Tris-HCl pH 8.0 (Buffer A) supplemented with 1 mM PMSF and 1 mM EDTA. The cells were lysed by French press using a chilled pressure cell. The lysate was then centrifuged (20000 rpm in Beckman JA20 rotor for 30 mins) to pellet any cell debris and the supernatant was decanted and stored at 4°C. The cell lysate was applied to a Q-Sepharose (GE healthcare) ion exchange column and elution monitored at 280 nm and 488 nm. Pooled fractions were then subjected to ammonium sulphate precipitation to further purify and concentrate the protein sample. An initial ammonium sulphate concentration of 45% (w/v) was used to precipitate unwanted proteins from solution. Further addition of ammonium sulphate to a final concentration of 75% (w/v) was carried out to precipitate EGFP from solution. The precipitate was resuspended in buffer A (5 ml) and the protein solution was then applied to a SP Superdex 200 gel filtration column (GE Healthcare) with elution monitored at 280 nm and 488 nm. The purified protein sample was finally stored in buffer A supplemented with 150 mM NaCl. A detailed description of absorption and fluorescence methods is provided in Methods S1.</p>
      </sec>
      <sec id="s3b">
        <title>Protein crystallisation and structure determination</title>
        <p>Purified EGFP (10 mg/ml in 50 mM Tris-HCl, pH 8.0 and 150 mM NaCl) was screened for crystal formation by the sitting drop vapour diffusion method with incubation at 4°C. Drops were set up with equal volumes of protein and precipitant solutions (0.5 µl each). Crystals of EGFP were obtained from 0.1 M MES/NaOH, pH 6.5, 200 mM calcium acetate and 20% (w/v) PEG 8000. A crystal was transferred to mother liquor supplemented with 13% (w/v) PEG 200 as a cryoprotectant and vitrified. Data were collected on beamline I02 at the Diamond Light Source, Harwell, UK. Usable diffraction was recorded up to a resolution of 1.35 Å. Data were reduced with the XIA2 package <xref ref-type="bibr" rid="pone.0047132-Winter1">[21]</xref>, space group assignment was done by POINTLESS <xref ref-type="bibr" rid="pone.0047132-Evans1">[22]</xref>, scaling and merging were completed with SCALA <xref ref-type="bibr" rid="pone.0047132-Evans1">[22]</xref> and TRUNCATE <xref ref-type="bibr" rid="pone.0047132-CCP41">[23]</xref>. Initial molecular replacement for the EGFP structure was performed using a previously determined GFP structure (PDB entry 2HQZ) as the search model, using MOLREP <xref ref-type="bibr" rid="pone.0047132-Lebedev1">[24]</xref>. The structure for EGFP was adjusted manually using COOT <xref ref-type="bibr" rid="pone.0047132-Emsley1">[25]</xref> and refinement of the completed molecule was carried out using REFMAC <xref ref-type="bibr" rid="pone.0047132-Murshudov1">[26]</xref>. Protein atoms were refined anisotropically, but residues shown as sphericity outliers by REFMAC were refined isotropically. All non-protein atoms were refined isotropically. The above routines were used as the CCP4 package <xref ref-type="bibr" rid="pone.0047132-CCP41">[23]</xref> (<ext-link ext-link-type="uri" xlink:href="http://www.ccp4.ac.uk" xlink:type="simple">www.ccp4.ac.uk</ext-link>). Graphical representations were made with PyMOL Molecular Graphics System, Schrödinger, LLC.</p>
      </sec>
    </sec>
    <sec id="s4">
      <title>Supporting Information</title>
      <supplementary-material id="pone.0047132.s001" mimetype="image/tiff" orientation="portrait" position="float" xlink:href="info:doi/10.1371/journal.pone.0047132.s001" xlink:type="simple">
        <label>Figure S1</label>
        <caption>
          <p><bold>Size exclusion chromatography of EGFP.</bold> Samples of EGFP were applied to a Superdex™ 75 gel filtration column and the elution monitored at 488 nm. Protein concentrations of 10 µM (solid black line), 25 µM (long dashed line), 50 µM (medium dashed line) or 100 µM (short dashed line) were applied to the column. A small decrease in peak elution volume (∼0.15 ml) was observed with increasing protein concentration (from 10–100 µM), corresponding to a small increase in apparent molecular weight (∼24.6–∼26.8 kDa). The apparent molecular weight was still very close to the theoretical molecular weight calculated from the amino acid sequence (26941 Da). The elution peak was non-symmetrical, suggesting there was more than one oligomeric species present in dynamic equilibrium with the monomeric form; this is consistent with previous observations that wt GFP is largely monomeric with a weak tendency to dimerise.</p>
          <p>(TIFF)</p>
        </caption>
      </supplementary-material>
      <supplementary-material id="pone.0047132.s002" mimetype="image/tiff" orientation="portrait" position="float" xlink:href="info:doi/10.1371/journal.pone.0047132.s002" xlink:type="simple">
        <label>Figure S2</label>
        <caption>
          <p><bold>Rationale behind modelling of E222 as a double conformer.</bold> Modelling of residue E222 as either the single conformer A (A), the single conformer B (B) or as a double conformer as observed in PDB entry 2Y0G [S1] (C) does not fully satisfy the electron density difference map. Modelling of the double conformer as seen here (D) satisfies the electron density.</p>
          <p>(TIFF)</p>
        </caption>
      </supplementary-material>
      <supplementary-material id="pone.0047132.s003" mimetype="image/tiff" orientation="portrait" position="float" xlink:href="info:doi/10.1371/journal.pone.0047132.s003" xlink:type="simple">
        <label>Figure S3</label>
        <caption>
          <p><bold>Structural comparison of E222 double conformers in the present structure (4EUL) and 2Y0G.</bold> (A) Overlay of all four conformers from 4EUL and 2Y0G. Conformer A and B from 4EUL are coloured green and yellow, respectively. Conformer A and B from 2Y0G [S1] are coloured orange and blue, respectively. The significant difference in placement of the side chain atoms for E22 conformer B in 4EUL in comparison to conformer B in 2Y0G are clearly seen. For clarity, the double conformers of E222 for 2Y0G (B) and 4EUL (C) have also been shown.</p>
          <p>(TIFF)</p>
        </caption>
      </supplementary-material>
      <supplementary-material id="pone.0047132.s004" mimetype="image/tiff" orientation="portrait" position="float" xlink:href="info:doi/10.1371/journal.pone.0047132.s004" xlink:type="simple">
        <label>Figure S4</label>
        <caption>
          <p><bold>Residues with multiple conformers in EGFP.</bold> Electron density difference maps and residues in EGFP with multiple conformers are shown as sticks and coloured green, yellow or grey for conformer A, B or C respectively.</p>
          <p>(TIFF)</p>
        </caption>
      </supplementary-material>
      <supplementary-material id="pone.0047132.s005" mimetype="image/tiff" orientation="portrait" position="float" xlink:href="info:doi/10.1371/journal.pone.0047132.s005" xlink:type="simple">
        <label>Figure S5</label>
        <caption>
          <p><bold>Structural comparison of L18 and L44 in the present structure (4EUL) and 2Y0G.</bold> Overlay of the single observed conformer of Leu18 (A) or L44 (B) for 2Y0G [S1] with conformer A (green) and conformer B (red) observed in the present study (4EUL).</p>
          <p>(TIFF)</p>
        </caption>
      </supplementary-material>
      <supplementary-material id="pone.0047132.s006" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document" orientation="portrait" position="float" xlink:href="info:doi/10.1371/journal.pone.0047132.s006" xlink:type="simple">
        <label>Table S1</label>
        <caption>
          <p>
            <bold>Secondary structure assignment for EGFP and wt GFP.</bold>
          </p>
          <p>(DOCX)</p>
        </caption>
      </supplementary-material>
      <supplementary-material id="pone.0047132.s007" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document" orientation="portrait" position="float" xlink:href="info:doi/10.1371/journal.pone.0047132.s007" xlink:type="simple">
        <label>Methods S1</label>
        <caption>
          <p>
            <bold>Supporting Methods.</bold>
          </p>
          <p>(DOCX)</p>
        </caption>
      </supplementary-material>
      <supplementary-material id="pone.0047132.s008" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document" orientation="portrait" position="float" xlink:href="info:doi/10.1371/journal.pone.0047132.s008" xlink:type="simple">
        <label>References S1</label>
        <caption>
          <p>
            <bold>Supporting References.</bold>
          </p>
          <p>(DOCX)</p>
        </caption>
      </supplementary-material>
    </sec>
  </body>
  <back>
    <ack>
      <p>The authors thank the staff at the Diamond Light Source for the supply of facilities and beamtime, especially Beamline I02 staff. We would like to thank Dr Roger Chittock for advice on fluorescence lifetime measurements. We would like to thank Dr Anna Piasecka and Dr Matthias Bochtler for their help with protein crystalisation and data collection. We would also like to thank Dr Honorata Czapinska for her initial help and guidance with structure refinement.</p>
    </ack>
    <ref-list>
      <title>References</title>
      <ref id="pone.0047132-Shimomura1">
        <label>1</label>
        <mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Shimomura</surname><given-names>O</given-names></name>, <name name-style="western"><surname>Johnson</surname><given-names>FH</given-names></name>, <name name-style="western"><surname>Saiga</surname><given-names>Y</given-names></name> (<year>1962</year>) <article-title>Extraction, purification and properties of aequorin, a bioluminescent protein from the luminous hydromedusan, Aequorea</article-title>. <source>J Cell Comp Phys</source> <volume>59</volume>: <fpage>223</fpage>–<lpage>239</lpage>.</mixed-citation>
      </ref>
      <ref id="pone.0047132-Chalfie1">
        <label>2</label>
        <mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Chalfie</surname><given-names>M</given-names></name>, <name name-style="western"><surname>Tu</surname><given-names>Y</given-names></name>, <name name-style="western"><surname>Euskirchen</surname><given-names>G</given-names></name>, <name name-style="western"><surname>Ward</surname><given-names>WW</given-names></name>, <name name-style="western"><surname>Prasher</surname><given-names>DC</given-names></name> (<year>1994</year>) <article-title>Green fluorescent protein as a marker for gene expression</article-title>. <source>Science</source> <volume>263</volume>: <fpage>802</fpage>–<lpage>805</lpage>.</mixed-citation>
      </ref>
      <ref id="pone.0047132-Tsien1">
        <label>3</label>
        <mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Tsien</surname><given-names>RY</given-names></name> (<year>1998</year>) <article-title>The green fluorescent protein</article-title>. <source>Ann Rev Biochem</source> <volume>67</volume>: <fpage>509</fpage>–<lpage>544</lpage>.</mixed-citation>
      </ref>
      <ref id="pone.0047132-Zhang1">
        <label>4</label>
        <mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Zhang</surname><given-names>J</given-names></name>, <name name-style="western"><surname>Campbell</surname><given-names>RE</given-names></name>, <name name-style="western"><surname>Ting</surname><given-names>AY</given-names></name>, <name name-style="western"><surname>Tsien</surname><given-names>RY</given-names></name> (<year>2002</year>) <article-title>Creating new fluorescent probes for cell biology</article-title>. <source>Nat Rev Mol Cell Biol</source> <volume>3</volume>: <fpage>906</fpage>–<lpage>918</lpage>.</mixed-citation>
      </ref>
      <ref id="pone.0047132-Pakhomov1">
        <label>5</label>
        <mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Pakhomov</surname><given-names>AA</given-names></name>, <name name-style="western"><surname>Martynov</surname><given-names>VI</given-names></name> (<year>2008</year>) <article-title>GFP family: structural insights into spectral tuning</article-title>. <source>Chem Biol</source> <volume>15</volume>: <fpage>755</fpage>–<lpage>764</lpage>.</mixed-citation>
      </ref>
      <ref id="pone.0047132-Zhang2">
        <label>6</label>
        <mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Zhang</surname><given-names>L</given-names></name>, <name name-style="western"><surname>Patel</surname><given-names>HN</given-names></name>, <name name-style="western"><surname>Lappe</surname><given-names>JW</given-names></name>, <name name-style="western"><surname>Wachter</surname><given-names>RM</given-names></name> (<year>2006</year>) <article-title>Reaction progress of chromophore biogenesis in green fluorescent protein</article-title>. <source>J Am Chem Soc</source> <volume>128</volume>: <fpage>4766</fpage>–<lpage>4772</lpage>.</mixed-citation>
      </ref>
      <ref id="pone.0047132-Yang1">
        <label>7</label>
        <mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Yang</surname><given-names>F</given-names></name>, <name name-style="western"><surname>Moss</surname><given-names>LG</given-names></name>, <name name-style="western"><surname>Phillips</surname><given-names>GN</given-names><suffix>Jr</suffix></name> (<year>1996</year>) <article-title>The molecular structure of green fluorescent protein</article-title>. <source>Nat Biotech</source> <volume>14</volume>: <fpage>1246</fpage>–<lpage>1251</lpage>.</mixed-citation>
      </ref>
      <ref id="pone.0047132-Ormo1">
        <label>8</label>
        <mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Ormo</surname><given-names>M</given-names></name>, <name name-style="western"><surname>Cubitt</surname><given-names>AB</given-names></name>, <name name-style="western"><surname>Kallio</surname><given-names>K</given-names></name>, <name name-style="western"><surname>Gross</surname><given-names>LA</given-names></name>, <name name-style="western"><surname>Tsien</surname><given-names>RY</given-names></name>, <etal>et al</etal>. (<year>1996</year>) <article-title>Crystal structure of the Aequorea victoria green fluorescent protein</article-title>. <source>Science</source> <volume>273</volume>: <fpage>1392</fpage>–<lpage>1395</lpage>.</mixed-citation>
      </ref>
      <ref id="pone.0047132-Heim1">
        <label>9</label>
        <mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Heim</surname><given-names>R</given-names></name>, <name name-style="western"><surname>Prasher</surname><given-names>DC</given-names></name>, <name name-style="western"><surname>Tsien</surname><given-names>RY</given-names></name> (<year>1994</year>) <article-title>Wavelength mutations and posttranslational autoxidation of green fluorescent protein</article-title>. <source>Proc Natl Acad Sci USA</source> <volume>91</volume>: <fpage>12501</fpage>–<lpage>12504</lpage>.</mixed-citation>
      </ref>
      <ref id="pone.0047132-LippincottSchwartz1">
        <label>10</label>
        <mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Lippincott-Schwartz</surname><given-names>J</given-names></name>, <name name-style="western"><surname>Patterson</surname><given-names>GH</given-names></name> (<year>2003</year>) <article-title>Development and use of fluorescent protein markers in living cells</article-title>. <source>Science</source> <volume>300</volume>: <fpage>87</fpage>–<lpage>91</lpage>.</mixed-citation>
      </ref>
      <ref id="pone.0047132-Cormack1">
        <label>11</label>
        <mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Cormack</surname><given-names>BP</given-names></name>, <name name-style="western"><surname>Valdivia</surname><given-names>RH</given-names></name>, <name name-style="western"><surname>Falkow</surname><given-names>S</given-names></name> (<year>1996</year>) <article-title>FACS-optimized mutants of the green fluorescent protein (GFP)</article-title>. <source>Gene</source> <volume>173</volume>: <fpage>33</fpage>–<lpage>38</lpage>.</mixed-citation>
      </ref>
      <ref id="pone.0047132-Yang2">
        <label>12</label>
        <mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Yang</surname><given-names>TT</given-names></name>, <name name-style="western"><surname>Cheng</surname><given-names>L</given-names></name>, <name name-style="western"><surname>Kain</surname><given-names>SR</given-names></name> (<year>1996</year>) <article-title>Optimized codon usage and chromophore mutations provide enhanced sensitivity with the green fluorescent protein</article-title>. <source>Nucleic Acids Res</source> <volume>24</volume>: <fpage>4592</fpage>–<lpage>4593</lpage>.</mixed-citation>
      </ref>
      <ref id="pone.0047132-Royant1">
        <label>13</label>
        <mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Royant</surname><given-names>A</given-names></name>, <name name-style="western"><surname>Noirclerc-Savoye</surname><given-names>M</given-names></name> (<year>2011</year>) <article-title>Stabilizing role of glutamic acid 222 in the structure of Enhanced Green Fluorescent Protein</article-title>. <source>J Struc Biol</source> <volume>174</volume>: <fpage>385</fpage>–<lpage>390</lpage>.</mixed-citation>
      </ref>
      <ref id="pone.0047132-Patterson1">
        <label>14</label>
        <mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Patterson</surname><given-names>GH</given-names></name>, <name name-style="western"><surname>Knobel</surname><given-names>SM</given-names></name>, <name name-style="western"><surname>Sharif</surname><given-names>WD</given-names></name>, <name name-style="western"><surname>Kain</surname><given-names>SR</given-names></name>, <name name-style="western"><surname>Piston</surname><given-names>DW</given-names></name> (<year>1997</year>) <article-title>Use of the green fluorescent protein and its mutants in quantitative fluorescence microscopy</article-title>. <source>Biophys J</source> <volume>73</volume>: <fpage>2782</fpage>–<lpage>2790</lpage>.</mixed-citation>
      </ref>
      <ref id="pone.0047132-Budisa1">
        <label>15</label>
        <mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Budisa</surname><given-names>N</given-names></name>, <name name-style="western"><surname>Pal</surname><given-names>PP</given-names></name>, <name name-style="western"><surname>Alefelder</surname><given-names>S</given-names></name>, <name name-style="western"><surname>Birle</surname><given-names>P</given-names></name>, <name name-style="western"><surname>Krywcun</surname><given-names>T</given-names></name>, <etal>et al</etal>. (<year>2004</year>) <article-title>Probing the role of tryptophans in Aequorea victoria green fluorescent proteins with an expanded genetic code</article-title>. <source>Biol Chem</source> <volume>385</volume>: <fpage>191</fpage>–<lpage>202</lpage>.</mixed-citation>
      </ref>
      <ref id="pone.0047132-Steiner1">
        <label>16</label>
        <mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Steiner</surname><given-names>T</given-names></name>, <name name-style="western"><surname>Hess</surname><given-names>P</given-names></name>, <name name-style="western"><surname>Bae</surname><given-names>JH</given-names></name>, <name name-style="western"><surname>Wiltschi</surname><given-names>B</given-names></name>, <name name-style="western"><surname>Moroder</surname><given-names>L</given-names></name>, <etal>et al</etal>. (<year>2008</year>) <article-title>Synthetic biology of proteins: tuning GFPs folding and stability with fluoroproline</article-title>. <source>PloS One</source> <volume>3</volume>: <fpage>e1680</fpage>.</mixed-citation>
      </ref>
      <ref id="pone.0047132-Heim2">
        <label>17</label>
        <mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Heim</surname><given-names>R</given-names></name>, <name name-style="western"><surname>Cubitt</surname><given-names>AB</given-names></name>, <name name-style="western"><surname>Tsien</surname><given-names>RY</given-names></name> (<year>1995</year>) <article-title>Improved green fluorescence</article-title>. <source>Nature</source> <volume>373</volume>: <fpage>663</fpage>–<lpage>664</lpage>.</mixed-citation>
      </ref>
      <ref id="pone.0047132-Brejc1">
        <label>18</label>
        <mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Brejc</surname><given-names>K</given-names></name>, <name name-style="western"><surname>Sixma</surname><given-names>TK</given-names></name>, <name name-style="western"><surname>Kitts</surname><given-names>PA</given-names></name>, <name name-style="western"><surname>Kain</surname><given-names>SR</given-names></name>, <name name-style="western"><surname>Tsien</surname><given-names>RY</given-names></name>, <etal>et al</etal>. (<year>1997</year>) <article-title>Structural basis for dual excitation and photoisomerization of the Aequorea victoria green fluorescent protein</article-title>. <source>Proc Natl Acad Sci U S A</source> <volume>94</volume>: <fpage>2306</fpage>–<lpage>2311</lpage>.</mixed-citation>
      </ref>
      <ref id="pone.0047132-Shu1">
        <label>19</label>
        <mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Shu</surname><given-names>X</given-names></name>, <name name-style="western"><surname>Kallio</surname><given-names>K</given-names></name>, <name name-style="western"><surname>Shi</surname><given-names>X</given-names></name>, <name name-style="western"><surname>Abbyad</surname><given-names>P</given-names></name>, <name name-style="western"><surname>Kanchanawong</surname><given-names>P</given-names></name>, <etal>et al</etal>. (<year>2007</year>) <article-title>Ultrafast excited-state dynamics in the green fluorescent protein variant S65T/H148D. 1. Mutagenesis and structural studies</article-title>. <source>Biochemistry</source> <volume>46</volume>: <fpage>12005</fpage>–<lpage>12013</lpage>.</mixed-citation>
      </ref>
      <ref id="pone.0047132-Stepanenko1">
        <label>20</label>
        <mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Stepanenko</surname><given-names>OV</given-names></name>, <name name-style="western"><surname>Verkhusha</surname><given-names>VV</given-names></name>, <name name-style="western"><surname>Kazakov</surname><given-names>VI</given-names></name>, <name name-style="western"><surname>Shavlovsky</surname><given-names>MM</given-names></name>, <name name-style="western"><surname>Kuznetsova</surname><given-names>IM</given-names></name>, <etal>et al</etal>. (<year>2004</year>) <article-title>Comparative studies on the structure and stability of fluorescent proteins EGFP, zFP506, mRFP1, “dimer2”, and DsRed1</article-title>. <source>Biochemistry</source> <volume>43</volume>: <fpage>14913</fpage>–<lpage>14923</lpage>.</mixed-citation>
      </ref>
      <ref id="pone.0047132-Winter1">
        <label>21</label>
        <mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Winter</surname><given-names>G</given-names></name> (<year>2010</year>) <article-title>xia2: an expert system for macromolecular crystallography data reduction</article-title>. <source>J App Crystallogr</source> <volume>43</volume>: <fpage>186</fpage>–<lpage>190</lpage>.</mixed-citation>
      </ref>
      <ref id="pone.0047132-Evans1">
        <label>22</label>
        <mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Evans</surname><given-names>PR</given-names></name> (<year>2006</year>) <article-title>Scaling and assessment of data quality</article-title>. <source>Acta Cryst</source> <volume>D62</volume>: <fpage>72</fpage>–<lpage>82</lpage>.</mixed-citation>
      </ref>
      <ref id="pone.0047132-CCP41">
        <label>23</label>
        <mixed-citation publication-type="journal" xlink:type="simple"><collab xlink:type="simple">CCP4</collab> (<year>1994</year>) <article-title>The CCP4 suite: programs for protein crystallography</article-title>. <source>Acta Crystallogr D Biol Crystallogr</source> <volume>50</volume>: <fpage>760</fpage>–<lpage>763</lpage>.</mixed-citation>
      </ref>
      <ref id="pone.0047132-Lebedev1">
        <label>24</label>
        <mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Lebedev</surname><given-names>AA</given-names></name>, <name name-style="western"><surname>Vagin</surname><given-names>AA</given-names></name>, <name name-style="western"><surname>Murshudov</surname><given-names>GN</given-names></name> (<year>2008</year>) <article-title>Model preparation in MOLREP and examples of model improvement using X-ray data</article-title>. <source>Acta Crystallogr D Biol Crystallogr</source> <volume>64</volume>: <fpage>33</fpage>–<lpage>39</lpage>.</mixed-citation>
      </ref>
      <ref id="pone.0047132-Emsley1">
        <label>25</label>
        <mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Emsley</surname><given-names>P</given-names></name>, <name name-style="western"><surname>Cowtan</surname><given-names>K</given-names></name> (<year>2004</year>) <article-title>Coot: model-building tools for molecular graphics</article-title>. <source>Acta Crystallogr D Biol Crystallogr</source> <volume>60</volume>: <fpage>2126</fpage>–<lpage>2132</lpage>.</mixed-citation>
      </ref>
      <ref id="pone.0047132-Murshudov1">
        <label>26</label>
        <mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Murshudov</surname><given-names>GN</given-names></name>, <name name-style="western"><surname>Vagin</surname><given-names>AA</given-names></name>, <name name-style="western"><surname>Dodson</surname><given-names>EJ</given-names></name> (<year>1997</year>) <article-title>Refinement of macromolecular structures by the maximum-likelihood method</article-title>. <source>Acta Crystallogr D Biol Crystallogr</source> <volume>53</volume>: <fpage>240</fpage>–<lpage>255</lpage>.</mixed-citation>
      </ref>
    </ref-list>
  </back>
</article>