<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article
  PUBLIC "-//NLM//DTD Journal Publishing DTD v3.0 20080202//EN" "http://dtd.nlm.nih.gov/publishing/3.0/journalpublishing3.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="3.0" xml:lang="en">
<front>
<journal-meta>
<journal-id journal-id-type="nlm-ta">PLoS ONE</journal-id>
<journal-id journal-id-type="publisher-id">plos</journal-id>
<journal-id journal-id-type="pmc">plosone</journal-id><journal-title-group>
<journal-title>PLoS ONE</journal-title></journal-title-group>
<issn pub-type="epub">1932-6203</issn>
<publisher>
<publisher-name>Public Library of Science</publisher-name>
<publisher-loc>San Francisco, USA</publisher-loc></publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="publisher-id">PONE-D-13-44063</article-id>
<article-id pub-id-type="doi">10.1371/journal.pone.0095693</article-id>
<article-categories><subj-group subj-group-type="heading"><subject>Research Article</subject></subj-group><subj-group subj-group-type="Discipline-v2"><subject>Biology and life sciences</subject><subj-group><subject>Computational biology</subject></subj-group><subj-group><subject>Ecology</subject><subj-group><subject>Behavioral ecology</subject></subj-group></subj-group><subj-group><subject>Neuroscience</subject><subj-group><subject>Cognitive science</subject><subj-group><subject>Cognition</subject><subj-group><subject>Memory</subject></subj-group></subj-group><subj-group><subject>Cognitive psychology</subject><subj-group><subject>Learning</subject></subj-group></subj-group></subj-group></subj-group><subj-group><subject>Psychology</subject><subj-group><subject>Behavior</subject><subj-group><subject>Human performance</subject></subj-group></subj-group></subj-group><subj-group><subject>Theoretical biology</subject></subj-group><subj-group><subject>Zoology</subject><subj-group><subject>Animal behavior</subject></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v2"><subject>Ecology and environmental sciences</subject></subj-group><subj-group subj-group-type="Discipline-v2"><subject>Social sciences</subject></subj-group></article-categories>
<title-group>
<article-title>The Exploration-Exploitation Dilemma: A Multidisciplinary Framework</article-title>
<alt-title alt-title-type="running-head">Exploration-Exploitation Framework</alt-title>
</title-group>
<contrib-group>
<contrib contrib-type="author" xlink:type="simple"><name name-style="western"><surname>Berger-Tal</surname><given-names>Oded</given-names></name><xref ref-type="aff" rid="aff1"><sup>1</sup></xref><xref ref-type="corresp" rid="cor1"><sup>*</sup></xref><xref ref-type="fn" rid="fn1"><sup>¤a</sup></xref><xref ref-type="fn" rid="fn2"><sup>¤b</sup></xref></contrib>
<contrib contrib-type="author" equal-contrib="yes" xlink:type="simple"><name name-style="western"><surname>Nathan</surname><given-names>Jonathan</given-names></name><xref ref-type="aff" rid="aff2"><sup>2</sup></xref></contrib>
<contrib contrib-type="author" xlink:type="simple"><name name-style="western"><surname>Meron</surname><given-names>Ehud</given-names></name><xref ref-type="aff" rid="aff2"><sup>2</sup></xref><xref ref-type="aff" rid="aff3"><sup>3</sup></xref></contrib>
<contrib contrib-type="author" xlink:type="simple"><name name-style="western"><surname>Saltz</surname><given-names>David</given-names></name><xref ref-type="aff" rid="aff1"><sup>1</sup></xref></contrib>
</contrib-group>
<aff id="aff1"><label>1</label><addr-line>Mitrani Department of Desert Ecology, Jacob Blaustein Institutes for Desert Research, Ben-Gurion University of the Negev, Midreshet Ben-Gurion, Israel</addr-line></aff>
<aff id="aff2"><label>2</label><addr-line>Department of Solar Energy and Environmental Physics, Jacob Blaustein Institutes for Desert Research, Ben-Gurion University of the Negev, Midreshet Ben-Gurion, Israel</addr-line></aff>
<aff id="aff3"><label>3</label><addr-line>Physics Department, Ben-Gurion University of the Negev, Beer Sheva, Israel</addr-line></aff>
<contrib-group>
<contrib contrib-type="editor" xlink:type="simple"><name name-style="western"><surname>Daunizeau</surname><given-names>Jean</given-names></name>
<role>Editor</role>
<xref ref-type="aff" rid="edit1"/></contrib>
</contrib-group>
<aff id="edit1"><addr-line>Brain and Spine Institute (ICM), France</addr-line></aff>
<author-notes>
<corresp id="cor1">* E-mail: <email xlink:type="simple">oded.berger.tal@gmail.com</email></corresp>
<fn fn-type="conflict"><p>The authors have declared that no competing interests exist.</p></fn>
<fn fn-type="con"><p>Conceived and designed the experiments: OBT JN EM DS. Performed the experiments: OBT JN. Analyzed the data: OBT JN. Contributed reagents/materials/analysis tools: JN EM. Wrote the paper: OBT.</p></fn>
<fn id="fn1" fn-type="current-aff"><label>¤a</label><p>Current address: Department of Ecology and Evolutionary Biology, University of California Los Angeles, Los Angeles, California, United States of America</p></fn>
<fn id="fn2" fn-type="current-aff"><label>¤b</label><p>Current address: Applied Animal Ecology Division, Institute for Conservation Research, San Diego Zoo Global, Escondido, California, United States of America</p></fn>
</author-notes>
<pub-date pub-type="collection"><year>2014</year></pub-date>
<pub-date pub-type="epub"><day>22</day><month>4</month><year>2014</year></pub-date>
<volume>9</volume>
<issue>4</issue>
<elocation-id>e95693</elocation-id>
<history>
<date date-type="received"><day>27</day><month>10</month><year>2013</year></date>
<date date-type="accepted"><day>30</day><month>3</month><year>2014</year></date>
</history>
<permissions>
<copyright-year>2014</copyright-year>
<copyright-holder>Berger-Tal et al</copyright-holder><license xlink:type="simple"><license-p>This is an open-access article distributed under the terms of the <ext-link ext-link-type="uri" xlink:href="http://creativecommons.org/licenses/by/4.0/" xlink:type="simple">Creative Commons Attribution License</ext-link>, which permits unrestricted use, distribution, and reproduction in any medium, provided the original author and source are credited.</license-p></license></permissions>
<abstract>
<p>The trade-off between the need to obtain new knowledge and the need to use that knowledge to improve performance is one of the most basic trade-offs in nature, and optimal performance usually requires some balance between exploratory and exploitative behaviors. Researchers in many disciplines have been searching for the optimal solution to this dilemma. Here we present a novel model in which the exploration strategy itself is dynamic and varies with time in order to optimize a definite goal, such as the acquisition of energy, money, or prestige. Our model produced four very distinct phases: Knowledge establishment, Knowledge accumulation, Knowledge maintenance, and Knowledge exploitation, giving rise to a multidisciplinary framework that applies equally to humans, animals, and organizations. The framework can be used to explain a multitude of phenomena in various disciplines, such as the movement of animals in novel landscapes, the most efficient resource allocation for a start-up company, or the effects of old age on knowledge acquisition in humans.</p>
</abstract>
<funding-group><funding-statement>This study was funded by an Israel Science Foundation (ISF) grant 1397/10, and by a seed grant from the Swiss Institute for Dryland Environmental and Energy Research (SIDEER). The funders had no role in study design, data collection and analysis, decision to publish, or preparation of the manuscript.</funding-statement></funding-group><counts><page-count count="8"/></counts></article-meta>
</front>
<body><sec id="s1">
<title>Introduction</title>
<p>In order to produce high quality science, a scientist needs to be well versed in theory and familiar with other studies in her or his field. However, spending too much time delving into other studies might reduce the time allocated to the scientist’s own research, reducing the quality of the research’s results. Assuming the scientist wants to maximize his/her contribution to science, how much time should he/she spend on acquiring knowledge vs. putting this knowledge to use?</p>
<p>The trade-off between the exploration of new possibilities and the exploitation of old certainties constitutes one of the most basic dilemmas that both individuals and organizations constantly face at multiple time-scales, and has therefore been investigated by researchers from a variety of fields, including economics <xref ref-type="bibr" rid="pone.0095693-Schumpeter1">[1]</xref>–<xref ref-type="bibr" rid="pone.0095693-AzoulaySchwartz1">[3]</xref>, business management <xref ref-type="bibr" rid="pone.0095693-Uotila1">[4]</xref>, <xref ref-type="bibr" rid="pone.0095693-MolinaCastillo1">[5]</xref>, psychology <xref ref-type="bibr" rid="pone.0095693-Daw1">[6]</xref>, <xref ref-type="bibr" rid="pone.0095693-Cohen1">[7]</xref>, computer sciences <xref ref-type="bibr" rid="pone.0095693-Sutton1">[8]</xref> and ecology <xref ref-type="bibr" rid="pone.0095693-Eliassen1">[9]</xref>, <xref ref-type="bibr" rid="pone.0095693-BergerTal1">[10]</xref>. This dilemma stems from the fact that gathering information and exploiting it are in many cases two mutually exclusive activities. These two activities can be viewed as the two extreme strategies at the ends of a continuous scale. At one end of the continuum, an individual or system that only explores (i.e., obtains information about its environment in order to enhance future performance <xref ref-type="bibr" rid="pone.0095693-MettkeHofmann1">[11]</xref>) will pay the costs of obtaining new information without gaining the benefits of knowledge <xref ref-type="bibr" rid="pone.0095693-March1">[2]</xref>. On the other end of the continuum, an individual or system that only exploits (i.e., uses existing knowledge only) will lack the capability to adapt to significant environmental changes and may be trapped in a suboptimal stable equilibrium <xref ref-type="bibr" rid="pone.0095693-March1">[2]</xref>, <xref ref-type="bibr" rid="pone.0095693-Uotila1">[4]</xref>. 
Thus, optimal behavior usually requires some balance between exploratory and exploitative behaviors <xref ref-type="bibr" rid="pone.0095693-March1">[2]</xref>, <xref ref-type="bibr" rid="pone.0095693-Eliassen1">[9]</xref>, <xref ref-type="bibr" rid="pone.0095693-BergerTal1">[10]</xref>.</p>
<p>Most of the studies dealing with the exploration-exploitation tradeoff show optimal solutions that are composed of one or several stationary strategies <xref ref-type="bibr" rid="pone.0095693-Gittins1">[12]</xref>. These could be a point on the exploration-exploitation continuum representing a division of the subject’s resource allocation between exploratory and exploitative behaviors that yields the best long-term rewards under given conditions <xref ref-type="bibr" rid="pone.0095693-Benner1">[13]</xref>, <xref ref-type="bibr" rid="pone.0095693-Gupta1">[14]</xref>, or a point in time in which the subject should switch from a purely explorative strategy to an exploitative one <xref ref-type="bibr" rid="pone.0095693-Gupta1">[14]</xref>, <xref ref-type="bibr" rid="pone.0095693-Burgelman1">[15]</xref>. A more realistic approach should consider the strategy itself as a dynamic component that varies with time in order to optimize a definite goal, such as the acquisition of energy, money, or prestige. If we take the scientist from the opening example, it is reasonable to assume that his/her optimal strategy as a graduate student should differ considerably from his/her optimal strategy once he/she received tenure. Therefore, a key question is how will the optimal solution change with time along the different stages of the scientist’s career? Only very few studies have explored this optimization problem.</p>
<p>The principles of reinforcement learning (RF) theory, a framework originally used for machine learning that is aimed at facilitating adaptation to an environment based on trial and error <xref ref-type="bibr" rid="pone.0095693-Sutton1">[8]</xref>, were applied in computational biology to construct learning algorithms in which an agent can control the balance between exploration and exploitation in an optimal manner <xref ref-type="bibr" rid="pone.0095693-Ishii1">[16]</xref>–<xref ref-type="bibr" rid="pone.0095693-Khamassi1">[18]</xref>. These algorithms are based on a Bayesian modeling approach where the agent’s decisions are the product of a weighted average of some prior knowledge regarding the environment and current sampling information <xref ref-type="bibr" rid="pone.0095693-Jacobs1">[19]</xref>, and the agent’s need to explore is directly based on its perception of the environment, growing whenever the environment changes <xref ref-type="bibr" rid="pone.0095693-Ishii1">[16]</xref>. This is due to the fact that uncertainty should promote exploration <xref ref-type="bibr" rid="pone.0095693-Doya1">[20]</xref> in an attempt to reduce it, and indeed there is evidence that surprising events and changes to the environment promote animals to learn faster <xref ref-type="bibr" rid="pone.0095693-Courville1">[21]</xref>. Such algorithms have been tested and found to produce near optimal results in simulations. Moreover, analogical neurophysiologic pathways in the brain of animals and humans have been suggested, highlighting the neurobiological substrates that are related to the regulation of decision-making <xref ref-type="bibr" rid="pone.0095693-Schweighofer1">[17]</xref>, <xref ref-type="bibr" rid="pone.0095693-Khamassi1">[18]</xref>, <xref ref-type="bibr" rid="pone.0095693-Doya1">[20]</xref>. 
But although RF models are very useful in increasing our understanding of how animals and humans make decisions, they are also very mechanistic in nature and are, in many cases, specifically tailored to solve certain tasks, such as passing through mazes <xref ref-type="bibr" rid="pone.0095693-Ishii1">[16]</xref>, with no attention given to the general motivation and ecological background of the subject. In other words, the abovementioned models have concentrated on the <italic>how</italic> rather than on the <italic>why</italic> of the decision-making process. Furthermore, so far the conclusions of all previous investigations of the exploration-exploitation dilemma are restricted to the discipline in which the study was conducted, and no attempt has been made to create a unifying framework that would be applicable across disciplines.</p>
<p>We present a multidisciplinary general framework of the exploration-exploitation trade-off, motivated by a new mathematical model, in which the balance between exploring new possibilities and exploiting old certainties varies dynamically with time to optimize a predefined goal. In this framework we focus on the optimal exploration-exploitation strategies at different stages of a subject’s life-span.</p>
</sec><sec id="s2" sec-type="methods">
<title>Methods</title>
<p>Our model depicts a subject that can invest in energy acquisition (exploitation) or knowledge acquisition (exploration), according to a strategy that represents the proportion of time the subject invests in knowledge acquisition as a function of time along its lifetime <italic>T</italic><sub>max</sub>. Denoting the subject’s energy and knowledge by <italic>E</italic> and <italic>L</italic>, respectively, and the time-dependent strategy by <italic>u(t)</italic>, the model reads:</p>
<p><inline-formula><inline-graphic xlink:href="info:doi/10.1371/journal.pone.0095693.e001" xlink:type="simple"/></inline-formula> <inline-formula><inline-graphic xlink:href="info:doi/10.1371/journal.pone.0095693.e002" xlink:type="simple"/></inline-formula></p>
<p>According to this model, energy <italic>E</italic> is gained as a saturating function of the existing knowledge <italic>L</italic>, with the half saturation constant <italic>k<sub>L</sub></italic>, so that an increase in knowledge yields a smaller increase in energy gain when existing knowledge is higher. The constant <italic>k<sub>L</sub></italic> can also represent spatial unpredictability – a low value of <italic>k<sub>L</sub></italic> reflects a homogeneous environment in which a low amount of exploration is all the subject requires in order to gain benefits from it, while a high value of <italic>k<sub>L</sub></italic> represents a heterogeneous environment. Energy is lost due to maintenance costs at a constant rate <italic>m</italic>, and also due to knowledge acquisition at a rate proportional to the strategy <italic>u(t).</italic> Knowledge gain is proportional to <italic>u(t),</italic> with efficiency <italic>α</italic>, and knowledge loss due to maintenance costs is proportional to the existing amount of knowledge with a rate <italic>m<sub>L</sub></italic>. A high value of <italic>m<sub>L</sub></italic> (i.e., a high rate of knowledge loss or “forgetting”) can represent low temporal predictability in the environment or, alternatively, the subject’s limited ability to retain stored knowledge. To obtain physically feasible results, we must also add constraints requiring that energy will not become lower than some minimal level needed for survival (<italic>E</italic><sub>min</sub>), and also enforcing positive values of knowledge throughout the simulation:</p>
<p><disp-formula id="pone.0095693.e003"><graphic position="anchor" xlink:href="info:doi/10.1371/journal.pone.0095693.e003" xlink:type="simple"/></disp-formula><disp-formula id="pone.0095693.e004"><graphic position="anchor" xlink:href="info:doi/10.1371/journal.pone.0095693.e004" xlink:type="simple"/></disp-formula></p>
<p>We also require the strategy <italic>u(t)</italic> to be limited by the following constraints: Energy expenditure for exploration, per unit time, cannot have a negative value and should be smaller than the maximal energy acquisition rate <italic>f</italic><sub>max</sub>.</p>
<p><disp-formula id="pone.0095693.e005"><graphic position="anchor" xlink:href="info:doi/10.1371/journal.pone.0095693.e005" xlink:type="simple"/></disp-formula></p>
<p><xref ref-type="table" rid="pone-0095693-t001">Table 1</xref> lists the different parameters used in the model, the range of values which we investigated for each parameter, their units, their meaning, and the initial conditions and constraints of the model.</p>
<table-wrap id="pone-0095693-t001" position="float"><object-id pub-id-type="doi">10.1371/journal.pone.0095693.t001</object-id><label>Table 1</label><caption>
<title>The different parameters that were used in the model and the range of parameter values we investigated (A), and the parameters that were used in solving the optimization problem (B).</title>
</caption><alternatives><graphic id="pone-0095693-t001-1" position="float" mimetype="image" xlink:href="info:doi/10.1371/journal.pone.0095693.t001" xlink:type="simple"/>
<table><colgroup span="1"><col align="left" span="1"/><col align="center" span="1"/><col align="center" span="1"/><col align="center" span="1"/></colgroup>
<thead>
<tr>
<td colspan="4" align="left" rowspan="1">A. Model Parameters</td>
</tr>
<tr>
<td align="left" rowspan="1" colspan="1">Parameter name</td>
<td align="left" rowspan="1" colspan="1">Values</td>
<td align="left" rowspan="1" colspan="1">Units</td>
<td align="left" rowspan="1" colspan="1">Meaning</td>
</tr>
</thead>
<tbody>
<tr>
<td align="left" rowspan="1" colspan="1"><italic>f</italic><sub>max</sub></td>
<td align="left" rowspan="1" colspan="1">[0.5–10]</td>
<td align="left" rowspan="1" colspan="1"><italic>E/t</italic></td>
<td align="left" rowspan="1" colspan="1">Maximal energy consumption rate</td>
</tr>
<tr>
<td align="left" rowspan="1" colspan="1"><italic>k<sub>L</sub></italic></td>
<td align="left" rowspan="1" colspan="1">[0.001–10]</td>
<td align="left" rowspan="1" colspan="1"><italic>L</italic></td>
<td align="left" rowspan="1" colspan="1">Efficiency of foraging: The level of knowledge that will yield half of the maximal consumption rate.</td>
</tr>
<tr>
<td align="left" rowspan="1" colspan="1"><italic>m</italic></td>
<td align="left" rowspan="1" colspan="1">0.02</td>
<td align="left" rowspan="1" colspan="1"><italic>E/t</italic></td>
<td align="left" rowspan="1" colspan="1">Maintenance cost of living</td>
</tr>
<tr>
<td align="left" rowspan="1" colspan="1">α</td>
<td align="left" rowspan="1" colspan="1">[0.5–10]</td>
<td align="left" rowspan="1" colspan="1"><italic>L/E</italic></td>
<td align="left" rowspan="1" colspan="1">Efficiency of learning: Knowledge gain per unit energy.</td>
</tr>
<tr>
<td align="left" rowspan="1" colspan="1"><italic>m<sub>L</sub></italic></td>
<td align="left" rowspan="1" colspan="1">[0.01–1]</td>
<td align="left" rowspan="1" colspan="1">1/<italic>t</italic></td>
<td align="left" rowspan="1" colspan="1">Knowledge maintenance cost (temporal predictability)</td>
</tr>
<tr>
<td align="left" rowspan="1" colspan="1"><italic>T</italic><sub>max</sub></td>
<td align="left" rowspan="1" colspan="1">[5–100]</td>
<td align="left" rowspan="1" colspan="1"><italic>t</italic></td>
<td align="left" rowspan="1" colspan="1">Life duration</td>
</tr>
<tr>
<td colspan="4" align="left" rowspan="1"><bold>B. Optimization problem parameters</bold></td>
</tr>
<tr>
<td align="left" rowspan="1" colspan="1"><bold>Parameter name</bold></td>
<td align="left" rowspan="1" colspan="1"><bold>Values</bold></td>
<td align="left" rowspan="1" colspan="1"><bold>Units</bold></td>
<td align="left" rowspan="1" colspan="1"><bold>Meaning</bold></td>
</tr>
<tr>
<td align="left" rowspan="1" colspan="1"><italic>E</italic>(<italic>t = </italic>0)</td>
<td align="left" rowspan="1" colspan="1">5.5</td>
<td align="left" rowspan="1" colspan="1"><italic>E</italic></td>
<td align="left" rowspan="1" colspan="1">Initial energy</td>
</tr>
<tr>
<td align="left" rowspan="1" colspan="1"><italic>L</italic>(<italic>t = </italic>0)</td>
<td align="left" rowspan="1" colspan="1">0</td>
<td align="left" rowspan="1" colspan="1"><italic>L</italic></td>
<td align="left" rowspan="1" colspan="1">Initial knowledge</td>
</tr>
<tr>
<td align="left" rowspan="1" colspan="1"><italic>E</italic><sub>min</sub></td>
<td align="left" rowspan="1" colspan="1">5</td>
<td align="left" rowspan="1" colspan="1"><italic>E</italic></td>
<td align="left" rowspan="1" colspan="1">Minimal energy for survival</td>
</tr>
<tr>
<td align="left" rowspan="1" colspan="1"><italic>L</italic><sub>min</sub></td>
<td align="left" rowspan="1" colspan="1">0</td>
<td align="left" rowspan="1" colspan="1"><italic>L</italic></td>
<td align="left" rowspan="1" colspan="1">Minimal knowledge</td>
</tr>
<tr>
<td align="left" rowspan="1" colspan="1"><italic>U</italic><sub>min</sub></td>
<td align="left" rowspan="1" colspan="1">0</td>
<td align="left" rowspan="1" colspan="1"><italic>E/t</italic></td>
<td align="left" rowspan="1" colspan="1">Minimal investment in learning</td>
</tr>
<tr>
<td align="left" rowspan="1" colspan="1"><italic>U</italic><sub>max</sub></td>
<td align="left" rowspan="1" colspan="1">1</td>
<td align="left" rowspan="1" colspan="1"><italic>E/t</italic></td>
<td align="left" rowspan="1" colspan="1">Maximal investment in learning</td>
</tr>
</tbody>
</table>
</alternatives></table-wrap>
<p>Each strategy, <italic>u(t)</italic>, corresponds uniquely to a value of energy at the end of life, <italic>E<sub>i</sub>(T</italic><sub>max</sub><italic>)</italic>.</p>
<p>We define the optimal strategy <italic>u<sup>*</sup>(t)</italic> to be the strategy that maximizes the amount of energy at the end of the subject’s life-span, <italic>T</italic><sub>max</sub>. This does not mean that the subject ends its life with stores of wasted energy, since this energy is presumably used during its life-span to produce offspring, increase the subject’s material wealth, etc. In order to find such an optimal strategy one can transform the optimization problem above to a set of differential equations. The rules to make this transformation were formalized by Lev Pontryagin and Richard Bellman, and are now widely known as Optimal Control Theory <xref ref-type="bibr" rid="pone.0095693-Kirk1">[22]</xref>. The differential equations obtained by this method are often quite complicated to solve analytically and may require the use of numerical solution methods. In this work we use an optimization problem solving code for MATLAB (version 7.6.0, MathWorks, Natick, Massachusetts) called <italic>“General Pseudospectral Optimization Software (GPOPS)”</italic>, available freely online <xref ref-type="bibr" rid="pone.0095693-Rao1">[23]</xref>. This code transforms the model, constraints, and optimization criteria using the optimal control scheme into a set of partial differential equations, and proceeds to solve these equations using a numerical pseudospectral method. The solution yields the optimal strategy <italic>u*(t)</italic> that corresponds to the maximal energy gain during lifetime. We used this method iteratively to explore how changing model parameters affects the optimal strategy.</p>
<p>As in all models, we make several simplifying assumptions in the construction of this model. We assume that all parameters, as well as the value of information, remain constant throughout a subject’s life-span. We also assume that the rate of learning is reduced with the accumulation of knowledge. We believe that while these assumptions imply that the model may not apply to some specific cases, they also keep the model general enough to be applicable across disciplines.</p>
</sec><sec id="s3">
<title>Results and Discussion</title>
<p>The model results were very robust, and remarkably produced only four distinct phases that emerged in a fixed order regardless of the parameter values that were assigned. The phases differed in the subject’s relation to knowledge (<xref ref-type="fig" rid="pone-0095693-g001">Fig. 1</xref>) and can be defined as: 1. Knowledge establishment. 2. Knowledge accumulation. 3. Knowledge maintenance. 4. Knowledge exploitation. Each of these phases relates to a different stage in the life-span of the decision making subject, be it a foraging animal, a human or a company. The framework is relevant across disciplines and can be used to explain a multitude of phenomena and allow for better informed decision making.</p>
<fig id="pone-0095693-g001" position="float"><object-id pub-id-type="doi">10.1371/journal.pone.0095693.g001</object-id><label>Figure 1</label><caption>
<title>The four knowledge phases.</title>
<p>The change with time in the subject’s energy state (<italic>E</italic>; panel A, solid blue line), knowledge state (<italic>L</italic>; panel A, dashed green line), and its optimal proportion of time devoted to knowledge acquisition (<italic>u*(t)</italic>; panel B, solid red line). The vertical dashed lines make a distinction between the four life-phases with regards to the exploration-exploitation dilemma: <italic>a</italic>. Knowledge establishment. <italic>b</italic>. Knowledge accumulation. <italic>c</italic>. Knowledge maintenance. <italic>d</italic>. Knowledge exploitation. The parameters used to generate this example are: <italic>f<sub>max</sub></italic> = 1, <italic>k<sub>L</sub></italic> = 1, <italic>m<sub>L</sub></italic> = 0.08, <italic>α</italic> = 1 and <italic>T<sub>max</sub></italic> = 20.</p>
</caption><graphic mimetype="image" xlink:href="info:doi/10.1371/journal.pone.0095693.g001" position="float" xlink:type="simple"/></fig></sec><sec id="s4">
<title>The Four Knowledge Phases</title>
<sec id="s4a">
<title>Knowledge Establishment</title>
<p>In order to exploit any resource, even in the most inefficient manner, the exploiting entity must have some knowledge of its environment. At the very least, knowledge of the existence of a resource and how to reach it are needed. The more is known about alternative resources, ways of obtaining them and various aspects of the environment, the more efficient the exploitation of resources will be. Thus, <italic>knowledge establishment</italic> is an obligatory phase when entering unfamiliar territory, such as for a dispersing or translocated animal, or an emerging company.</p>
<p>During this phase the subject devotes all of its resources to exploration (<xref ref-type="fig" rid="pone-0095693-g001">Fig. 1</xref>). Since the subject does not exploit any resources, it relies solely on its internal reserves (i.e., the energy state of an exploring animal or investors’ funds in an emerging company). Consequently, the length of this phase is mainly determined by the subject’s initial state. A subject that is in a relatively good state can afford to extend this phase considerably, thus improving its future prospects.</p>
<p>It is important to note that both humans and animals frequently use inherited knowledge (that was passed to them genetically or through cultural transmission) when entering an unfamiliar territory, and thus may act upon some prior expectations based on that knowledge. If this knowledge is reliable, these individuals may skip this phase entirely and start their life from the knowledge accumulation phase. However, inherited knowledge may sometimes hinder the utilization of resources <xref ref-type="bibr" rid="pone.0095693-Giraldeau1">[24]</xref>, such as in the case of rapidly changing environments, in which case individuals may be left with diminished resources for the establishment phase.</p>
<p>This phase is commonly apparent in technological ventures where in the early stages of a development project, an exploratory search should be undertaken in an attempt to discover something new, as well as to form exploration alliances <xref ref-type="bibr" rid="pone.0095693-MolinaCastillo1">[5]</xref>, <xref ref-type="bibr" rid="pone.0095693-Rothaermel1">[25]</xref>. In the context of animals, this phase exists in dispersing individuals that have reached unfamiliar territories. It is usually very short, and thus there is very little empirical work investigating it in the wild. However, we do know that captive animals that are introduced to new environments exhibit specific behaviors aimed at exploring their new environment <xref ref-type="bibr" rid="pone.0095693-Avni1">[26]</xref>, <xref ref-type="bibr" rid="pone.0095693-Fryxell1">[27]</xref>. The rapid integration of high resolution GPS collars into wildlife reintroductions <xref ref-type="bibr" rid="pone.0095693-Cagnacci1">[28]</xref> promises exciting advances in this field, as we now have the means to investigate the movement behavior of animals that are released to novel environments to better understand the knowledge establishment phase.</p>
</sec><sec id="s4b">
<title>Knowledge Accumulation</title>
<p>This phase is what most literature dealing with the exploration-exploitation trade-off refers to as the exploration stage. During this phase the subject focuses on obtaining new information while exploiting resources from existing knowledge at a low rate aimed only at keeping the subject at some minimal pre-defined state. Thus, the subject is sacrificing its short-term benefits in order to obtain long-term rewards. As this phase progresses the rate of obtaining new information increases slowly because with the accumulation of knowledge, the exploitation of existing resources becomes more efficient and the subject needs to devote less time and energy to reach its minimum pre-defined state, and can therefore allocate more time and energy for further exploration (<xref ref-type="fig" rid="pone-0095693-g001">Fig. 1</xref>).</p>
<p>Since exploratory behavior is such a fundamental behavior in both humans and animals <xref ref-type="bibr" rid="pone.0095693-Fonio1">[29]</xref>, there have been many attempts to describe and characterize the behavior of individuals in novel environments. Some of the more in-depth studies of exploratory behavior have been done on rodents, but even within these studies, exploratory behavior varies according to the species and context. Laboratory mice introduced to a novel arena showed exploratory behavior of increasing complexity, first examining their nest’s surroundings, then progressively the walls around the arena and only later venturing to the center of the arena <xref ref-type="bibr" rid="pone.0095693-Fonio1">[29]</xref>. A similar behavior was performed by fat sand rats, <italic>Psammomys obesus</italic>, under lit conditions, but in the dark the rats performed looping behavior, in which travel paths tangle into loops <xref ref-type="bibr" rid="pone.0095693-Avni1">[26]</xref>. Outside the laboratory, brown rats, <italic>Rattus norvegicus</italic>, released into the wild, exhibited random walk patterns, increasing in perimeter with time and mediated by central place foraging behavior <xref ref-type="bibr" rid="pone.0095693-Russel1">[30]</xref>. Whatever the exploration method is, in all of these cases the behavior of the animals is clearly primarily aimed at increasing their knowledge about their surroundings and not at the acquisition of resources. Thus, all of these different exploration mechanisms ultimately represent the same phase – <italic>knowledge accumulation</italic>.</p>
<p>The subject’s time horizon (<italic>T</italic><sub>max</sub>) is an important factor determining the length of this phase. Because there is a temporal gap between paying the short-term costs of accumulating knowledge (i.e., exploring) and reaping the benefits of information, subjects with short life-spans should invest less in accumulating knowledge, since for them the benefits of knowing more are greatly reduced. Indeed, numerous studies on humans and animals report that as the relevant time horizon decreases, so does the tendency of the subject to explore <xref ref-type="bibr" rid="pone.0095693-Eliassen1">[9]</xref>, <xref ref-type="bibr" rid="pone.0095693-Khamassi1">[18]</xref>, <xref ref-type="bibr" rid="pone.0095693-Carstensen1">[31]</xref>. A limited time horizon can stem from the time left available for a specific task <xref ref-type="bibr" rid="pone.0095693-Krebs1">[32]</xref> or the age of the subject <xref ref-type="bibr" rid="pone.0095693-Wajnberg1">[33]</xref>. Increasing the time-span of a learning subject will lengthen the <italic>knowledge accumulation</italic> period, but only up to a certain value. Because of cognitive or physiological constraints, as well as environmental stochasticity (that in most cases cannot be fully predicted), there is a limit to the benefits of exploration. Thus, eventually the exploring subject reaches a point in which additional exploration does not improve its future prospects and this phase becomes constant (decreasing the relative weight of this phase as the subject’s life-span increases, <xref ref-type="fig" rid="pone-0095693-g002">Fig. 2a</xref>).</p>
<fig id="pone-0095693-g002" position="float"><object-id pub-id-type="doi">10.1371/journal.pone.0095693.g002</object-id><label>Figure 2</label><caption>
<title>The optimal knowledge phases as a function of age and environment.</title>
<p>The four optimal knowledge phases (dark blue - knowledge establishment, light blue - knowledge accumulation, orange - knowledge maintenance, red - knowledge exploitation) as a function of the subject ‘age’ (i.e., its position on its life-span trajectory, normalized here to a scale of 0–1), and different parameter values: (A) <italic>T<sub>max</sub></italic> - length of life-span. (B) <italic>m<sub>L</sub></italic> - rate of knowledge loss. (C) <italic>k<sub>L</sub></italic> - learning half saturation constant representing the environmental spatial predictability. (D) <italic>alpha</italic> - learning efficiency. In all simulations, the values of all parameters not tested (e.g., for plate A - all parameters but <italic>T<sub>max</sub></italic>) are as described for <xref ref-type="fig" rid="pone-0095693-g001">figure 1</xref>.</p>
</caption><graphic mimetype="image" xlink:href="info:doi/10.1371/journal.pone.0095693.g002" position="float" xlink:type="simple"/></fig>
<p>The environment’s temporal unpredictability (<italic>m<sub>L</sub></italic>), which can reflect either external conditions that change with time (such as a highly fluid market environment), or the subject’s own cognitive abilities and liabilities (such as memory capacity or decay), will also determine the length of the knowledge accumulation period. The more unpredictable the environment is, the harder it is to make predictions about the future state of the environment, which lowers the value of exploration (<xref ref-type="fig" rid="pone-0095693-g002">Fig. 2b</xref>). This result is supported by both theoretical models of learning in stochastic environments and empirical studies with humans <xref ref-type="bibr" rid="pone.0095693-Doya1">[20]</xref>, <xref ref-type="bibr" rid="pone.0095693-Eliassen2">[34]</xref>, <xref ref-type="bibr" rid="pone.0095693-Greville1">[35]</xref>.</p>
<p>As the spatial unpredictability (<italic>k<sub>L</sub></italic>) of the environment decreases (i.e., as the environment becomes more homogeneous) the need for exploration is reduced, and in extremely predictable conditions the knowledge gained during the <italic>knowledge establishment</italic> period is sufficient for optimal exploitation, eliminating the <italic>knowledge accumulation</italic> phase (<xref ref-type="fig" rid="pone-0095693-g002">Fig. 2c</xref>). Lastly, the learning efficiency (<italic>α</italic>) of the subject will determine the length of the <italic>knowledge accumulation</italic> period. An extremely efficient learner already accumulates enough knowledge during the knowledge establishment period, and can skip the accumulation stage altogether. In contrast, for an inefficient learner the accumulation period is greatly extended to allow for the accumulation of sufficient information for optimal exploitation of resources at a later stage (<xref ref-type="fig" rid="pone-0095693-g002">Fig. 2d</xref>).</p>
</sec><sec id="s4c">
<title>Knowledge Maintenance</title>
<p>In this phase the subject focuses on the utilization of resources while maintaining its knowledge at a constant optimal level, i.e., learning is only used to replace lost information or update existing knowledge. The leveling of the knowledge curve (<xref ref-type="fig" rid="pone-0095693-g001">Fig. 1</xref>) represents an optimal level of knowledge. Obtaining additional knowledge is too costly (because of the saturating shape of the energy gain function) when weighed against the benefits of knowledge and the rate of knowledge loss (<italic>m<sub>L</sub></italic>).</p>
<p>For animals foraging in heterogeneous landscapes with renewable resources, trap-lining, defined as repeated visitation to a series of resource patches in a predictable order, is usually the most beneficial foraging strategy <xref ref-type="bibr" rid="pone.0095693-Ohashi1">[36]</xref>, and has been reported for a wide variety of species <xref ref-type="bibr" rid="pone.0095693-Watts1">[37]</xref>–<xref ref-type="bibr" rid="pone.0095693-Garrison1">[39]</xref>. Trap-lining foragers utilize resources based on existing knowledge, but since the environment is constantly changing, some method of updating the forager’s information regarding its environment is needed for it to avoid getting ‘stuck’ in an inefficient foraging route. Indeed, several cognitive mechanisms for updating trap-lines have been suggested <xref ref-type="bibr" rid="pone.0095693-BergerTal1">[10]</xref>, <xref ref-type="bibr" rid="pone.0095693-Ohashi1">[36]</xref>. One suggested mechanism that can control both this phase as well as the <italic>knowledge accumulation</italic> phase is the adding of a (usually positive) bias to the subject’s estimation of its environment when it encounters a novel environment (or alternatively, the adding of stochastic variability to its estimate). This idea originates from the field of RL and machine learning <xref ref-type="bibr" rid="pone.0095693-Sutton1">[8]</xref>, <xref ref-type="bibr" rid="pone.0095693-Gullapalli1">[40]</xref>, but has lately been expanded to explain animal behavior <xref ref-type="bibr" rid="pone.0095693-BergerTal1">[10]</xref>, <xref ref-type="bibr" rid="pone.0095693-McNamara1">[41]</xref>. A positively biased estimation of the environment encourages exploration by motivating the subject to keep looking for better rewards. As the subject explores, it constantly updates its estimate of the environment, reducing its initial bias. 
Thus, the longer it explores, the more realistic this estimation will become, until eventually the subject will cease exploration and move into the knowledge maintenance phase. The same mechanism will also ensure that the subject maintains its knowledge in the maintenance phase. Either the stochastic error in the subject’s learning mechanism will keep it exploring to some degree throughout this phase, or alternatively, in the case of an initially biased estimation, whenever the subject encounters a lower than usual reward, as a result of some degradation in the quality of the familiar environment, it will again possess an estimate that is higher than the rewards it acquires, which will send it exploring for a better alternative.</p>
<p>In business management, during the <italic>knowledge maintenance</italic> phase, knowledge regarding existing products is used and maintained, but new lines of products are not pursued <xref ref-type="bibr" rid="pone.0095693-March1">[2]</xref>, <xref ref-type="bibr" rid="pone.0095693-Gupta1">[14]</xref>. The maintenance of knowledge is essential to effectively manage the inevitable errors and changes that are associated with knowledge storage bases, and is therefore considered an essential element of knowledge management <xref ref-type="bibr" rid="pone.0095693-Nevo1">[42]</xref>.</p>
<p>Just as in the <italic>knowledge accumulation</italic> phase, a short time horizon will reduce the length of the <italic>knowledge maintenance</italic> phase, or even eliminate it altogether (<xref ref-type="fig" rid="pone-0095693-g002">Fig. 2a</xref>). When the subject’s time-span is very short, it will be sub-optimal to spend any time learning new information, even if only to maintain the subject’s current knowledge. However, unlike the <italic>knowledge accumulation</italic> phase, as the time-span of the subject expands so does the amount of time devoted to <italic>knowledge maintenance</italic>. During this phase the subject reaps the rewards of past explorations, and thus the longer this period lasts, the more the subject gains.</p>
<p>This phase is strongly affected by the environment’s temporal unpredictability. In an environment that is predictable (as a result of stable conditions and low memory decay of the subject) this phase diminishes as the knowledge that was acquired earlier does not need maintaining and the subject should focus only on exploiting it. On the other hand, in a very fluid (and hence, unpredictable) environment, this phase replaces the <italic>knowledge accumulation</italic> phase simply because there is no point in accumulating knowledge for future use in a constantly changing environment and the subject should focus on continuous learning while exploiting resources (<xref ref-type="fig" rid="pone-0095693-g002">Fig. 2b</xref>). The learning efficiency of the subject produces a similar trend - when it is very low, there is no use in trying to maintain knowledge, since the benefits of investing only partial efforts in learning are close to nil. In this case the subject should concentrate only on the exploitation of knowledge once its <italic>knowledge accumulation</italic> phase is over. When the learning efficiency is especially high the amount of resources devoted to learning during this phase can be maintained at a very low level, and it can replace much of the <italic>knowledge accumulation</italic> phase (<xref ref-type="fig" rid="pone-0095693-g002">Fig. 2d</xref>).</p>
</sec><sec id="s4d">
<title>Knowledge Exploitation</title>
<p>This phase arrives towards the end of a subject’s life-span, and is characterized by a learning investment of 0. As the end approaches, it is sub-optimal to continue investing in gaining new information and the subject should invest its time only in exploiting the knowledge it had already accumulated, temporarily increasing its intake rate of resources (<xref ref-type="fig" rid="pone-0095693-g001">Fig. 1</xref>). It is worthwhile to note that in most cases a subject will have no prior information on its expected life-span. However, there are usually detectable cues that can inform the subject it is approaching the end of its life.</p>
<p>We do not presume to suggest a mechanistic explanation for the effects of old age on learning performance. However, from an evolutionary perspective, our framework corresponds to several of the main paradigms of the psychology of human aging. It is common knowledge that the processing of information and memory in humans decay in old age <xref ref-type="bibr" rid="pone.0095693-Birren1">[43]</xref>. Moreover, with respect to reading, older subjects show a substantial decline in their working memory, but an increase in their use of prior knowledge <xref ref-type="bibr" rid="pone.0095693-Meyer1">[44]</xref>. Three processing styles have been identified in relation to age <xref ref-type="bibr" rid="pone.0095693-Sinnott1">[45]</xref>: The ‘youthful’ style focuses on learning, intense data gathering and bottom-up processing. The ‘mature’ style balances the use of relevant knowledge and information seeking, and the ‘old’ style relies on top-down processing, making use of existing knowledge. This notion that aging is accompanied by an increase in top-down processes pervades recent literature on language in old age <xref ref-type="bibr" rid="pone.0095693-Thornton1">[46]</xref>, <xref ref-type="bibr" rid="pone.0095693-Burke1">[47]</xref>.</p>
<p>Another popular theory that supports our framework is the Socioemotional Selectivity Theory <xref ref-type="bibr" rid="pone.0095693-Carstensen1">[31]</xref>, <xref ref-type="bibr" rid="pone.0095693-Carstensen2">[48]</xref>, <xref ref-type="bibr" rid="pone.0095693-Carstensen3">[49]</xref>. The theory proposes two primary motivations for social interactions: emotion regulation and knowledge acquisition. The perceived time-span of an individual determines the relative importance of these motivational objectives. A long time-horizon tends to be related to knowledge acquisition goals, while a limited time-horizon tends to be related to emotion regulation goals. Because of their limited future time extension, older adults are assumed to be less motivated to acquire knowledge. The theory has received empirical support in a variety of studies <xref ref-type="bibr" rid="pone.0095693-Carstensen4">[50]</xref>, <xref ref-type="bibr" rid="pone.0095693-Riediger1">[51]</xref>. While this can also be explained by the biological fact that the cognitive abilities in humans decay in older people, empirical evidence demonstrates that young people with a limited time horizon (such as terminally ill patients) show similar tendencies to forgo knowledge acquisition <xref ref-type="bibr" rid="pone.0095693-Riediger1">[51]</xref>, <xref ref-type="bibr" rid="pone.0095693-Fung1">[52]</xref>.</p>
<p>It is interesting to note that for very short <italic>T</italic><sub>max</sub> only two phases emerge - knowledge establishment and knowledge exploitation. Animals with very short life-spans are usually also very small (as they do not have the time to invest in a large body). Small size and a short life-span may promote a more homogeneous environment in space and time (e.g., the animal only lives through one season and forages in a single habitat), which means that there is no need to maintain the knowledge and once enough knowledge is acquired, the animal can immediately switch to the exploitation of resources with no further investment in learning. As lifetime increases, animals need to deal with a more complex environment (more seasons, more habitats), and thus knowledge accumulation and maintenance stages are added to their life-time strategy.</p>
</sec></sec><sec id="s5">
<title>Conclusions</title>
<p>We provide a unifying framework of the exploration-exploitation trade-off, a trade-off prevalent in many disciplines and situations. It is important to note that the timeline presented in our model is restricted to monotonic linear time changes (e.g., lifetime of a human; lifetime of an economic project). However, the model could be easily extended to account for non-linear time-frames. For example, a major change to the environment (e.g., a flood that changes the entire topography, or an economic crisis that changes the entire economic landscape) can force a subject to revert from the <italic>knowledge maintenance</italic> or even the <italic>knowledge exploitation</italic> phases back to the <italic>knowledge accumulation</italic> or <italic>knowledge establishment</italic> phases. Similarly, there can be cases in which the entire sequence of four phases can occur multiple times within a subject’s life-span, such as in the case of animals that disperse to new areas several times during their lifetime. In such cases, the length of each sequence can change with time and ‘dispersal experience’, i.e., the explorative phases of an animal dispersing for the first time may be considerably longer than for an animal dispersing to an unfamiliar area for the fifth time in its life.</p>
<p>Our framework demonstrates that the optimal solution to the exploration-exploitation trade-off depends on the life-stage of the subject as well as on the environmental conditions, and that the same strategies can be used by a variety of subjects - animals, humans and organizations alike. This fact points to the universality of the exploration-exploitation dilemma and the strategies aimed at solving it. Thus, the proposed framework can improve our understanding and, consequently, our decision making in a multitude of disciplines.</p>
</sec></body>
<back>
<ack>
<p>O. B-T. is supported by the Adams Fellowship Program of the Israel Academy of Sciences and Humanities. This is publication number 828 of the Mitrani Department of Desert Ecology.</p>
</ack>
<ref-list>
<title>References</title>
<ref id="pone.0095693-Schumpeter1"><label>1</label>
<mixed-citation publication-type="other" xlink:type="simple">Schumpeter JA (1934) The theory of economic development. Cambridge: Harvard University Press.</mixed-citation>
</ref>
<ref id="pone.0095693-March1"><label>2</label>
<mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>March</surname><given-names>JG</given-names></name> (<year>1991</year>) <article-title>Exploration and exploitation in organizational learning</article-title>. <source>Organ Sci</source> <volume>2</volume>: <fpage>71</fpage>–<lpage>87</lpage>.</mixed-citation>
</ref>
<ref id="pone.0095693-AzoulaySchwartz1"><label>3</label>
<mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Azoulay-Schwartz</surname><given-names>R</given-names></name>, <name name-style="western"><surname>Kraus</surname><given-names>S</given-names></name>, <name name-style="western"><surname>Wilkenfeld</surname><given-names>J</given-names></name> (<year>2004</year>) <article-title>Exploitation vs. exploration: choosing a supplier in an environment of incomplete information</article-title>. <source>Decis Support Syst</source> <volume>38</volume>: <fpage>1</fpage>–<lpage>18</lpage>.</mixed-citation>
</ref>
<ref id="pone.0095693-Uotila1"><label>4</label>
<mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Uotila</surname><given-names>J</given-names></name>, <name name-style="western"><surname>Maula</surname><given-names>M</given-names></name>, <name name-style="western"><surname>Keil</surname><given-names>T</given-names></name>, <name name-style="western"><surname>Zahra</surname><given-names>SA</given-names></name> (<year>2009</year>) <article-title>Exploration, exploitation, and financial performance: analysis of S&amp;P 500 corporations</article-title>. <source>Strat Mgmt J</source> <volume>30</volume>: <fpage>221</fpage>–<lpage>231</lpage>.</mixed-citation>
</ref>
<ref id="pone.0095693-MolinaCastillo1"><label>5</label>
<mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Molina-Castillo</surname><given-names>F-J</given-names></name>, <name name-style="western"><surname>Jimenez-Jimenez</surname><given-names>D</given-names></name>, <name name-style="western"><surname>Munuera-Aleman</surname><given-names>J-L</given-names></name> (<year>2011</year>) <article-title>Product competence exploitation and exploration strategies: the impact on new product performance through quality and innovativeness</article-title>. <source>Ind Market Manag</source> <volume>40</volume>: <fpage>1172</fpage>–<lpage>1182</lpage>.</mixed-citation>
</ref>
<ref id="pone.0095693-Daw1"><label>6</label>
<mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Daw</surname><given-names>ND</given-names></name>, <name name-style="western"><surname>O’Doherty</surname><given-names>JP</given-names></name>, <name name-style="western"><surname>Dayan</surname><given-names>P</given-names></name>, <name name-style="western"><surname>Seymour</surname><given-names>B</given-names></name>, <name name-style="western"><surname>Dolan</surname><given-names>RJ</given-names></name> (<year>2006</year>) <article-title>Cortical substrates for exploratory decisions in humans</article-title>. <source>Nature</source> <volume>441</volume>: <fpage>876</fpage>–<lpage>879</lpage>.</mixed-citation>
</ref>
<ref id="pone.0095693-Cohen1"><label>7</label>
<mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Cohen</surname><given-names>JD</given-names></name>, <name name-style="western"><surname>McClure</surname><given-names>SM</given-names></name>, <name name-style="western"><surname>Yu</surname><given-names>AJ</given-names></name> (<year>2007</year>) <article-title>Should I stay or should I go? How the human brain manages the trade-off between exploitation and exploration</article-title>. <source>Phil Trans R Soc B</source> <volume>362</volume>: <fpage>933</fpage>–<lpage>942</lpage>.</mixed-citation>
</ref>
<ref id="pone.0095693-Sutton1"><label>8</label>
<mixed-citation publication-type="other" xlink:type="simple">Sutton RS, Barto AG (1998) Reinforcement learning: an introduction. Cambridge: MIT Press.</mixed-citation>
</ref>
<ref id="pone.0095693-Eliassen1"><label>9</label>
<mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Eliassen</surname><given-names>S</given-names></name>, <name name-style="western"><surname>Jorgensen</surname><given-names>C</given-names></name>, <name name-style="western"><surname>Mangel</surname><given-names>M</given-names></name>, <name name-style="western"><surname>Giske</surname><given-names>J</given-names></name> (<year>2007</year>) <article-title>Exploration or exploitation: life expectancy changes the value of learning in foraging strategies</article-title>. <source>Oikos</source> <volume>116</volume>: <fpage>513</fpage>–<lpage>523</lpage>.</mixed-citation>
</ref>
<ref id="pone.0095693-BergerTal1"><label>10</label>
<mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Berger-Tal</surname><given-names>O</given-names></name>, <name name-style="western"><surname>Avgar</surname><given-names>T</given-names></name> (<year>2012</year>) <article-title>The glass is half full: Overestimating the quality of a novel environment is advantageous</article-title>. <source>PLoS ONE</source> <volume>7</volume>: <fpage>e34578</fpage>.</mixed-citation>
</ref>
<ref id="pone.0095693-MettkeHofmann1"><label>11</label>
<mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Mettke-Hofmann</surname><given-names>C</given-names></name>, <name name-style="western"><surname>Winkler</surname><given-names>H</given-names></name>, <name name-style="western"><surname>Leisler</surname><given-names>B</given-names></name> (<year>2002</year>) <article-title>The significance of ecological factors for exploration and neophobia in parrots</article-title>. <source>Ethology</source> <volume>108</volume>: <fpage>249</fpage>–<lpage>272</lpage>.</mixed-citation>
</ref>
<ref id="pone.0095693-Gittins1"><label>12</label>
<mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Gittins</surname><given-names>JC</given-names></name> (<year>1979</year>) <article-title>Bandit processes and dynamic allocation indices</article-title>. <source>J R Stat Soc B</source> <volume>41</volume>: <fpage>148</fpage>–<lpage>177</lpage>.</mixed-citation>
</ref>
<ref id="pone.0095693-Benner1"><label>13</label>
<mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Benner</surname><given-names>MJ</given-names></name>, <name name-style="western"><surname>Tushman</surname><given-names>ML</given-names></name> (<year>2003</year>) <article-title>Exploitation, exploration, and process management: the productivity dilemma revisited</article-title>. <source>Acad Manage Rev</source> <volume>28</volume>: <fpage>238</fpage>–<lpage>256</lpage>.</mixed-citation>
</ref>
<ref id="pone.0095693-Gupta1"><label>14</label>
<mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Gupta</surname><given-names>AK</given-names></name>, <name name-style="western"><surname>Smith</surname><given-names>KG</given-names></name>, <name name-style="western"><surname>Shalley</surname><given-names>CE</given-names></name> (<year>2006</year>) <article-title>The interplay between exploration and exploitation</article-title>. <source>Acad Manage J</source> <volume>49</volume>: <fpage>693</fpage>–<lpage>706</lpage>.</mixed-citation>
</ref>
<ref id="pone.0095693-Burgelman1"><label>15</label>
<mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Burgelman</surname><given-names>RA</given-names></name> (<year>2002</year>) <article-title>Strategy as a vector and the inertia of coevolutionary lock-in</article-title>. <source>Admin Sci Quart</source> <volume>47</volume>: <fpage>325</fpage>–<lpage>357</lpage>.</mixed-citation>
</ref>
<ref id="pone.0095693-Ishii1"><label>16</label>
<mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Ishii</surname><given-names>S</given-names></name>, <name name-style="western"><surname>Yoshida</surname><given-names>W</given-names></name>, <name name-style="western"><surname>Yoshimoto</surname><given-names>J</given-names></name> (<year>2002</year>) <article-title>Control of exploitation-exploration meta-parameter in reinforcement learning</article-title>. <source>Neural Networks</source> <volume>15</volume>: <fpage>665</fpage>–<lpage>687</lpage>.</mixed-citation>
</ref>
<ref id="pone.0095693-Schweighofer1"><label>17</label>
<mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Schweighofer</surname><given-names>N</given-names></name>, <name name-style="western"><surname>Doya</surname><given-names>K</given-names></name> (<year>2003</year>) <article-title>Meta-learning in reinforcement learning</article-title>. <source>Neural Networks</source> <volume>16</volume>: <fpage>5</fpage>–<lpage>9</lpage>.</mixed-citation>
</ref>
<ref id="pone.0095693-Khamassi1"><label>18</label>
<mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Khamassi</surname><given-names>M</given-names></name>, <name name-style="western"><surname>Enel</surname><given-names>P</given-names></name>, <name name-style="western"><surname>Dominey</surname><given-names>PF</given-names></name>, <name name-style="western"><surname>Procyk</surname><given-names>E</given-names></name> (<year>2012</year>) <article-title>Medial prefrontal cortex and the adaptive regulation of reinforcement learning parameters</article-title>. <source>Prog Brain Res</source> <volume>202</volume>: <fpage>441</fpage>–<lpage>464</lpage>.</mixed-citation>
</ref>
<ref id="pone.0095693-Jacobs1"><label>19</label>
<mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Jacobs</surname><given-names>RA</given-names></name>, <name name-style="western"><surname>Kruschke</surname><given-names>JK</given-names></name> (<year>2011</year>) <article-title>Bayesian learning theory applied to human cognition</article-title>. <source>Wiley Interdiscip Rev Cogn Sci</source> <volume>2</volume>: <fpage>8</fpage>–<lpage>21</lpage>.</mixed-citation>
</ref>
<ref id="pone.0095693-Doya1"><label>20</label>
<mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Doya</surname><given-names>K</given-names></name> (<year>2008</year>) <article-title>Modulators of decision making</article-title>. <source>Nat Neurosci</source> <volume>11</volume>: <fpage>410</fpage>–<lpage>416</lpage>.</mixed-citation>
</ref>
<ref id="pone.0095693-Courville1"><label>21</label>
<mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Courville</surname><given-names>AC</given-names></name>, <name name-style="western"><surname>Daw</surname><given-names>ND</given-names></name>, <name name-style="western"><surname>Touretzky</surname><given-names>DS</given-names></name> (<year>2006</year>) <article-title>Bayesian theories of conditioning in a changing world</article-title>. <source>Trends Cogn Sci</source> <volume>10</volume>: <fpage>294</fpage>–<lpage>300</lpage>.</mixed-citation>
</ref>
<ref id="pone.0095693-Kirk1"><label>22</label>
<mixed-citation publication-type="other" xlink:type="simple">Kirk DE (2004) Optimal control theory. Mineola: Dover Publications.</mixed-citation>
</ref>
<ref id="pone.0095693-Rao1"><label>23</label>
<mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Rao</surname><given-names>AV</given-names></name>, <name name-style="western"><surname>Benson</surname><given-names>DA</given-names></name>, <name name-style="western"><surname>Darby</surname><given-names>C</given-names></name>, <name name-style="western"><surname>Patterson</surname><given-names>MA</given-names></name>, <name name-style="western"><surname>Francolin</surname><given-names>C</given-names></name>, <etal>et al</etal>. (<year>2010</year>) <article-title>Algorithm 902: GPOPS, a MATLAB software for solving multiple-phase optimal control problems using the gauss pseudospectral method</article-title>. <source>ACM T Math Software</source> <volume>37</volume>: <fpage>1</fpage>–<lpage>39</lpage>.</mixed-citation>
</ref>
<ref id="pone.0095693-Giraldeau1"><label>24</label>
<mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Giraldeau</surname><given-names>L-A</given-names></name>, <name name-style="western"><surname>Valone</surname><given-names>TJ</given-names></name>, <name name-style="western"><surname>Templeton</surname><given-names>JJ</given-names></name> (<year>2002</year>) <article-title>Potential disadvantages of using socially acquired information</article-title>. <source>Phil Trans R Soc Lond B</source> <volume>357</volume>: <fpage>1559</fpage>–<lpage>1566</lpage>.</mixed-citation>
</ref>
<ref id="pone.0095693-Rothaermel1"><label>25</label>
<mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Rothaermel</surname><given-names>FT</given-names></name>, <name name-style="western"><surname>Leeds</surname><given-names>DL</given-names></name> (<year>2004</year>) <article-title>Exploration and exploitation alliances in biotechnology: a system of new product development</article-title>. <source>Strat Mgmt J</source> <volume>25</volume>: <fpage>201</fpage>–<lpage>221</lpage>.</mixed-citation>
</ref>
<ref id="pone.0095693-Avni1"><label>26</label>
<mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Avni</surname><given-names>R</given-names></name>, <name name-style="western"><surname>Eilam</surname><given-names>D</given-names></name> (<year>2008</year>) <article-title>On the border: perimeter patrolling as a transitional exploratory phase in a diurnal rodent, the fat sand rat (<italic>Psammomys obesus</italic>)</article-title>. <source>Anim Cogn</source> <volume>11</volume>: <fpage>311</fpage>–<lpage>318</lpage>.</mixed-citation>
</ref>
<ref id="pone.0095693-Fryxell1"><label>27</label>
<mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Fryxell</surname><given-names>JM</given-names></name>, <name name-style="western"><surname>Hazell</surname><given-names>M</given-names></name>, <name name-style="western"><surname>Borger</surname><given-names>L</given-names></name>, <name name-style="western"><surname>Dalziel</surname><given-names>BD</given-names></name>, <name name-style="western"><surname>Haydon</surname><given-names>DT</given-names></name>, <etal>et al</etal>. (<year>2008</year>) <article-title>Multiple movement modes by large herbivores at multiple spatiotemporal scales</article-title>. <source>Proc Natl Acad Sci USA</source> <volume>105</volume>: <fpage>19114</fpage>–<lpage>19119</lpage>.</mixed-citation>
</ref>
<ref id="pone.0095693-Cagnacci1"><label>28</label>
<mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Cagnacci</surname><given-names>F</given-names></name>, <name name-style="western"><surname>Boitani</surname><given-names>L</given-names></name>, <name name-style="western"><surname>Powell</surname><given-names>RA</given-names></name>, <name name-style="western"><surname>Boyce</surname><given-names>MS</given-names></name> (<year>2010</year>) <article-title>Animal ecology meets GPS-based radiotelemetry: a perfect storm of opportunities and challenges</article-title>. <source>Phil Trans R Soc B</source> <volume>365</volume>: <fpage>2157</fpage>–<lpage>2162</lpage>.</mixed-citation>
</ref>
<ref id="pone.0095693-Fonio1"><label>29</label>
<mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Fonio</surname><given-names>E</given-names></name>, <name name-style="western"><surname>Benjamini</surname><given-names>Y</given-names></name>, <name name-style="western"><surname>Golani</surname><given-names>I</given-names></name> (<year>2009</year>) <article-title>Freedom of movement and the stability of its unfolding in free exploration of mice</article-title>. <source>Proc Natl Acad Sci USA</source> <volume>106</volume>: <fpage>21335</fpage>–<lpage>21340</lpage>.</mixed-citation>
</ref>
<ref id="pone.0095693-Russel1"><label>30</label>
<mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Russell</surname><given-names>JC</given-names></name>, <name name-style="western"><surname>McMorland</surname><given-names>AJC</given-names></name>, <name name-style="western"><surname>MacKay</surname><given-names>JWB</given-names></name> (<year>2010</year>) <article-title>Exploratory behaviour of colonizing rats in novel environments</article-title>. <source>Anim Behav</source> <volume>79</volume>: <fpage>159</fpage>–<lpage>164</lpage>.</mixed-citation>
</ref>
<ref id="pone.0095693-Carstensen1"><label>31</label>
<mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Carstensen</surname><given-names>LL</given-names></name>, <name name-style="western"><surname>Isaacowitz</surname><given-names>D</given-names></name>, <name name-style="western"><surname>Charles</surname><given-names>ST</given-names></name> (<year>1999</year>) <article-title>Taking time seriously: a theory of socioemotional selectivity</article-title>. <source>Am Psychol</source> <volume>54</volume>: <fpage>165</fpage>–<lpage>181</lpage>.</mixed-citation>
</ref>
<ref id="pone.0095693-Krebs1"><label>32</label>
<mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Krebs</surname><given-names>JR</given-names></name>, <name name-style="western"><surname>Kacelnik</surname><given-names>A</given-names></name>, <name name-style="western"><surname>Taylor</surname><given-names>P</given-names></name> (<year>1978</year>) <article-title>Tests of optimal sampling by foraging great tits</article-title>. <source>Nature</source> <volume>275</volume>: <fpage>27</fpage>–<lpage>31</lpage>.</mixed-citation>
</ref>
<ref id="pone.0095693-Wajnberg1"><label>33</label>
<mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Wajnberg</surname><given-names>E</given-names></name>, <name name-style="western"><surname>Bernhard</surname><given-names>P</given-names></name>, <name name-style="western"><surname>Hamelin</surname><given-names>F</given-names></name>, <name name-style="western"><surname>Boivin</surname><given-names>G</given-names></name> (<year>2006</year>) <article-title>Optimal patch time allocation for time-limited foragers</article-title>. <source>Behav Ecol Sociobiol</source> <volume>60</volume>: <fpage>1</fpage>–<lpage>10</lpage>.</mixed-citation>
</ref>
<ref id="pone.0095693-Eliassen2"><label>34</label>
<mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Eliassen</surname><given-names>S</given-names></name>, <name name-style="western"><surname>Jorgensen</surname><given-names>C</given-names></name>, <name name-style="western"><surname>Mangel</surname><given-names>M</given-names></name>, <name name-style="western"><surname>Giske</surname><given-names>J</given-names></name> (<year>2009</year>) <article-title>Quantifying the adaptive value of learning in foraging behavior</article-title>. <source>Am Nat</source> <volume>174</volume>: <fpage>478</fpage>–<lpage>489</lpage>.</mixed-citation>
</ref>
<ref id="pone.0095693-Greville1"><label>35</label>
<mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Greville</surname><given-names>WJ</given-names></name>, <name name-style="western"><surname>Buehner</surname><given-names>MJ</given-names></name> (<year>2010</year>) <article-title>Temporal predictability facilitates causal learning</article-title>. <source>J Exp Psychol Gen</source> <volume>139</volume>: <fpage>756</fpage>–<lpage>771</lpage>.</mixed-citation>
</ref>
<ref id="pone.0095693-Ohashi1"><label>36</label>
<mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Ohashi</surname><given-names>K</given-names></name>, <name name-style="western"><surname>Thomson</surname><given-names>JD</given-names></name> (<year>2005</year>) <article-title>Efficient harvesting of renewing resources</article-title>. <source>Behav Ecol</source> <volume>16</volume>: <fpage>592</fpage>–<lpage>605</lpage>.</mixed-citation>
</ref>
<ref id="pone.0095693-Watts1"><label>37</label>
<mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Watts</surname><given-names>DP</given-names></name> (<year>1998</year>) <article-title>Long-term habitat use by mountain gorillas (<italic>Gorilla gorilla beringei</italic>). 2. Reuse of foraging areas in relation to resource abundance, quality, and depletion</article-title>. <source>Int J Primatol</source> <volume>19</volume>: <fpage>681</fpage>–<lpage>702</lpage>.</mixed-citation>
</ref>
<ref id="pone.0095693-Comba1"><label>38</label>
<mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Comba</surname><given-names>L</given-names></name> (<year>1999</year>) <article-title>Patch use by bumblebees (<italic>Hymenoptera Apidae</italic>): temperature, wind, flower density and traplining</article-title>. <source>Ethol Ecol Evol</source> <volume>11</volume>: <fpage>243</fpage>–<lpage>264</lpage>.</mixed-citation>
</ref>
<ref id="pone.0095693-Garrison1"><label>39</label>
<mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Garrison</surname><given-names>JSE</given-names></name>, <name name-style="western"><surname>Gass</surname><given-names>CL</given-names></name> (<year>1999</year>) <article-title>Response of a traplining hummingbird to changes in nectar availability</article-title>. <source>Behav Ecol</source> <volume>10</volume>: <fpage>714</fpage>–<lpage>725</lpage>.</mixed-citation>
</ref>
<ref id="pone.0095693-Gullapalli1"><label>40</label>
<mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Gullapalli</surname><given-names>V</given-names></name> (<year>1990</year>) <article-title>A stochastic reinforcement learning algorithm for learning real-valued functions</article-title>. <source>Neural Networks</source> <volume>3</volume>: <fpage>671</fpage>–<lpage>692</lpage>.</mixed-citation>
</ref>
<ref id="pone.0095693-McNamara1"><label>41</label>
<mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>McNamara</surname><given-names>JM</given-names></name>, <name name-style="western"><surname>Trimmer</surname><given-names>PC</given-names></name>, <name name-style="western"><surname>Eriksson</surname><given-names>A</given-names></name>, <name name-style="western"><surname>Marshall</surname><given-names>JAR</given-names></name>, <name name-style="western"><surname>Houston</surname><given-names>AI</given-names></name> (<year>2011</year>) <article-title>Environmental variability can select for optimism or pessimism</article-title>. <source>Ecol Lett</source> <volume>14</volume>: <fpage>48</fpage>–<lpage>62</lpage>.</mixed-citation>
</ref>
<ref id="pone.0095693-Nevo1"><label>42</label>
<mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Nevo</surname><given-names>D</given-names></name>, <name name-style="western"><surname>Furneaux</surname><given-names>B</given-names></name>, <name name-style="western"><surname>Wand</surname><given-names>Y</given-names></name> (<year>2008</year>) <article-title>Towards an evaluation framework for knowledge management systems</article-title>. <source>Inf Technol Manage</source> <volume>9</volume>: <fpage>233</fpage>–<lpage>249</lpage>.</mixed-citation>
</ref>
<ref id="pone.0095693-Birren1"><label>43</label>
<mixed-citation publication-type="other" xlink:type="simple">Birren JE, Schaie KW eds (2006) Handbook of the psychology of aging. Amsterdam: Elsevier.</mixed-citation>
</ref>
<ref id="pone.0095693-Meyer1"><label>44</label>
<mixed-citation publication-type="other" xlink:type="simple">Meyer BJF, Pollard CK (2006) Applied learning and aging: a closer look at reading. In: Birren JE, Schaie KW eds. Handbook of the psychology of aging. Amsterdam: Elsevier. 233–261.</mixed-citation>
</ref>
<ref id="pone.0095693-Sinnott1"><label>45</label>
<mixed-citation publication-type="other" xlink:type="simple">Sinnott JD (1989) A model for solution of ill-structured problems: implications for everyday and abstract problem solving. In: Sinnott JD ed. Everyday problem solving: theory and applications. Westport: Praeger. 72–99.</mixed-citation>
</ref>
<ref id="pone.0095693-Thornton1"><label>46</label>
<mixed-citation publication-type="other" xlink:type="simple">Thornton R, Light LL (2006) Language comprehension and production in normal aging. In: Birren JE, Schaie KW eds. Handbook of the psychology of aging. Amsterdam: Elsevier. 262–288.</mixed-citation>
</ref>
<ref id="pone.0095693-Burke1"><label>47</label>
<mixed-citation publication-type="other" xlink:type="simple">Burke DM, MacKay DG, James LE (2000) Theoretical approaches to language and aging. In: Perfect T, Maylor E eds. Models of cognitive aging. New York: Oxford University Press. 204–237.</mixed-citation>
</ref>
<ref id="pone.0095693-Carstensen2"><label>48</label>
<mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Carstensen</surname><given-names>LL</given-names></name> (<year>1993</year>) <article-title>Motivation for social contact across the life span: a theory of socioemotional selectivity</article-title>. <source>Nebr Sym Motiv</source> <volume>40</volume>: <fpage>209</fpage>–<lpage>254</lpage>.</mixed-citation>
</ref>
<ref id="pone.0095693-Carstensen3"><label>49</label>
<mixed-citation publication-type="other" xlink:type="simple">Carstensen LL (1998) A life-span approach to social motivation. In: Heckhausen J, Dweck C eds. Motivation and self-regulation across the life span. Cambridge: Cambridge University Press. 341–364.</mixed-citation>
</ref>
<ref id="pone.0095693-Carstensen4"><label>50</label>
<mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Carstensen</surname><given-names>LL</given-names></name>, <name name-style="western"><surname>Fung</surname><given-names>HH</given-names></name>, <name name-style="western"><surname>Charles</surname><given-names>ST</given-names></name> (<year>2003</year>) <article-title>Socioemotional selectivity theory and the regulation of emotion in the second half of life</article-title>. <source>Motiv Emotion</source> <volume>27</volume>: <fpage>103</fpage>–<lpage>123</lpage>.</mixed-citation>
</ref>
<ref id="pone.0095693-Riediger1"><label>51</label>
<mixed-citation publication-type="other" xlink:type="simple">Riediger M, Li S-C, Lindenberger U (2006) Selection, optimization, and compensation as developmental mechanisms of adaptive resource allocation: review and preview. In: Birren JE, Schaie KW eds. Handbook of the psychology of aging. Amsterdam: Elsevier. 289–314.</mixed-citation>
</ref>
<ref id="pone.0095693-Fung1"><label>52</label>
<mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Fung</surname><given-names>HH</given-names></name>, <name name-style="western"><surname>Carstensen</surname><given-names>LL</given-names></name>, <name name-style="western"><surname>Lutz</surname><given-names>AM</given-names></name> (<year>1999</year>) <article-title>Influence of time on social preference: implications for life-span development</article-title>. <source>Psychol Aging</source> <volume>14</volume>: <fpage>595</fpage>–<lpage>604</lpage>.</mixed-citation>
</ref>
</ref-list></back>
</article>