data/pone.0000217.nxml

<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Archiving and Interchange DTD v2.3 20070202//EN" "archivearticle.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:mml="http://www.w3.org/1998/Math/MathML" article-type="research-article"><?properties open_access?><front><journal-meta><journal-id journal-id-type="nlm-ta">PLoS ONE</journal-id><journal-id journal-id-type="publisher-id">plos</journal-id><journal-id journal-id-type="pmc">plosone</journal-id><journal-title>PLoS ONE</journal-title><issn pub-type="epub">1932-6203</issn><publisher><publisher-name>Public Library of Science</publisher-name><publisher-loc>San Francisco, USA</publisher-loc></publisher></journal-meta><article-meta><article-id pub-id-type="pmid">17299597</article-id><article-id pub-id-type="pmc">1790863</article-id><article-id pub-id-type="publisher-id">06-PONE-RA-00287R1</article-id><article-id pub-id-type="doi">10.1371/journal.pone.0000217</article-id><article-categories><subj-group subj-group-type="heading"><subject>Research Article</subject></subj-group><subj-group subj-group-type="Discipline"><subject>Evolutionary Biology</subject><subject>Computational Biology/Systems Biology</subject><subject>Evolutionary Biology/Evolutionary and Comparative Genetics</subject><subject>Evolutionary Biology/Genomics</subject><subject>Genetics and Genomics/Population Genetics</subject><subject>Microbiology/Microbial Evolution and Genomics</subject></subj-group></article-categories><title-group><article-title>Quantifying Organismal Complexity using a Population Genetic Approach</article-title><alt-title alt-title-type="running-head">Population Genetic Complexity</alt-title></title-group><contrib-group><contrib contrib-type="author" equal-contrib="yes"><name><surname>Tenaillon</surname><given-names>Olivier</given-names></name><xref ref-type="aff" rid="aff1"><sup>1</sup></xref><xref ref-type="aff" rid="aff2"><sup>2</sup></xref><xref ref-type="corresp" rid="n101"><sup>&#x0002a;</sup></xref></contrib><contrib contrib-type="author" equal-contrib="yes"><name><surname>Silander</surname><given-names>Olin 
K.</given-names></name><xref ref-type="aff" rid="aff2"><sup>2</sup></xref><xref ref-type="aff" rid="aff3"><sup>3</sup></xref></contrib><contrib contrib-type="author"><name><surname>Uzan</surname><given-names>Jean-Philippe</given-names></name><xref ref-type="aff" rid="aff4"><sup>4</sup></xref></contrib><contrib contrib-type="author"><name><surname>Chao</surname><given-names>Lin</given-names></name><xref ref-type="aff" rid="aff2"><sup>2</sup></xref></contrib></contrib-group><aff id="aff1"><label>1</label><addr-line>Institut National de la Sant&#x000e9; et de la Recherche M&#x000e9;dicale (INSERM) U722, Facult&#x000e9; de M&#x000e9;decine Xavier Bichat, Universit&#x000e9; Denis Diderot-Paris VII, Paris, France</addr-line></aff><aff id="aff2"><label>2</label><addr-line> Division of Biology, University of California San Diego, La Jolla, California, United States of America</addr-line></aff><aff id="aff3"><label>3</label><addr-line> Eidgen&#x000f6;ssische Technische Hochschule (ETH) Zurich, Ecology and Evolution, ETH-Zentrum NW, Zurich, Switzerland</addr-line></aff><aff id="aff4"><label>4</label><addr-line> Institut d'Astrophysique de Paris, Universit&#x000e9; Pierre et Marie Curie-Paris VI, Centre National de la Recherche Scientifique (CNRS) UMR 7095, Paris, France</addr-line></aff><contrib-group><contrib contrib-type="editor"><name><surname>Buckling</surname><given-names>Angus</given-names></name><role>Academic Editor</role><xref ref-type="aff" rid="edit1"/></contrib></contrib-group><aff id="edit1">Oxford University, United Kingdom</aff><author-notes><corresp id="n101">&#x0002a; To whom correspondence should be addressed. E-mail: <email>Olivier.Tenaillon@bichat.inserm.fr</email></corresp><fn fn-type="con"><p>Conceived and designed the experiments: LC OT OS. Performed the experiments: OT OS. Analyzed the data: LC OT JU. 
Wrote the paper: LC OT OS JU.</p></fn></author-notes><pub-date pub-type="collection"><year>2007</year></pub-date><pub-date pub-type="epub"><day>14</day><month>2</month><year>2007</year></pub-date><volume>2</volume><issue>2</issue><elocation-id>e217</elocation-id><history><date date-type="received"><day>26</day><month>10</month><year>2006</year></date><date date-type="accepted"><day>25</day><month>1</month><year>2007</year></date></history><copyright-statement>Tenaillon et al. This is an open-access article distributed under the terms of the Creative Commons Attribution License, which permits unrestricted use, distribution, and reproduction in any medium, provided the original author and source are credited.</copyright-statement><copyright-year>2007</copyright-year><abstract><sec><title>Background</title><p>Various definitions of biological complexity have been proposed: the number of genes, cell types, or metabolic processes within an organism. As knowledge of biological systems has increased, it has become apparent that these metrics are often incongruent.</p></sec><sec sec-type="methods"><title>Methodology</title><p>Here we propose an alternative complexity metric based on the number of genetically uncorrelated phenotypic traits contributing to an organism's fitness. This metric, phenotypic complexity, is more objective than previous suggestions, as complexity is measured from a fundamental biological perspective, that of natural selection. We utilize a model linking the equilibrium fitness (drift load) of a population to phenotypic complexity. 
We then use results from viral evolution experiments to compare the phenotypic complexities of two viruses, the bacteriophage &#x003a6;X174 and vesicular stomatitis virus, and to illustrate the consistency of our approach and its applicability.</p></sec><sec><title>Conclusions/Significance</title><p>Because Darwinian evolution through natural selection is the fundamental element unifying all biological organisms, we propose that our metric of complexity is potentially a more relevant metric than others that are based on counts of artificially defined sets of objects.</p></sec></abstract><counts><page-count count="8"/></counts></article-meta></front><body><sec id="s1"><title>Introduction</title><p>A persistent question in biology is how organismal complexity changes through the course of evolution <xref ref-type="bibr" rid="pone.0000217-McShea1">&#x0005b;1&#x0005d;</xref>&#x02013;<xref ref-type="bibr" rid="pone.0000217-Adami2">&#x0005b;5&#x0005d;</xref>. Although significant progress has been made in understanding and quantifying organismal characteristics at many levels of organization (DNA, proteins, metabolic networks, cellular organization, organ functions, individual behavior), much confusion remains about how to accurately quantify organismal complexity. Several intuitive proposals have been made that take into account simple metrics such as the number of genes or cell types. However, these simple measures quickly lead to conflicting conclusions <xref ref-type="bibr" rid="pone.0000217-Szathmary1">&#x0005b;2&#x0005d;</xref>, <xref ref-type="bibr" rid="pone.0000217-Carroll1">&#x0005b;3&#x0005d;</xref>. Here we propose a fundamentally different approach to measuring organismal complexity; as opposed to relying on bottom-up measures such as the number of genes an organism has, we utilize an objective biological approach: natural selection. 
Instead of asking how complex an organism is from our own perspective, we ask: how complex is an organism from the perspective of natural selection? Essentially, this is a top-down metric of organismal complexity that we term phenotypic complexity.</p><p>Phenotypic complexity quantifies the number of genetically uncorrelated phenotypic traits contributing to an organism's fitness. A phenotypic trait contributes to an organism's fitness only to the extent that natural selection acts upon that trait. Thus an organismal phenotype that is no longer under selection (for example during an evolutionary transition from a generalist to specialist lifestyle), although expressed by the organism, contributes nothing to organismal complexity. Secondly, if two phenotypes contribute to complexity, they must be genetically separable: some mutations must exist that affect one phenotype but not the other. If no such mutations exist, then although we may perceive two phenotypes under selection, these phenotypes contribute only a single trait toward determining phenotypic complexity. As an example consider the affinity of an enzyme for a substrate, and the rate at which that substrate is converted to product. If there are no mutations that affect one of these traits but not the other, then these two phenotypes are considered one, until the organism gains the genetic complexity to generate variation in one phenotype without affecting the second, for example by evolving functionally separate domains in the enzyme. Phenotypic complexity is thus a combined description of how natural selection perceives organismal phenotypes and how phenotypic variation is generated by the organism. This concept was first articulated by Orr, and followed later by others <xref ref-type="bibr" rid="pone.0000217-Orr1">&#x0005b;6&#x0005d;</xref>&#x02013;<xref ref-type="bibr" rid="pone.0000217-Welch1">&#x0005b;8&#x0005d;</xref>. 
Notably, it is similar to physical complexity, which is a measure of the amount of information that an organism encodes about its environment <xref ref-type="bibr" rid="pone.0000217-Adami1">&#x0005b;4&#x0005d;</xref>, <xref ref-type="bibr" rid="pone.0000217-Adami2">&#x0005b;5&#x0005d;</xref>.</p><p>An important aspect of measuring complexity in this manner is that both the organism and the environment affect the metric. An organism with many phenotypes, but living in a simple environment, could thus be just as complex as a simpler organism in the same environment. For example, if one organism is capable of metabolizing both lactose and glucose, while a second can metabolize only glucose, the first organism will only be designated as more complex when there is a possibility that lactose will be present in the environment.</p><p>Recent population genetic theory <xref ref-type="bibr" rid="pone.0000217-Hartl1">&#x0005b;9&#x0005d;</xref>, <xref ref-type="bibr" rid="pone.0000217-Poon1">&#x0005b;10&#x0005d;</xref> has suggested that phenotypic complexity is proportional to the drift load, a quantity that describes how equilibrium mean population fitness declines with population size. This can be intuitively understood in the following manner. An organism's fitness is a result of how successfully it interacts with the environment. As the number of interactions (traits) increases, it becomes difficult to simultaneously maintain each one. Very large populations maintain nearly optimal mean population fitness regardless of phenotypic complexity. Small populations can maintain high average fitness only when there are a small number of traits (low complexity) each contributing a relatively large amount to fitness; if there are a large number of traits (high complexity), each contributing only a small amount to fitness, then small populations will be incapable of maintaining all of them. 
Thus for complex organisms, there will be a large difference in mean fitness between small and large populations; for simple organisms, this difference in average fitness will be small.</p><p>The phenotypic model used to link drift load to phenotypic complexity was first formalized by R. A. Fisher <xref ref-type="bibr" rid="pone.0000217-Fisher1">&#x0005b;11&#x0005d;</xref>. He envisioned a multidimensional phenotypic space in which the origin of each axis corresponded to the most-fit or optimum phenotypic value. As phenotypic values depart from the origin, fitness decreases. The manner in which fitness declines is described by a monotonically decreasing function, which may take a variety of shapes, e.g., linear, concave-up, or &#x02013;down. Individuals of equal fitness but different phenotypic values trace out fitness isoclines in the space. If an organism has only two phenotypes, the phenotypic space is two-dimensional and the fitness isoclines are a series of circles centered on the origin of the axes (<xref ref-type="fig" rid="pone-0000217-g001">Fig. 1</xref>). If an organism has n number of phenotypes, phenotypic space is n-dimensional, and each fitness isocline is an n-dimensional hyper-sphere. Because of the assumed geometry of the isoclines, this model is referred to as Fisher's Geometric Model (FGM) of phenotypic or adaptive evolution.</p><fig id="pone-0000217-g001" position="float"><object-id pub-id-type="doi">10.1371/journal.pone.0000217.g001</object-id><label>Figure 1</label><caption><title>Fisher's geometric model in two-dimensional phenotypic space.</title><p>Fitness varies along two phenotypic axes, with the maximum fitness located, for convenience, at the origin of these axes. Any individual in a population (black point) can thus be described by its phenotypic values, which determine the fitness of that organism. 
At any specific fitness, there are a number of other phenotypic combinations that have equivalent fitness; the values of these phenotypic combinations establish the fitness isoclines (black circle). From the optimum, fitness declines monotonically according to the structure of the landscape (see text). Each mutation (arrow) is drawn from a distribution centered on the phenotypic position of each individual, resulting in offspring with new phenotypic combinations and fitness values (white point).</p></caption><graphic xlink:href="pone.0000217.g001"/></fig><p>A population of individuals can be represented as a collection of points in FGM and the phenotypic values of each point allow ascertainment of the fitness of each individual. Individual fitness then determines the probability of each individual surviving and reproducing the next generation. Evolution is thus described in FGM by following the collection of points over many generations. To generate novel genetic variation, mutations are drawn from an assumed distribution that is centered on the phenotypic position of each individual (<xref ref-type="fig" rid="pone-0000217-g001">Fig. 1</xref>). By never descending into genotypic space, FGM is analogous to quantitative genetics models. Both types of models assume or require only that a component of phenotype is heritable. However, whereas quantitative genetic models represent populations by their mean and variance, FGM is an individual-based model in which each individual is evaluated according to its fitness.</p><p>FGM makes a set of theoretical predictions about how adaptation tends to occur, and many of these have been corroborated by experimental results. 
The greater frequency of small-sized beneficial mutations <xref ref-type="bibr" rid="pone.0000217-Burch1">&#x0005b;12&#x0005d;</xref>, the L-shaped distribution of mutations fixed throughout evolution <xref ref-type="bibr" rid="pone.0000217-Estes1">&#x0005b;13&#x0005d;</xref>, the existence of fitness equilibriums <xref ref-type="bibr" rid="pone.0000217-Silander1">&#x0005b;14&#x0005d;</xref>, and the absence of intrinsically beneficial or intrinsically deleterious mutations have all been observed during laboratory evolution, and all conform to the conditions set forth under FGM. The model thus appears to offer a reasonable framework for the study of microbial evolution.</p><p>The utility of FGM lies in the fact that it does not require any particular assumptions about the map between phenotype and genotype, and that the specific predictions about how fitness changes during evolution appear to be robust. In the present paper, we further refine previous predictions derived from FGM <xref ref-type="bibr" rid="pone.0000217-Hartl1">&#x0005b;9&#x0005d;</xref>, <xref ref-type="bibr" rid="pone.0000217-Poon1">&#x0005b;10&#x0005d;</xref> to take into account some fitness functions compatible with experimental data and use these results to estimate the phenotypic complexity of two viruses evolved in the laboratory.</p></sec><sec id="s2"><title>Model and Results</title><p>The link between drift load and phenotypic complexity under FGM was first investigated by Hartl and Taubes <xref ref-type="bibr" rid="pone.0000217-Hartl1">&#x0005b;9&#x0005d;</xref> (although Wagner and Gabriel <xref ref-type="bibr" rid="pone.0000217-Wagner1">&#x0005b;15&#x0005d;</xref> had worked previously on a similar question), and was later refined by Poon and Otto <xref ref-type="bibr" rid="pone.0000217-Poon1">&#x0005b;10&#x0005d;</xref>. Recent theoretical techniques from statistical physics now allow an exact solution of FGM for several fitness functions. 
Sella and Hirsh <xref ref-type="bibr" rid="pone.0000217-Sella1">&#x0005b;16&#x0005d;</xref> found that mean equilibrium fitness &#x02329;f&#x0232a; can be written as<disp-formula><graphic xlink:href="pone.0000217.e001.jpg" mimetype="image" position="float"/></disp-formula></p><p>In which &#x003bd;&#x0200a;&#x0003d;&#x0200a;2&#x022c5;N<sub>e</sub>&#x02212;1 in the diploid case and 2&#x022c5;N<sub>e</sub>&#x02212;2 in the haploid, and &#x003c1;(f), the density function, <italic>i.e.</italic> the size of the fitness f isocline, is dependent on the number of dimensions and on the fitness function used.</p><sec id="s2a"><title>Linear Fitness Decline</title><p>If fitness is assumed to be a linearly decreasing function of the phenotypic distance to the optimum, then we find that the average fitness is given by (<xref ref-type="sec" rid="s4">Methods, Appendix A</xref>):<disp-formula><graphic xlink:href="pone.0000217.e002.jpg" mimetype="image" position="float"/></disp-formula>in the diploid case, in which F<sub>eq</sub> is the equilibrium fitness (drift load) expressed as a fraction of the maximum attainable fitness of the organism, n<sub>e</sub> is the <italic>effective</italic> number of dimensions of the phenotypic space (phenotypic complexity; see below for a more detailed discussion of why we term this the effective number of dimensions), and N<sub>e</sub> is the effective population size. 
This confirms the results obtained by Poon and Otto who approximated F<sub>eq</sub>(n<sub>e</sub>, N<sub>e</sub>) as 2N<sub>e</sub>/(2N<sub>e</sub>&#x0002b;n<sub>e</sub>) <xref ref-type="bibr" rid="pone.0000217-Poon1">&#x0005b;10&#x0005d;</xref>.</p><p>Although earlier studies on FGM model have used such linear fitness functions (for the sake of mathematical simplicity), recent experimental studies do not seem to support the use of such a function <xref ref-type="bibr" rid="pone.0000217-Burch2">&#x0005b;17&#x0005d;</xref>&#x02013;<xref ref-type="bibr" rid="pone.0000217-Sanjuan1">&#x0005b;19&#x0005d;</xref>. Linear fitness functions give rise to dramatic synergistic epistasis. For example, a mutation that increases the distance to the optimal phenotype by 0.1 units may decrease fitness by 10&#x00025; in the optimal genotype (which by definition has a fitness of 1); an analogous mutation will decrease fitness by 50&#x00025; in an organism with a fitness of 0.2; this mutation will become lethal in any genotype with a fitness less than 0.1. Recent experimental work suggests that epistasis between deleterious mutations is either antagonistic <xref ref-type="bibr" rid="pone.0000217-Burch2">&#x0005b;17&#x0005d;</xref>&#x02013;<xref ref-type="bibr" rid="pone.0000217-Sanjuan1">&#x0005b;19&#x0005d;</xref> or null <xref ref-type="bibr" rid="pone.0000217-Elena1">&#x0005b;20&#x0005d;</xref>. We therefore decided to use a family of exponential fitness functions with a parameter that allows control over the level and shape of epistasis.</p></sec><sec id="s2b"><title>Exponential-type Fitness Decline</title><p>In an effort to explore fitness functions more compatible with experimental data, we studied the following family of functions. f(d)&#x0200a;&#x0003d;&#x0200a;exp(&#x02212;(d<sup>Q</sup>)), in which fitness is an exponentially decaying function of the distance to the optimum to the power of Q. Q is a parameter that modifies the concavity of the fitness decline. 
As organisms move away from the optimum, mutations tend to have a bigger effect if Q&#x0003e;1 and a smaller effect if Q&#x0003c;1. In such a case the fitness equilibriums are (<xref ref-type="sec" rid="s4">Methods, Appendix A</xref>):<disp-formula><graphic xlink:href="pone.0000217.e003.jpg" mimetype="image" position="float"/></disp-formula></p><p>Thus in the haploid case on which we will focus later:<disp-formula><graphic xlink:href="pone.0000217.e004.jpg" mimetype="image" position="float"/></disp-formula></p><p>The validity of these results was confirmed by an individual-based simulation model analogous to one used previously <xref ref-type="bibr" rid="pone.0000217-Orr1">&#x0005b;6&#x0005d;</xref> (<xref ref-type="fig" rid="pone-0000217-g002">Fig. 2</xref>).</p><fig id="pone-0000217-g002" position="float"><object-id pub-id-type="doi">10.1371/journal.pone.0000217.g002</object-id><label>Figure 2</label><caption><title>Predicted equilibrium fitness as a function of phenotypic complexity (n<sub>e</sub>).</title><p>Results are shown for populations of size 100 (black), ten (grey), and three (white). An exponential fitness decline in which Q&#x0200a;&#x0003d;&#x0200a;1 was used (yielding a fitness function of f(d)&#x0200a;&#x0003d;&#x0200a;exp(&#x02212;d)). Circles indicate the average fitness reached in the simulation model; curves indicate the analytical results.</p></caption><graphic xlink:href="pone.0000217.g002"/></fig></sec><sec id="s2c"><title>Robustness of Fitness Equilibrium to FGM Hypothesis</title><p>The implementation of FGM requires several assumptions with regard to the biology of the organism. The distributions of the mutations and the shape of the fitness function are required, and the geometry of the fitness isoclines needs to be symmetrical. 
However, we show below that the equilibrium drift load is fairly insensitive to these strict assumptions.</p><p>First, as equation (4) suggests, the fitness equilibrium is independent of the mutational properties. As long as mutation is assumed to be isotropic, only the convergence time to equilibrium, and not the equilibrium fitness value, is affected by the distribution of mutational effects (data not shown). Second, although the results depend on the shape of the fitness function (linear or exponential-type), they are independent of the slope: equilibrium values will be the same if f(d)&#x0200a;&#x0003d;&#x0200a;exp(&#x02212;&#x003b1;d<sup>Q</sup>) (<xref ref-type="sec" rid="s4">Methods, Appendix B</xref>). Third, although the canonical FGM assumes circular fitness isoclines, it can be shown that if fitness isoclines are elliptical instead of circular, then the density function is affected, but this cancels out in the calculation of fitness equilibrium. This holds for fitness isoclines and also for any fitness function of the form f(X)&#x0200a;&#x0003d;&#x0200a;exp(&#x02212;&#x02211;&#x003b1;<sub>i</sub>x<sub>i</sub><sup>Q</sup>), where X&#x0200a;&#x0003d;&#x0200a;(x<sub>0</sub>, x<sub>1</sub>, &#x02026;, x<sub>n</sub>) is the coordinate of an individual in FGM, and &#x003b1;<sub>i</sub> are positive parameters (<xref ref-type="sec" rid="s4">Methods, Appendix B</xref>). Finally, if the mutation cloud is a Gaussian ellipsoid, it has been shown that an appropriate change of axes result in a space in which fitness isoclines are ellipsoid while the mutation cloud is circular <xref ref-type="bibr" rid="pone.0000217-Martin1">&#x0005b;21&#x0005d;</xref>. 
Hence it seems that asymmetry in both the mutational distribution and the fitness isoclines do not affect the equilibrium fitness values, a robustness of the equilibrium fitness confirmed by some simulation data (data not shown).</p><p>The equilibrium drift load seems to be a robust property of FGM that is determined by the number of dimensions of phenotypic space, the population size and the fitness function (especially its curvature). An accurate estimate of phenotypic complexity can thus be obtained if it is possible to estimate equilibrium fitness values (drift load) for several population sizes, as well as the amount of curvature in the fitness function.</p></sec><sec id="s2d"><title>Viral Evolution</title><p>We used two sets of evolution experiments in which both fitness equilibrium values and fitness curvature have been investigated (<xref ref-type="fig" rid="pone-0000217-g003">Fig. 3</xref>). In the first set of experiments we evolved the bacteriophage &#x003a6;X174 on a bacterial lawn of its host, <italic>Escherichia coli</italic> C. We increased the mutation rate of the phage to hasten convergence to fitness equilibrium with the use of hydroxylamine; this resulted in a mean mutation rate of 0.1 per genome per generation through the 450 generations of evolution. Population size-dependent fitness equilibriums were observed, confirming that evolution occurred in a manner compatible with the assumptions of FGM. From these populations we obtained 21 measures of equilibrium fitness at five different population sizes. 
Every transfer corresponded roughly to five phage generations and effective population size was then approximated to five times the number of plaques transferred (the harmonic mean).</p><fig id="pone-0000217-g003" position="float"><object-id pub-id-type="doi">10.1371/journal.pone.0000217.g003</object-id><label>Figure 3</label><caption><title>Equilibrium drift load as a function of population size for vesicular stomatitis virus and &#x003a6;X174.</title><p>Each point indicates the mean fitness of a population. The VSV populations are shown in dark grey and the &#x003a6;X174 are shown in white. Some points have been displaced on the x-axis for clarity. The VSV populations were transferred at effective population sizes of four, ten, and 60; the &#x003a6;X174 populations were transferred at effective population sizes of 15, 50, 150, 500, and 1250. The dotted lines specify the maximum likelihood estimate of the f<sub>ref</sub> value (the maximum attainable fitness); the dark dotted line indicates the value for VSV and the lighter dashed line indicates the value for &#x003a6;X174.</p></caption><graphic xlink:href="pone.0000217.g003"/></fig><p>To estimate the curvature of the fitness function we performed a mutation accumulation analysis for high and low fitness clones and showed that the distribution of deleterious mutations was similar at both ends of the fitness range spanning a 300-fold difference. This suggests that there is very little curvature of the fitness function.</p><p>We used a second set of data from the literature, in which populations were evolved for 20 transfers at different effective sizes. Novella et al. <xref ref-type="bibr" rid="pone.0000217-Novella1">&#x0005b;22&#x0005d;</xref> evolved four clones of vesicular stomatitis virus (VSV) using plaque-to-plaque transfers of sizes two, five, and 30. They also observed a population size-dependant fitness convergence. 
Although the time for convergence was relatively short (40 viral generations), several populations experienced no significant increases or decreases in fitness over all replicates at a given population size, suggesting that those populations were at or near an equilibrium fitness value. We used the fitness estimates from 24 populations evolved at population sizes of two, five and 30. Every transfer corresponded to roughly two viral generations and effective population size was thus approximated as two times the number of viral plaques transferred.</p><p>Additionally, an impressive set of data using site-directed mutagenesis in VSV suggests that the concavity of the fitness function is slightly upward <xref ref-type="bibr" rid="pone.0000217-Sanjuan1">&#x0005b;19&#x0005d;</xref>. However, in further analyses we estimate Q as 1 for both the phage and the virus, as no clear departure from 1 has been observed in either case.</p></sec><sec id="s2e"><title>Maximum Likelihood Estimate of Phenotypic Complexity</title><p>We wish to use the previous mathematical results to estimate phenotypic complexity from experimental data. However, there are two unknown parameters in the experimental system that affect the equilibrium drift load in a population: phenotypic complexity and the maximum attainable fitness that can be reached by the viruses in the laboratory environment (this parameter has been scaled to one in the previous derivations). Using methods from statistical physics, we can find the distribution of population fitness at equilibrium (shown above), and thus derive a likelihood model that gives the probability of the observed data for each couplet (n<sub>e</sub>/Q, f<sub>ref</sub>), in which n<sub>e</sub> is the phenotypic complexity, Q a parameter of the curvature of the fitness surface, and f<sub>ref</sub> the maximum attainable fitness. 
We also take into account the noise in our experimental assessment of fitness values; especially for high fitness populations, noise in the estimates of fitness can alter the estimation of f<sub>ref</sub>, as this parameter is by definition higher than all fitness measures. Thus rather than using the probability of the point estimate of fitness, we integrated the probability between plus (f<sub>&#x0002b;</sub>) and minus (f<sub>&#x02212;</sub>) one standard deviation of the point estimate. In Appendix C we show that <disp-formula><graphic xlink:href="pone.0000217.e005.jpg" mimetype="image" position="float"/></disp-formula></p></sec><sec id="s2f"><title>Estimates of Phenotypic Complexity for VSV and &#x003a6;X174</title><p>We applied the maximum likelihood estimator to the experimental estimates of population fitness for &#x003a6;X174 and VSV, and using a likelihood ratio test we defined 95&#x00025; confidence intervals (CI), which we list here in parentheses. For &#x003a6;X174 we found n<sub>e</sub>/Q&#x0200a;&#x0003d;&#x0200a;45 (42&#x02212;49), and f<sub>ref</sub>&#x0200a;&#x0003d;&#x0200a;1.245 (1.23&#x02212;1.26), whereas for VSV we found n<sub>e</sub>/Q&#x0200a;&#x0003d;&#x0200a;10 (8&#x02212;12) and f<sub>ref</sub>&#x0200a;&#x0003d;&#x0200a;1.98 (1.94&#x02212;2.05) (<xref ref-type="fig" rid="pone-0000217-g003"><bold>Fig. 3</bold></xref>). In both of these cases, f<sub>ref</sub> is calculated per generation relative to the ancestral virus for &#x003a6;X174 and relative to a reference strain for VSV. As no strong signature of curvature in the fitness surface has been found for either virus, we assume that Q is approximately one.</p></sec></sec><sec id="s3"><title>Discussion</title><p>To understand how biological complexity changes during the course of evolution, a metric is needed. Previously, measures such as the number of genes, cell types or metabolic processes have been proposed, but they often lead to incongruent results. 
Organisms with more cell types do not necessarily have more genes. Here we suggest that a metric unifying biological systems has not been appropriately identified. To circumvent this problem, we have developed a metric of biological complexity termed phenotypic complexity (n<sub>e</sub>). We have quantified this metric in the viruses &#x003a6;X174 and VSV by utilizing a population genetic model that describes how phenotypic complexity affects the drift load that a population experiences.</p><p>Phenotypic complexity (n<sub>e</sub>) is a measure of the number of genetically uncorrelated phenotypes that are acted upon by natural selection. Because Darwinian evolution through natural selection is the fundamental element unifying all biological organisms, we propose that n<sub>e</sub> is potentially a more relevant metric than those previously suggested.</p><sec id="s3a"><title>Robustness of the Model</title><p>Using recent theoretical results we have analytically quantified the dependency of the drift load (equilibrium fitness) on the effective population size and phenotypic complexity. The linear fitness function that has been employed previously to simplify the mathematical analyses is no longer necessary. Such a function makes strong assumptions about the form of the fitness landscape; specifically, mutational effects become very large as fitness is reduced. Thus at low fitness most mutations are either lethal or of very large effect, a scenario which is incompatible with what we have previously observed <xref ref-type="bibr" rid="pone.0000217-Silander1">&#x0005b;14&#x0005d;</xref>.</p><p>We have therefore studied a more general family of fitness functions of the form f(d)&#x0200a;&#x0003d;&#x0200a;exp(&#x02212;(d<sup>Q</sup>)), and found that F<sub>eq</sub>(N<sub>e</sub>, n<sub>e</sub>)&#x0200a;&#x0003d;&#x0200a;(1&#x02212;(2&#x022c5;N<sub>e</sub>&#x02212;1)<sup>&#x02212;1</sup>)<sup>(ne/Q)</sup>. 
It appears that this equation remains valid over a much wider range of conditions than those used in the canonical FGM, in which mutations are required to be isotropic and fitness isoclines are symmetric about the origin. An interesting feature of this formula is that it does not require a model in which mutations can affect all phenotypic traits simultaneously. In the initial formulation of FGM, all phenotypic axes intersect at the origin of each axis. This original FGM can be modified slightly such that some phenotypes are grouped into separate phenotypic modules, and within a module, all phenotypes again intersect at each other's origin. Any mutation that occurs within a module can affect only other phenotypes within that module, and none that lie outside of it (<italic>i.e.</italic> there is no pleiotropy between modules, an idea similar to previous conceptions of modularity <xref ref-type="bibr" rid="pone.0000217-Wagner2">&#x0005b;23&#x0005d;</xref>). Using the more general description of the equilibrium drift load that we have derived above, a phenotypic landscape composed of a single module with n<sub>e</sub> dimensions has the same drift load function as a landscape composed of m independent modules of size n<sub>e,i</sub> with &#x02211;<sub>i</sub> n<sub>e,i</sub>&#x0200a;&#x0003d;&#x0200a;n<sub>e</sub> because we have <disp-formula><graphic xlink:href="pone.0000217.e006.jpg" mimetype="image" position="float"/></disp-formula></p><p>Hence the drift load formula that we have obtained seems to be robust to many of the assumptions underlying FGM.</p></sec><sec id="s3b"><title>Other Attempts to Estimate Phenotypic Complexity</title><p>Recently, another theoretical study developed a framework to estimate phenotypic complexity <xref ref-type="bibr" rid="pone.0000217-Martin1">&#x0005b;21&#x0005d;</xref>. The model developed used predictions on the distribution of mutational effects to estimate complexity.
This analysis, which is completely independent from ours, found an interesting correlation between gene number and complexity in a variety of organisms ranging from a virus to <italic>C. elegans</italic>. However, for all the organisms for which enough data existed to perform the analysis, the number of phenotypic dimensions estimated was very small; 0.21 phenotypic dimensions for <italic>E. coli</italic>, 1.07 in VSV, 1&#x02013;2 for <italic>S. cerevisiae</italic>, and 2&#x02013;3 for <italic>D. melanogaster</italic> and <italic>C. elegans</italic>. We think that several effects may limit the predictive quality of such a method. Firstly, mutation accumulation methods and the inherent noise in fitness estimates are very different across species and comparisons across species are thus difficult. One illustration of this is the large variability in fitness estimates for mutations in a single species using two methods: in VSV earlier estimates (using Bateman-Mukai estimates) predicted a 0.002 mean fitness effect per mutation, while more recent and accurate estimates (which introduced each mutation individually) brought the estimate to 14&#x00025; (a 70-fold difference). Secondly, neutral mutations are not considered in the model developed by Martin and Lenormand. However, some of the mutations produced by transposable elements might affect genes useless in laboratory conditions and will therefore be taken into account in the calculation of mean fitness effects of mutations even if they do not affect any phenotype in the laboratory environment. Thirdly, contrary to our model, if phenotypes are organized in different modules (as many data suggest), their model will provide different estimates; in other words, their model requires that all traits can be simultaneously affected by a single mutation.
All these considerations suggest that a second independent model should be used to estimate phenotypic complexity.</p><p>One of the central FGM hypotheses that we have so far not addressed is the single-peaked nature of the landscape. Although FGM contains few assumptions about the nature of the genotypic landscape, the model explicitly requires a phenotypic landscape containing a single peak; without this, the fitness function, f(d), cannot be described by a decreasing function. However, recent experimental evidence over large evolutionary time scales strongly suggests that while the genotypic landscape may contain multiple peaks, the phenotypic landscape is generally much less complex. Several experimental studies using microbes have shown that a considerable amount of phenotypic convergence occurs during evolution <xref ref-type="bibr" rid="pone.0000217-Bull1">&#x0005b;24&#x0005d;</xref>&#x02013;<xref ref-type="bibr" rid="pone.0000217-Woods1">&#x0005b;27&#x0005d;</xref>, even when organisms begin from different starting points in the landscape <xref ref-type="bibr" rid="pone.0000217-Travisano1">&#x0005b;28&#x0005d;</xref>. These phenomena would only be expected if the phenotypic landscape exhibited a single peak. However, the evidence for ruggedness in the genetic landscape is also substantial, especially in experiments that have looked at bacterial evolution of resistance to antibiotics <xref ref-type="bibr" rid="pone.0000217-Schrag1">&#x0005b;29&#x0005d;</xref>. In this case, the fitness relationships between the wild type genotypes, resistant genotypes, compensated resistant genotypes, and sensitive genotypes bearing the compensatory mutation exhibit high levels of epistasis, characteristic of a rugged genetic landscape.
In other studies in which the cost of resistance was associated with a phenotype <xref ref-type="bibr" rid="pone.0000217-Reynolds1">&#x0005b;30&#x0005d;</xref>, fitness restoration to wild-type level was sometimes observed and, more importantly for our concern, it was associated with a restoration of the phenotypic damage associated with the occurrence of the resistance mutation (transcription efficiency of rifampicin resistant mutants was restored back to the level observed in rifampicin sensitive strains). This also suggests the singularity of the phenotypic optimum, although different genetic combinations may underlie this optimum. However, as our model is focusing neither on the genetic nature of the adaptive landscape, nor on the rate of adaptation (ruggedness means that several mutations could be needed to restore the effect of one) it should not be too sensitive to the small level of ruggedness of the genetic landscape described so far.</p></sec><sec id="s3c"><title>The Concept of Phenotypic Complexity</title><p>As discussed previously, the quantity denoted by n<sub>e</sub> is the number of genetically uncorrelated phenotypes that are influenced by the action of natural selection. The dimensions enumerated by n<sub>e</sub> are thus genetically orthogonal to each other, and analogous to the axes needed to describe the variation among multiple phenotypes measured on a collection of individuals and mutants in a principal component analysis. However, the number of axes enumerated by n<sub>e</sub> is filtered by natural selection, while in a PCA analysis the number of axes is limited only by the number of independent phenotypes that are measured.
Because each phenotype is optimized at a value determined by each organism's ecological environment, there is a dependence of phenotypic complexity on the complexity of the ecological niche experienced by each organism; if natural selection does not act on a phenotype, then that phenotype does not contribute to the complexity metric. Finally, although the estimates of n<sub>e</sub> arise from an idealized model of phenotypic evolution, as Orr suggested previously, estimates of phenotypic complexity using FGM can be viewed as &#x0201c;effective&#x0201d; estimates of phenotypic complexity <xref ref-type="bibr" rid="pone.0000217-Orr1">&#x0005b;6&#x0005d;</xref>. This concept is analogous to the concept in population genetics of effective population size, N<sub>e</sub>, in which two populations with different numbers of individuals and different sex ratios might have the same effective population size and therefore respond similarly to the different population genetic forces. Thus two organisms, although they may differ in both the underlying genetic mechanisms and in the complexity of the environment in which they live, may have similar phenotypic complexities. The utility of the concept lies not in the implications it makes about specific phenotypes or genetic details, but in that it enables a general quantification of how an organism is affected by natural selection (the <italic>complexity</italic> with which natural selection acts), and furthermore, how this action affects the evolutionary dynamics of that organism <xref ref-type="bibr" rid="pone.0000217-Orr1">&#x0005b;6&#x0005d;</xref>.</p></sec><sec id="s3d"><title>Viral Estimates of Phenotypic Complexity</title><p>Unsurprisingly, our estimates of phenotypic complexity are orders of magnitude smaller than either the number of nucleotides or even the number of amino acids encoded by the genomes of these organisms (5386 bp and 11,161 bp in &#x003a6;X174 and VSV, respectively).
This agrees with the concept of phenotypic complexity that we have defined. Although mutations that occur at one nucleotide or amino acid do not affect those at another (<italic>i.e.</italic> they are genetically separable phenotypes), it is clearly unlikely that each nucleotide or amino acid is independently acted upon by natural selection. Secondly, each estimate of complexity is greater than the number of genes encoded by each virus (11 and 5 for &#x003a6;X174 and VSV, respectively). The presence of multiple functional domains within a single protein is consistent with an estimate of complexity that is greater than the number of encoded proteins.</p><p>Although we have only two estimates, we can briefly consider them from a comparative standpoint: although the genome size of &#x003a6;X174 is half that of VSV, our estimate of phenotypic complexity quantifies &#x003a6;X174 as being approximately four-fold more complex. It is notable, then, that &#x003a6;X174 contains approximately twice the number of genes as VSV. Additionally, the lifestyle of &#x003a6;X174 is arguably much more elaborate than that of VSV. &#x003a6;X174 interacts with several host factors in order to perform transcription and replication; 13 host factors are required for replication alone <xref ref-type="bibr" rid="pone.0000217-Shlomai1">&#x0005b;31&#x0005d;</xref>. This can be contrasted with VSV, in which transcription and replication are similar processes, both performed by the viral polymerase. Few host factors (and thus few interactions) are necessary at all during the entire life cycle of VSV <xref ref-type="bibr" rid="pone.0000217-Bose1">&#x0005b;32&#x0005d;</xref>.</p><p>These estimates suggest that, for very simple organisms such as viruses, phenotypic complexity correlates well with the number of genes in an organism, and more specifically, with the number of interactions characteristic of that organism <xref ref-type="bibr" rid="pone.0000217-Szathmary1">&#x0005b;2&#x0005d;</xref>.
This observation supports the idea that phenotypic complexity depends on the interactions between an organism and its environment. Genome size in itself seems to be a poor correlate of phenotypic complexity, a notable result in consideration of the very small genome sizes of these organisms. Whether such correlations or absence of correlation with gene number or genome length would hold for more complex organisms remains an open question. Nevertheless, by studying very simple organisms, we have shown that drift load could be used to estimate complexity in a novel and consistent way. We now propose that such a method could be helpful to identify and quantify the strongest determinants of biological complexity of higher organisms.</p><p>Although the theory presented here appears to be quite robust, it is too early to conclude that it is an accurate reflection of the underlying biology. To be studied in an FGM framework, organisms need to present at least one phenotypic property to selection. Additionally, populations, even those of very small size, should evolve towards a fitness equilibrium that is explicitly dependent on population size. We found data in the literature consistent with this expectation for one organism, VSV. We now provide further support for population size-dependent fitness equilibria by evolving populations of the bacteriophage &#x003a6;X174. Together, these two data sets suggest that evolutionary analyses using an FGM framework are a valid approach. Moreover, the use of very simple organisms such as viruses is useful for gaining insight into metrics of complexity, as for such simple organisms, gene number is likely to be a very good correlate of organismal complexity, and this should be reflected by the metric.
Although our observations are currently limited to two viral species, it is clear that at both a qualitative level (<italic>i.e.</italic> population size-dependent fitness equilibria) and a quantitative level (the number of phenotypic dimensions is reasonable), the predictions from FGM theory are borne out. An assessment of drift load and phenotypic complexity in a greater number of organisms is needed before further conclusions can be drawn.</p></sec><sec id="s3e"><title>Conclusions</title><p>Here we have presented a top-down approach to quantifying biological complexity. This can be contrasted with previously proposed metrics of complexity, which have relied on physically measurable quantities of the organism (bottom-up approaches). Two important conceptual differences separate these two approaches. Most importantly, phenotypic complexity is dependent on both the organism and the environmental context. An organism is not complex because it has many measurable phenotypes; it is complex because it has many phenotypes on which natural selection acts. Secondly, phenotypic complexity does not rely on artificially constructed concepts such as genes <xref ref-type="bibr" rid="pone.0000217-Pearson1">&#x0005b;33&#x0005d;</xref>. As an example, if two genes are deemed to be of equal complexity because they are functionally equivalent, such a measure necessarily ignores the subtle ways in which each may be regulated, or spliced, or expressed within the cell. Quantifying such multiple layers of complexity is difficult if the metric relies on physically measurable quantities.</p><p>However, phenotypic complexity remains an inherently abstract metric. It cannot aid in identifying the specific characteristics contributing to the complexity of an organism. Instead, it addresses the complexity with which natural selection views an organism, and the complexity with which an organism is capable of generating novel phenotypic variation.
For this reason, testing how phenotypic complexity compares to more traditional metrics of complexity (for example, the numbers of genes, protein interactions, or cellular pathways) may provide significant insight into biological systems. Finally, phenotypic complexity (and the resulting equilibrium drift load) affords a unique opportunity to contrast the action of natural selection between different organisms or different environments in a very general and unconstrained manner.</p></sec></sec><sec sec-type="methods" id="s4"><title>Methods</title><sec id="s4a"><title>Viral Evolution</title><p>The details of experimental evolution of &#x003a6;X174 have been described previously <xref ref-type="bibr" rid="pone.0000217-Silander1">&#x0005b;14&#x0005d;</xref>. Briefly, phage were mutagenized in 250 mM hydroxylamine, 1mM EDTA at 37&#x000b0;C for 140 minutes. Mutagenic treatment was stopped by 100 to 1000-fold dilution into fresh media, after which they were plated on LC agar plates containing a bacterial lawn and grown overnight at 32&#x000b0;C. From these plates, a number of plaques equal to the bottleneck size were randomly selected and diluted into culture tubes containing 3 ml of 1mM EDTA. These tubes were vortexed and centrifuged, after which 0.5 ml was removed to a fresh eppendorf tube. Chloroform was added, the tubes were vortexed and centrifuged, and 0.3 ml was removed. 
This stock was then used for further mutagenesis.</p></sec><sec id="s4b"><title>Appendix A: Derivation of Fitness Equilibria</title><p>Sella and Hirsh <xref ref-type="bibr" rid="pone.0000217-Sella1">&#x0005b;16&#x0005d;</xref> showed that mean equilibrium fitness could be written<disp-formula><graphic xlink:href="pone.0000217.e007.jpg" mimetype="image" position="float"/></disp-formula>in which &#x003bd;&#x0200a;&#x0003d;&#x0200a;2N<sub>e</sub>&#x02212;1 in the diploid case and 2N<sub>e</sub>&#x02212;2 in the haploid, and &#x003c1;(f) is the density function of fitness value f.</p><p>In an n-dimensional space, the density &#x003c1;(<italic>f</italic>) d<italic>f</italic> is derived from the hyper-sphere surface of radius <italic>x</italic>, with f&#x0200a;&#x0003d;&#x0200a;f(<italic>x</italic>), f(<italic>x</italic>) being the fitness function describing the dependency of fitness on the distance to the optimum, <italic>x</italic>. The surface of the hyper-sphere of radius <italic>x</italic> is &#x003a9;(<italic>n</italic>)<italic>x</italic><sup>(<italic>n</italic>&#x02212;1)</sup>, where &#x003a9;(<italic>n</italic>) is the unit radius hyper-sphere surface, &#x003a9;(<italic>n</italic>)&#x0200a;&#x0003d;&#x0200a;2&#x022c5;&#x003c0;<sup>(<italic>n</italic>/2)</sup>/&#x00393;(<italic>n</italic>/2).
We have therefore &#x003c1;(<italic>f</italic>)d<italic>f</italic>&#x0200a;&#x0003d;&#x0200a;&#x003a9;(<italic>n</italic>) <italic>x</italic><sup>(<italic>n</italic>&#x02212;1)</sup> d<italic>x</italic></p><p>If fitness is defined as f(<italic>x</italic>)&#x0200a;&#x0003d;&#x0200a;1&#x02212;<italic>x</italic>, then &#x003a9;(<italic>n</italic>) <italic>x</italic><sup>(<italic>n</italic>&#x02212;1)</sup> d<italic>x</italic>&#x0200a;&#x0003d;&#x0200a;&#x02212;&#x003a9;(<italic>n</italic>) (1&#x02212;<italic>f</italic>)<italic><sup>n</sup></italic><sup>&#x02212;1</sup> d<italic>f</italic> and<disp-formula><graphic xlink:href="pone.0000217.e008.jpg" mimetype="image" position="float"/></disp-formula></p><p>If fitness is defined as: f(<italic>x</italic>)&#x0200a;&#x0003d;&#x0200a;exp(&#x02212;<italic>x</italic><sup>Q</sup>) we have <disp-formula><graphic xlink:href="pone.0000217.e009.jpg" mimetype="image" position="float"/></disp-formula>and <disp-formula><graphic xlink:href="pone.0000217.e010.jpg" mimetype="image" position="float"/></disp-formula></p><p>This expression is independent of mutational properties.</p></sec><sec id="s4c"><title>Appendix B: robustness to assumptions</title><sec id="s4c1"><title>Slope of the fitness function</title><p>Note that if f(<italic>x</italic>)&#x0200a;&#x0003d;&#x0200a;exp(&#x02212;&#x003b1; <italic>x</italic><sup>Q</sup>)<disp-formula><graphic xlink:href="pone.0000217.e011.jpg" mimetype="image" position="float"/></disp-formula>and &#x02329;f&#x0232a; is not affected.</p></sec><sec id="s4c2"><title>Ellipsoidal fitness isoclines</title><p>Let us assume that f&#x0200a;&#x0003d;&#x0200a;exp(&#x02212;<italic>R</italic><sup>Q</sup>) where <italic>R</italic> is defined by <disp-formula><graphic xlink:href="pone.0000217.e012.jpg" mimetype="image" position="float"/></disp-formula>in which <bold>x</bold>&#x0200a;&#x0003d;&#x0200a;(<italic>x</italic><sub>1</sub>,<italic>x</italic><sub>2</sub>,&#x02026;,<italic>x</italic><sub>n</sub>) is the
position in the n-dimensional space and &#x003b1;<sub>i</sub> are positive numbers. We then have ellipsoidal fitness isoclines of semi-axes R/&#x003b1;<sub>i</sub>. As the volume of such an ellipsoid is <disp-formula><graphic xlink:href="pone.0000217.e013.jpg" mimetype="image" position="float"/></disp-formula>with <disp-formula><graphic xlink:href="pone.0000217.e014.jpg" mimetype="image" position="float"/></disp-formula> being the Euler Gamma function and the density &#x003c1;(<italic>f</italic>) d<italic>f</italic>&#x0200a;&#x0003d;&#x0200a;dV(<italic>f</italic>) d<italic>f</italic> is similar to the one found in the previous case <disp-formula><graphic xlink:href="pone.0000217.e015.jpg" mimetype="image" position="float"/></disp-formula>with<disp-formula><graphic xlink:href="pone.0000217.e016.jpg" mimetype="image" position="float"/></disp-formula></p><p>we therefore find the same value of &#x02329;f&#x0232a;, as the constant cancels out in the ratio of integrals. More generally, if fitness is defined as <disp-formula><graphic xlink:href="pone.0000217.e017.jpg" mimetype="image" position="float"/></disp-formula></p><p>We can show through recursions that this defines volumes <disp-formula><graphic xlink:href="pone.0000217.e018.jpg" mimetype="image" position="float"/></disp-formula>and that once again the equilibrium fitness remains unchanged.</p></sec></sec><sec id="s4d"><title>Appendix C: Maximum Likelihood Analysis</title><p>Sella and Hirsh showed that the probability of being at fitness <italic>f</italic> is <disp-formula><graphic xlink:href="pone.0000217.e019.jpg" mimetype="image" position="float"/></disp-formula></p><p>Using the previous derivations with f(<italic>x</italic>)&#x0200a;&#x0003d;&#x0200a;exp(&#x02212;<italic>x</italic><sup>Q</sup>), we find the probability that <italic>f</italic> lies between a and b is<disp-formula><graphic xlink:href="pone.0000217.e020.jpg" mimetype="image" position="float"/></disp-formula>with <disp-formula><graphic 
xlink:href="pone.0000217.e021.jpg" mimetype="image" position="float"/></disp-formula> being the generalized incomplete gamma function.</p><p>Because we do not know the maximum fitness f<sub>ref</sub>, we must estimate it, and therefore the fitness values a and b must be expressed relative to f<sub>ref</sub>.<disp-formula><graphic xlink:href="pone.0000217.e022.jpg" mimetype="image" position="float"/></disp-formula><disp-formula><graphic xlink:href="pone.0000217.e023.jpg" mimetype="image" position="float"/></disp-formula><disp-formula><graphic xlink:href="pone.0000217.e024.jpg" mimetype="image" position="float"/></disp-formula></p></sec></sec></body><back><ack><p>We would like to thank Art Poon, Dan Weinreich, and Thomas Berngruber for valuable discussions.</p></ack><ref-list><title>References</title><ref id="pone.0000217-McShea1"><label>1</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>McShea</surname><given-names>DW</given-names></name></person-group><year>1996</year><article-title>Metazoan complexity and evolution: Is there a trend?
Perspective.</article-title><source>Evolution</source><volume>50</volume><fpage>477</fpage><lpage>492</lpage></citation></ref><ref id="pone.0000217-Szathmary1"><label>2</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Szathmary</surname><given-names>E</given-names></name><name><surname>Jordan</surname><given-names>F</given-names></name><name><surname>Pal</surname><given-names>C</given-names></name></person-group><year>2001</year><article-title>Molecular biology and evolution - Can genes explain biological complexity?</article-title><source>Science</source><volume>292</volume><fpage>1315</fpage><lpage>1316</lpage><pub-id pub-id-type="pmid">11360989</pub-id></citation></ref><ref id="pone.0000217-Carroll1"><label>3</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Carroll</surname><given-names>SB</given-names></name></person-group><year>2001</year><article-title>Chance and necessity: the evolution of morphological complexity and diversity.</article-title><source>Nature</source><volume>409</volume><fpage>1102</fpage><lpage>1109</lpage><pub-id pub-id-type="pmid">11234024</pub-id></citation></ref><ref id="pone.0000217-Adami1"><label>4</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Adami</surname><given-names>C</given-names></name></person-group><year>2002</year><article-title>What is complexity?</article-title><source>Bioessays</source><volume>24</volume><fpage>1085</fpage><lpage>1094</lpage><pub-id pub-id-type="pmid">12447974</pub-id></citation></ref><ref id="pone.0000217-Adami2"><label>5</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Adami</surname><given-names>C</given-names></name><name><surname>Ofria</surname><given-names>C</given-names></name><name><surname>Collier</surname><given-names>TC</given-names></name></person-group><year>2000</year><article-title>Evolution of 
biological complexity.</article-title><source>Proceedings of the National Academy of Sciences of the United States of America</source><volume>97</volume><fpage>4463</fpage><lpage>4468</lpage><pub-id pub-id-type="pmid">10781045</pub-id></citation></ref><ref id="pone.0000217-Orr1"><label>6</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Orr</surname><given-names>HA</given-names></name></person-group><year>2000</year><article-title>Adaptation and the cost of complexity.</article-title><source>Evolution</source><volume>54</volume><fpage>13</fpage><lpage>20</lpage><pub-id pub-id-type="pmid">10937178</pub-id></citation></ref><ref id="pone.0000217-Whitlock1"><label>7</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Whitlock</surname><given-names>MC</given-names></name><name><surname>Griswold</surname><given-names>CK</given-names></name><name><surname>Peters</surname><given-names>AD</given-names></name></person-group><year>2003</year><article-title>Compensating for the meltdown: The critical effective size of a population with deleterious and compensatory mutations.</article-title><source>Annales Zoologici Fennici</source><volume>40</volume><fpage>169</fpage><lpage>183</lpage></citation></ref><ref id="pone.0000217-Welch1"><label>8</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Welch</surname><given-names>JJ</given-names></name><name><surname>Waxman</surname><given-names>D</given-names></name></person-group><year>2003</year><article-title>Modularity and the cost of complexity.</article-title><source>Evolution</source><volume>57</volume><fpage>1723</fpage><lpage>1734</lpage><pub-id pub-id-type="pmid">14503615</pub-id></citation></ref><ref id="pone.0000217-Hartl1"><label>9</label><citation citation-type="journal"><person-group 
person-group-type="author"><name><surname>Hartl</surname><given-names>DL</given-names></name><name><surname>Taubes</surname><given-names>CH</given-names></name></person-group><year>1998</year><article-title>Towards a theory of evolutionary adaptation.</article-title><source>Genetica</source><volume>103</volume><fpage>525</fpage><lpage>533</lpage><pub-id pub-id-type="pmid">9720296</pub-id></citation></ref><ref id="pone.0000217-Poon1"><label>10</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Poon</surname><given-names>A</given-names></name><name><surname>Otto</surname><given-names>SP</given-names></name></person-group><year>2000</year><article-title>Compensating for our load of mutations: Freezing the meltdown of small populations.</article-title><source>Evolution</source><volume>54</volume><fpage>1467</fpage><lpage>1479</lpage><pub-id pub-id-type="pmid">11108576</pub-id></citation></ref><ref id="pone.0000217-Fisher1"><label>11</label><citation citation-type="book"><person-group person-group-type="author"><name><surname>Fisher</surname><given-names>RA</given-names></name></person-group><year>1930</year><source>The Genetical Theory of Natural Selection.</source><publisher-loc>Oxford</publisher-loc><publisher-name>Clarendon Press</publisher-name><fpage>318 p</fpage></citation></ref><ref id="pone.0000217-Burch1"><label>12</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Burch</surname><given-names>CL</given-names></name><name><surname>Chao</surname><given-names>L</given-names></name></person-group><year>1999</year><article-title>Evolution by small steps and rugged landscapes in the RNA virus phi 6.</article-title><source>Genetics</source><volume>151</volume><fpage>921</fpage><lpage>927</lpage><pub-id pub-id-type="pmid">10049911</pub-id></citation></ref><ref id="pone.0000217-Estes1"><label>13</label><citation citation-type="journal"><person-group 
person-group-type="author"><name><surname>Estes</surname><given-names>S</given-names></name><name><surname>Phillips</surname><given-names>PC</given-names></name><name><surname>Denver</surname><given-names>DR</given-names></name><name><surname>Thomas</surname><given-names>WK</given-names></name><name><surname>Lynch</surname><given-names>M</given-names></name></person-group><year>2004</year><article-title>Mutation accumulation in populations of varying size: The distribution of mutational effects for fitness correlates in Caenorhabditis elegans.</article-title><source>Genetics</source><volume>166</volume><fpage>1269</fpage><lpage>1279</lpage><pub-id pub-id-type="pmid">15082546</pub-id></citation></ref><ref id="pone.0000217-Silander1"><label>14</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Silander</surname><given-names>OK</given-names></name><name><surname>Tenaillon</surname><given-names>O</given-names></name><name><surname>Chao</surname><given-names>L</given-names></name></person-group><year>2007</year><article-title>Understanding the evolutionary fate of finite size populations: The dynamics of mutational effects.</article-title><source>PLoS Biology</source><volume>In press</volume></citation></ref><ref id="pone.0000217-Wagner1"><label>15</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wagner</surname><given-names>GP</given-names></name><name><surname>Gabriel</surname><given-names>W</given-names></name></person-group><year>1990</year><article-title>Quantitative Variation in Finite Parthenogenetic Populations - What Stops Mullers Ratchet in the Absence of Recombination.</article-title><source>Evolution</source><volume>44</volume><fpage>715</fpage><lpage>731</lpage></citation></ref><ref id="pone.0000217-Sella1"><label>16</label><citation citation-type="journal"><person-group
person-group-type="author"><name><surname>Sella</surname><given-names>G</given-names></name><name><surname>Hirsh</surname><given-names>AE</given-names></name></person-group><year>2005</year><article-title>The application of statistical physics to evolutionary biology.</article-title><source>Proceedings of the National Academy of Sciences of the United States of America</source><volume>102</volume><fpage>9541</fpage><lpage>9546</lpage><pub-id pub-id-type="pmid">15980155</pub-id></citation></ref><ref id="pone.0000217-Burch2"><label>17</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Burch</surname><given-names>CL</given-names></name><name><surname>Chao</surname><given-names>L</given-names></name></person-group><year>2004</year><article-title>Epistasis and Its Relationship to Canalization in the RNA Virus Phi-6.</article-title><source>Genetics</source><volume>167</volume><fpage>559</fpage><lpage>567</lpage><pub-id pub-id-type="pmid">15238511</pub-id></citation></ref><ref id="pone.0000217-Bonhoeffer1"><label>18</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bonhoeffer</surname><given-names>S</given-names></name><name><surname>Chappey</surname><given-names>C</given-names></name><name><surname>Parkin</surname><given-names>NT</given-names></name><name><surname>Whitcomb</surname><given-names>JM</given-names></name><name><surname>Petropoulos</surname><given-names>CJ</given-names></name></person-group><year>2004</year><article-title>Evidence for positive epistasis in HIV-1.</article-title><source>Science</source><volume>306</volume><fpage>1547</fpage><lpage>1550</lpage><pub-id pub-id-type="pmid">15567861</pub-id></citation></ref><ref id="pone.0000217-Sanjuan1"><label>19</label><citation citation-type="journal"><person-group 
person-group-type="author"><name><surname>Sanjuan</surname><given-names>R</given-names></name><name><surname>Moya</surname><given-names>A</given-names></name><name><surname>Elena</surname><given-names>SF</given-names></name></person-group><year>2004</year><article-title>The contribution of epistasis to the architecture of fitness in an RNA virus.</article-title><source>Proceedings of the National Academy of Sciences of the United States of America</source><volume>101</volume><fpage>15376</fpage><lpage>15379</lpage><pub-id pub-id-type="pmid">15492220</pub-id></citation></ref><ref id="pone.0000217-Elena1"><label>20</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Elena</surname><given-names>SF</given-names></name><name><surname>Lenski</surname><given-names>RE</given-names></name></person-group><year>1997</year><article-title>Test of synergistic interactions among deleterious mutations in bacteria.</article-title><source>Nature</source><volume>390</volume><fpage>395</fpage><lpage>398</lpage><pub-id pub-id-type="pmid">9389477</pub-id></citation></ref><ref id="pone.0000217-Martin1"><label>21</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Martin</surname><given-names>G</given-names></name><name><surname>Lenormand</surname><given-names>T</given-names></name></person-group><year>2006</year><article-title>A general multivariate extension of Fisher's geometrical model and the distribution of mutation fitness effects across species.</article-title><source>Evolution</source><volume>60</volume><fpage>893</fpage><lpage>907</lpage><pub-id pub-id-type="pmid">16817531</pub-id></citation></ref><ref id="pone.0000217-Novella1"><label>22</label><citation citation-type="journal"><person-group 
person-group-type="author"><name><surname>Novella</surname><given-names>IS</given-names></name><name><surname>Elena</surname><given-names>SF</given-names></name><name><surname>Moya</surname><given-names>A</given-names></name><name><surname>Domingo</surname><given-names>E</given-names></name><name><surname>Holland</surname><given-names>JJ</given-names></name></person-group><year>1995</year><article-title>Size of Genetic Bottlenecks Leading to Virus Fitness Loss Is Determined by Mean Initial Population Fitness.</article-title><source>Journal of Virology</source><volume>69</volume><fpage>2869</fpage><lpage>2872</lpage><pub-id pub-id-type="pmid">7707510</pub-id></citation></ref><ref id="pone.0000217-Wagner2"><label>23</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wagner</surname><given-names>GP</given-names></name><name><surname>Altenberg</surname><given-names>L</given-names></name></person-group><year>1996</year><article-title>Perspective: Complex adaptations and the evolution of evolvability.</article-title><source>Evolution</source><volume>50</volume><fpage>967</fpage><lpage>976</lpage></citation></ref><ref id="pone.0000217-Bull1"><label>24</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bull</surname><given-names>JJ</given-names></name><name><surname>Badgett</surname><given-names>MR</given-names></name><name><surname>Wichman</surname><given-names>HA</given-names></name><name><surname>Huelsenbeck</surname><given-names>JP</given-names></name><name><surname>Hillis</surname><given-names>DM</given-names></name><etal/></person-group><year>1997</year><article-title>Exceptional convergent evolution in a virus.</article-title><source>Genetics</source><volume>147</volume><fpage>1497</fpage><lpage>1507</lpage><pub-id pub-id-type="pmid">9409816</pub-id></citation></ref><ref id="pone.0000217-Fong1"><label>25</label><citation citation-type="journal"><person-group 
person-group-type="author"><name><surname>Fong</surname><given-names>SS</given-names></name><name><surname>Joyce</surname><given-names>AR</given-names></name><name><surname>Palsson</surname><given-names>BO</given-names></name></person-group><year>2005</year><article-title>Parallel adaptive evolution cultures of Escherichia coli lead to convergent growth phenotypes with different gene expression states.</article-title><source>Genome Research</source><volume>15</volume><fpage>1365</fpage><lpage>1372</lpage><pub-id pub-id-type="pmid">16204189</pub-id></citation></ref><ref id="pone.0000217-Fong2"><label>26</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Fong</surname><given-names>SS</given-names></name><name><surname>Palsson</surname><given-names>BO</given-names></name></person-group><year>2004</year><article-title>Metabolic gene-deletion strains of Escherichia coli evolve to computationally predicted growth phenotypes.</article-title><source>Nature Genetics</source><volume>36</volume><fpage>1056</fpage><lpage>1058</lpage><pub-id pub-id-type="pmid">15448692</pub-id></citation></ref><ref id="pone.0000217-Woods1"><label>27</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Woods</surname><given-names>R</given-names></name><name><surname>Schneider</surname><given-names>D</given-names></name><name><surname>Winkworth</surname><given-names>CL</given-names></name><name><surname>Riley</surname><given-names>MA</given-names></name><name><surname>Lenski</surname><given-names>RE</given-names></name></person-group><year>2006</year><article-title>Tests of parallel molecular evolution in a long-term experiment with Escherichia coli.</article-title><source>Proceedings of the National Academy of Sciences of the United States of America</source><volume>103</volume><fpage>9107</fpage><lpage>9112</lpage><pub-id pub-id-type="pmid">16751270</pub-id></citation></ref><ref 
id="pone.0000217-Travisano1"><label>28</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Travisano</surname><given-names>M</given-names></name><name><surname>Mongold</surname><given-names>JA</given-names></name><name><surname>Bennett</surname><given-names>AF</given-names></name><name><surname>Lenski</surname><given-names>RE</given-names></name></person-group><year>1995</year><article-title>Experimental Tests of the Roles of Adaptation, Chance, and History in Evolution.</article-title><source>Science</source><volume>267</volume><fpage>87</fpage><lpage>90</lpage><pub-id pub-id-type="pmid">7809610</pub-id></citation></ref><ref id="pone.0000217-Schrag1"><label>29</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Schrag</surname><given-names>SJ</given-names></name><name><surname>Perrot</surname><given-names>V</given-names></name><name><surname>Levin</surname><given-names>BR</given-names></name></person-group><year>1997</year><article-title>Adaptation to the fitness costs of antibiotic resistance in Escherichia coli.</article-title><source>Proceedings of the Royal Society of London Series B-Biological Sciences</source><volume>264</volume><fpage>1287</fpage><lpage>1291</lpage></citation></ref><ref id="pone.0000217-Reynolds1"><label>30</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Reynolds</surname><given-names>MG</given-names></name></person-group><year>2000</year><article-title>Compensatory evolution in rifampin-resistant Escherichia coli.</article-title><source>Genetics</source><volume>156</volume><fpage>1471</fpage><lpage>1481</lpage><pub-id pub-id-type="pmid">11102350</pub-id></citation></ref><ref id="pone.0000217-Shlomai1"><label>31</label><citation citation-type="journal"><person-group 
person-group-type="author"><name><surname>Shlomai</surname><given-names>J</given-names></name><name><surname>Polder</surname><given-names>L</given-names></name><name><surname>Arai</surname><given-names>K</given-names></name><name><surname>Kornberg</surname><given-names>A</given-names></name></person-group><year>1981</year><article-title>Replication of Phi-X174 DNA with Purified Enzymes .1. Conversion of Viral-DNA to a Supercoiled, Biologically-Active Duplex.</article-title><source>Journal of Biological Chemistry</source><volume>256</volume><fpage>5233</fpage><lpage>5238</lpage><pub-id pub-id-type="pmid">6262323</pub-id></citation></ref><ref id="pone.0000217-Bose1"><label>32</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bose</surname><given-names>S</given-names></name><name><surname>Mathur</surname><given-names>M</given-names></name><name><surname>Bates</surname><given-names>P</given-names></name><name><surname>Joshi</surname><given-names>N</given-names></name><name><surname>Banerjee</surname><given-names>AK</given-names></name></person-group><year>2003</year><article-title>Requirement for cyclophilin A for the replication of vesicular stomatitis virus New Jersey serotype.</article-title><source>Journal of General Virology</source><volume>84</volume><fpage>1687</fpage><lpage>1699</lpage><pub-id pub-id-type="pmid">12810862</pub-id></citation></ref><ref id="pone.0000217-Pearson1"><label>33</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Pearson</surname><given-names>H</given-names></name></person-group><year>2006</year><article-title>What is a gene?</article-title><source>Nature</source><volume>441</volume><fpage>398</fpage><lpage>401</lpage><pub-id pub-id-type="pmid">16724031</pub-id></citation></ref></ref-list><fn-group><fn fn-type="conflict"><p><bold>Competing Interests: </bold>The authors have declared that no competing interests exist.</p></fn><fn 
fn-type="financial-disclosure"><p><bold>Funding: </bold>OT was funded by the Agence Nationale de la Recherche (ANR-05-JCJC-0136-01). OS was partially funded by an NIH training grant. LC was funded by an NIH grant.</p></fn></fn-group></back></article>