Permalink
Cannot retrieve contributors at this time
Fetching contributors…
| <?xml version="1.0" encoding="UTF-8"?><!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Archiving and Interchange DTD v1.1d1 20130915//EN" "JATS-archivearticle1.dtd"><article article-type="research-article" dtd-version="1.1d1" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink"><front><journal-meta><journal-id journal-id-type="nlm-ta">eLife</journal-id><journal-id journal-id-type="hwp">elife</journal-id><journal-id journal-id-type="publisher-id">eLife</journal-id><journal-title-group><journal-title>eLife</journal-title></journal-title-group><issn publication-format="electronic">2050-084X</issn><publisher><publisher-name>eLife Sciences Publications, Ltd</publisher-name></publisher></journal-meta><article-meta><article-id pub-id-type="publisher-id">00093</article-id><article-id pub-id-type="doi">10.7554/eLife.00093</article-id><article-categories><subj-group subj-group-type="display-channel"><subject>Research article</subject></subj-group><subj-group subj-group-type="heading"><subject>Microbiology and infectious disease</subject></subj-group></article-categories><title-group><article-title>Population structuring of multi-copy, antigen-encoding genes in <italic>Plasmodium falciparum</italic></article-title></title-group><contrib-group><contrib contrib-type="author" corresp="yes" id="author-1321"><name><surname>Artzy-Randrup</surname><given-names>Yael</given-names></name><xref ref-type="aff" rid="aff1"/><xref ref-type="corresp" rid="cor1">*</xref><xref ref-type="fn" rid="con1"/><xref ref-type="fn" rid="conf2"/></contrib><contrib contrib-type="author" id="author-1816"><name><surname>Rorick</surname><given-names>Mary M</given-names></name><xref ref-type="aff" rid="aff1"/><xref ref-type="fn" rid="con2"/><xref ref-type="fn" rid="conf2"/></contrib><contrib contrib-type="author" id="author-1817"><name><surname>Day</surname><given-names>Karen</given-names></name><xref ref-type="aff" rid="aff2"/><xref ref-type="other" rid="par-1"/><xref ref-type="other" rid="par-2"/><xref ref-type="fn" rid="con3"/><xref ref-type="fn" rid="conf2"/></contrib><contrib contrib-type="author" id="author-1818"><name><surname>Chen</surname><given-names>Donald</given-names></name><xref ref-type="aff" rid="aff3"/><xref ref-type="other" rid="par-2"/><xref ref-type="other" rid="par-3"/><xref ref-type="fn" rid="con4"/><xref ref-type="fn" rid="conf2"/></contrib><contrib contrib-type="author" id="author-1819"><name><surname>Dobson</surname><given-names>Andrew P</given-names></name><xref ref-type="aff" rid="aff4"/><xref ref-type="aff" rid="aff5"/><xref ref-type="other" rid="par-4"/><xref ref-type="fn" rid="con5"/><xref ref-type="fn" rid="conf2"/></contrib><contrib contrib-type="author" id="author-1158"><name><surname>Pascual</surname><given-names>Mercedes</given-names></name><xref ref-type="aff" rid="aff1"/><xref ref-type="aff" rid="aff5"/><xref ref-type="fn" rid="con6"/><xref ref-type="fn" rid="conf1"/></contrib><aff id="aff1"><institution content-type="dept">Department of Ecology and Evolutionary Biology</institution>, <institution>Howard Hughes Medical Institute and the University of Michigan</institution>, <addr-line><named-content content-type="city">Ann Arbor</named-content></addr-line>, <country>United States</country></aff><aff id="aff2"><institution content-type="dept">Department of Microbiology, Division of Medical Parasitology</institution>, <institution>New York University School of Medicine</institution>, <addr-line><named-content content-type="city">New York</named-content></addr-line>, <country>United States</country></aff><aff id="aff3"><institution content-type="dept">Department of Microbiology, Division of Medical Parasitology and Department of Medicine, Division of Infectious Disease</institution>, <institution>New York University School of Medicine</institution>, <addr-line><named-content content-type="city">New York</named-content></addr-line>, <country>United States</country></aff><aff id="aff4"><institution content-type="dept">Department of Ecology and Evolutionary Biology</institution>, <institution>Princeton University</institution>, <addr-line><named-content content-type="city">Princeton</named-content></addr-line>, <country>United States</country></aff><aff id="aff5"><institution>Santa Fe Institute</institution>, <addr-line><named-content content-type="city">Santa Fe</named-content></addr-line>, <country>United States</country></aff></contrib-group><contrib-group content-type="section"><contrib contrib-type="editor"><name><surname>Bergstrom</surname><given-names>Carl T</given-names></name><role>Reviewing editor</role><aff><institution>University of Washington</institution><country>United States</country></aff></contrib></contrib-group><author-notes><corresp id="cor1"><label>*</label>For correspondence: <email>yartzy@umich.edu</email></corresp></author-notes><pub-date date-type="pub" publication-format="electronic"><day>18</day><month>12</month><year>2012</year></pub-date><pub-date pub-type="collection"><year>2012</year></pub-date><volume>1</volume><elocation-id>e00093</elocation-id><history><date date-type="received"><day>24</day><month>07</month><year>2012</year></date><date date-type="accepted"><day>04</day><month>10</month><year>2012</year></date></history><permissions><copyright-statement>© 2012, Artzy-Randrup et al</copyright-statement><copyright-year>2012</copyright-year><copyright-holder>Artzy-Randrup et al</copyright-holder><license xlink:href="http://creativecommons.org/licenses/by/3.0/"><license-p>This article is distributed under the terms of the <ext-link ext-link-type="uri" xlink:href="http://creativecommons.org/licenses/by/3.0/">Creative Commons Attribution License</ext-link>, which permits unrestricted use and redistribution provided that the original author and source are credited.</license-p></license></permissions><self-uri content-type="pdf" xlink:href="elife00093.pdf"/><related-article ext-link-type="doi" id="ra1" related-article-type="commentary" xlink:href="10.7554/eLife.00385"/><abstract><object-id pub-id-type="doi">10.7554/eLife.00093.001</object-id><p>The coexistence of multiple independently circulating strains in pathogen populations that undergo sexual recombination is a central question of epidemiology with profound implications for control. An agent-based model is developed that extends earlier ‘strain theory’ by addressing the <italic>var</italic> gene family of <italic>Plasmodium falciparum</italic>. The model explicitly considers the extensive diversity of multi-copy genes that undergo antigenic variation via sequential, mutually exclusive expression. It tracks the dynamics of all unique <italic>var</italic> repertoires in a population of hosts, and shows that even under high levels of sexual recombination, strain competition mediated through cross-immunity structures the parasite population into a subset of coexisting dominant repertoires of <italic>var</italic> genes whose degree of antigenic overlap depends on transmission intensity. Empirical comparison of patterns of genetic variation at antigenic and neutral sites supports this role for immune selection in structuring parasite diversity.</p><p><bold>DOI:</bold> <ext-link ext-link-type="doi" xlink:href="10.7554/eLife.00093.001">http://dx.doi.org/10.7554/eLife.00093.001</ext-link></p></abstract><abstract abstract-type="executive-summary"><object-id pub-id-type="doi">10.7554/eLife.00093.002</object-id><title>eLife digest</title><p>Malaria is an infectious disease that is estimated to kill more than half a million people every year, mostly young children in Africa. It is spread by mosquitos that are infected with <italic>Plasmodium</italic> parasites that attack red blood cells in the human body. <italic>Plasmodium falciparum</italic>, the species that is responsible for most of these deaths, causes malaria by entering red blood cells and releasing antigens that travel to the surface of the cells, where they change the adhesion properties. This causes the infected red blood cells to accumulate in small blood vessels, surface capillaries or the brain, which can have severe consequences for the person infected.</p><p><italic>P. falciparum</italic> is particularly dangerous because of its ability to vary the antigens displayed on the cell surface: this process, known as antigenic variation, helps to maintain infections for extended periods of time by allowing the antigens to stay one step ahead of the immune system (a process known as immune escape). The origins of antigenic variation lie in the fact that each <italic>P. falciparum</italic> genome has a repertoire of between 50 and 60 <italic>var</italic> genes that code for the variability of a major antigen that is responsible for immune escape in malaria. Molecular sequencing has shown that local parasite populations contain thousands of different types of <italic>var</italic> genes: hence, meiotic recombination in the mosquito can create a vast number of combinations of <italic>var</italic> repertoires.</p><p>Artzy-Randrup et al. have developed a computational model of this highly diverse and complex system to address the following question: is a local pathogen population composed of largely random and ephemeral repertoires of these genes, or is it structured into independently circulating strains? Their model goes beyond previous models by including interactions within the local host population that arise as a result of indirect competition between different strains of the pathogen for available hosts: this competition is influenced by the history of infection and, therefore, by the patterns of immunity within the host population. Previous models included within-host processes but not these higher, local population-level interactions.</p><p>The model simulates the dynamics of all the unique combinations of <italic>var</italic> genes in a population of hosts, and shows that even with high rates of reproduction, the parasite population self-organizes into a limited number of coexisting strains: the distinct <italic>var</italic> repertoires of these strains only weakly overlap, suggesting that the immune response of the host population has been partitioned into distinct niches. By investigating genetic variation at both antigenic sites and regions of the genome that do not code for antigens, Artzy-Randrup et al. suggest that immune selection—the selection imposed on <italic>var</italic> repertoires by the build up of specific immunity at the population level—plays a central role in structuring parasite diversity.</p><p>The new model should lead to a better understanding of the epidemiology of <italic>Plasmodium</italic> and other pathogens that work in similar ways, including <italic>Trypanosoma brucei</italic> (sleeping sickness), <italic>Borellia burgdorferi</italic> (Lyme disease) and <italic>Giardia lamblia</italic> (gastroenteritis), and help with global efforts to eliminate malaria and other diseases.</p><p><bold>DOI:</bold> <ext-link ext-link-type="doi" xlink:href="10.7554/eLife.00093.002">http://dx.doi.org/10.7554/eLife.00093.002</ext-link></p></abstract><kwd-group kwd-group-type="author-keywords"><title>Author keywords</title><kwd>parasite population structure</kwd><kwd>epidemiological dynamics</kwd><kwd>antigenic diversity</kwd><kwd>immune selection</kwd><kwd>Plasmodium falciparum</kwd><kwd>var multi-gene family</kwd></kwd-group><kwd-group kwd-group-type="research-organism"><title>Research organism</title><kwd>Other</kwd></kwd-group><funding-group><award-group id="par-1"><funding-source><institution-wrap><institution>The Wellcome Trust Programme</institution></institution-wrap></funding-source><award-id>Grant 041354</award-id><principal-award-recipient><name><surname>Day</surname><given-names>Karen</given-names></name></principal-award-recipient></award-group><award-group id="par-2"><funding-source><institution-wrap><institution>National Institutes of Health/National Institute of General Medical Sciences</institution></institution-wrap></funding-source><award-id>GM061351-07</award-id><principal-award-recipient><name><surname>Day</surname><given-names>Karen</given-names></name><name><surname>Chen</surname><given-names>Donald</given-names></name></principal-award-recipient></award-group><award-group id="par-3"><funding-source><institution-wrap><institution>National Institutes of Health Ruth L. Kirschstein National Research Service Award</institution></institution-wrap></funding-source><award-id>F32AI071765</award-id><principal-award-recipient><name><surname>Chen</surname><given-names>Donald</given-names></name></principal-award-recipient></award-group><award-group id="par-4"><funding-source><institution-wrap><institution>McDonnell Foundation</institution></institution-wrap></funding-source><principal-award-recipient><name><surname>Dobson</surname><given-names>Andrew P</given-names></name></principal-award-recipient></award-group><funding-statement>The funders had no role in study design, data collection and interpretation, or the decision to submit the work for publication.</funding-statement></funding-group><custom-meta-group><custom-meta><meta-name>elife-xml-version</meta-name><meta-value>2</meta-value></custom-meta><custom-meta specific-use="meta-only"><meta-name>Author impact statement</meta-name><meta-value>Mathematical modeling shows that local populations of the malaria parasite self-organize into a limited number of transient but distinct strains through competition for hosts in immunity space.</meta-value></custom-meta></custom-meta-group></article-meta></front><body><sec id="s1" sec-type="intro"><title>Introduction</title><p>Many pathogen populations seem to be composed of several independent strains; this has important implications for disease surveillance and control, as well as for the identification of vaccine targets. In particular, the population genetic interactions between pathogen strains can have significant epidemiological consequences, influencing transmissibility, clinical immunity, and the duration and severity of infection. An extensive variety of microparasites have been studied in this context: protozoa, such as <italic>Plasmodium falciparum</italic>, <italic>Leishmania</italic>, and <italic>Trypanosoma brucei</italic>; viruses, such as <italic>Influenza</italic>, <italic>HIV</italic> and <italic>Dengue</italic>; and bacteria, such as <italic>E. coli</italic>, <italic>Bordetella spp.</italic> and <italic>Neisseria meningitides</italic> (<xref ref-type="bibr" rid="bib52">Tibayrenc et al., 1990</xref>; <xref ref-type="bibr" rid="bib33">Gupta et al., 1994</xref>; <xref ref-type="bibr" rid="bib51">Tibayrenc and Ayala, 2002</xref>).</p><p>The conceptual challenges and significant human health implications associated with the pathogen population structure have led to the establishment of several theories for why we observe this structure in nature (<xref ref-type="bibr" rid="bib46">Selander et al., 1987</xref>; <xref ref-type="bibr" rid="bib52">Tibayrenc et al., 1990</xref>; <xref ref-type="bibr" rid="bib48">Smith et al., 1993</xref>; <xref ref-type="bibr" rid="bib30">Gupta and Day, 1994a</xref>, <xref ref-type="bibr" rid="bib31">1994b</xref>; <xref ref-type="bibr" rid="bib32">Gupta et al., 1996</xref>; <xref ref-type="bibr" rid="bib50">Tibayrenc, 1994</xref>). In particular, while it would seem that sufficient out-crossing should always lead to random associations between alleles (<xref ref-type="bibr" rid="bib52">Tibayrenc et al., 1990</xref>; <xref ref-type="bibr" rid="bib51">Tibayrenc and Ayala, 2002</xref>) and preclude the persistence of ‘independently transmitted strains’ (<xref ref-type="bibr" rid="bib50">Tibayrenc, 1994</xref>), mathematical models of competition between pathogen strains have demonstrated that immune selection can lead to the maintenance of discrete, non-overlapping, antigenic repertoires—even when antigenic variability is driven by several unlinked genes that undergo recombination (<xref ref-type="bibr" rid="bib32">Gupta et al., 1996</xref>; <xref ref-type="bibr" rid="bib29">Gupta and Anderson, 1999</xref>). An inherent challenge in testing ‘strain theory’ is to determine whether observed empirical patterns in pathogen population structure result from immune selection, or alternatively, from simple demographic processes (i.e., uneven relatedness among individuals in the pathogen population that can result from random genetic drift, particularly within the complex context of transmission dynamics) (<xref ref-type="bibr" rid="bib10">Buckee et al., 2008</xref>, <xref ref-type="bibr" rid="bib11">2011</xref>).</p><p><italic>P. falciparum</italic> is responsible for the deadliest type of malaria in humans. The complexities of its population genetics, in terms of the variable and often enormous levels of sequence variation observed at antigenic sites within local populations, are intimately tied to both its pathology and its ability to escape immune detection. While this genetic complexity provides significant challenges to malaria research and control, it also provides an opportunity to extend existing strain theory in a way that can be tested empirically. Specifically, an important extension of earlier strain theory is to consider the effects of immune selection in populations of pathogens whose antigen-encoding loci are: (a) multi-copy and recombining (i.e., located on different chromosomes of a haploid genome), and (b) undergoing antigenic variation via sequential, mutually exclusive expression within an infected host. It is not clear whether a stable strain structure would emerge under the sequential expression of multi-copy genes. Consideration of this type of system provides a more complete framework for understanding antigenic structure and its epidemiological consequences in a broader variety of pathogens; it also offers the opportunity to distinguish the effects of immune selection from those of neutral demographic forces, providing testable predictions for these two alternative mechanisms.</p><p>We describe an agent-based model that extends strain theory to address the effect of immune selection acting on multi-copy antigen genes; we use the <italic>var</italic> gene family of <italic>P. falciparum</italic> as the basis for this model. The <italic>var</italic> genes encode <italic>P. falciparum</italic> erythrocyte membrane protein 1 (PfEMP1)—the major surface antigen of the parasite's blood stages that binds to host endothelial cell receptors to allow the parasite to sequester within various host tissues (<xref ref-type="bibr" rid="bib39">Miller et al., 2002</xref>; <xref ref-type="bibr" rid="bib45">Scherf et al., 2008</xref>). <italic>Var</italic> genes are composed of multiple Duffy-binding-like (DBL) and cysteine-interdomain-rich (CIDR) domains that encode binding functions for specific endothelial receptors. DBLα, is the only domain found in nearly all <italic>var</italic> genes (<xref ref-type="bibr" rid="bib39">Miller et al., 2002</xref>), and hence is the most informative molecular marker of <italic>var</italic> gene diversity. Each parasite genome has up to 60 <italic>var</italic> genes, and differential sequential expression of these genes allows the parasite to evade the host immune response and establish a chronic infection. This clonal antigenic variation sensu stricto (<xref ref-type="bibr" rid="bib39">Miller et al., 2002</xref>; <xref ref-type="bibr" rid="bib45">Scherf et al., 2008</xref>) extends the duration of infection to facilitate transmission to the mosquito. Not only do <italic>var</italic> genes influence transmission, but specific <italic>var</italic> genes are associated with severe malarial disease and specific PfEMP1 binding phenotypes (<xref ref-type="bibr" rid="bib20">Deitsch et al., 2009</xref>; <xref ref-type="bibr" rid="bib15">Chan et al., 2012</xref>; <xref ref-type="bibr" rid="bib17">Claessens et al., 2012</xref>; <xref ref-type="bibr" rid="bib38">Lavstsen et al., 2012</xref>; <xref ref-type="bibr" rid="bib54">Warimwe et al., 2012</xref>).</p><p>Population studies have shown that individual <italic>P. falciparum</italic> genomes have distinct repertoires of <italic>var</italic> genes (<xref ref-type="bibr" rid="bib2">Barry et al., 2007</xref>; <xref ref-type="bibr" rid="bib45">Scherf et al., 2008</xref>; <xref ref-type="bibr" rid="bib16">Chen et al., 2011</xref>) that extensively recombine (<xref ref-type="bibr" rid="bib26">Freitas-Junior et al., 2000</xref>; <xref ref-type="bibr" rid="bib49">Taylor et al., 2000</xref>) during sexual recombination in the mosquito (<xref ref-type="bibr" rid="bib42">Paul et al., 1995</xref>). The immense sequence diversity observed among <italic>var</italic> genes and <italic>var</italic> repertoires has been attributed to high rates of meiotic (and possibly also mitotic) recombination. These high rates of recombination presumably allow for very low linkage disequilibrium among <italic>var</italic> loci. Our modeling framework considers the dynamics shaping the enormous potential diversity of genomic repertoires of <italic>var</italic> genes by tracking all possible <italic>var</italic> repertoires, given a diverse pool of genetic variants. We explore whether structured parasite populations resulting from the selection pressures exerted by competition among distinct <italic>var</italic> repertoires for hosts, mediated by cross-immunity, can emerge.</p></sec><sec id="s2" sec-type="results"><title>Results</title><p>We model the dynamics of multiple parasite genomes that simultaneously circulate in a large host population, continuously tracking the formation of new genomes through recombination, mutation and immigration events (<xref ref-type="bibr" rid="bib42">Paul et al., 1995</xref>; <xref ref-type="bibr" rid="bib6">Bruce et al., 2000a</xref>, <xref ref-type="bibr" rid="bib7">2000b</xref>). Reliable numerical results require the simulation of explicit transmission events, as well as complete knowledge of the exposure history of each individual host with respect to past and present infections by different parasite genomes. Thus, an agent-based model is formulated that follows each host from birth to death, while recording their exposure history and the specific immunity each gradually gains as a result of infections (for a detailed description of the model see the ‘Materials and methods’ section).</p><p>The simulated host population is continuously exposed to an immense diversity of distinct <italic>var</italic> repertoires, since new combinations of <italic>var</italic> genes are continuously generated through meiotic recombination events. As a conservative example, consider the number of potential configurations arising from the combinatorial possibilities of 6 loci with 50 <italic>var</italic> genes in the pool: more than 3 × 10<sup>7</sup> repertoires! Despite this large potential diversity, simulation results show that only a few dominant <italic>var</italic> repertoires circulate and persist at any given time, effectively keeping <italic>var</italic> repertoire diversity orders of magnitude lower than is potentially possible given the number of <italic>var</italic> genes present in the host population (<xref ref-type="fig" rid="fig1">Figure 1</xref>). We find that epidemiological dynamics significantly limit the diversity of coexisting dominant genomes under a broad spectrum of transmission intensities. This pattern persists in the long-term, far out-living the influence of initial conditions, and persisting through occasional changes in the identity of the dominant <italic>var</italic> repertoires (<xref ref-type="fig" rid="fig1">Figure 1</xref>). Thus, on epidemiological (and longer) time scales, most of the parasite population is structured into a limited number of distinct <italic>var</italic> repertoires.<fig id="fig1" position="float"><object-id pub-id-type="doi">10.7554/eLife.00093.003</object-id><label>Figure 1.</label><caption><p>Characteristic time series demonstrating the emergence and maintenance of population structure under three levels of recombination probabilities, 0.001 (a), 0.01 (b) and 0.1 (c), while keeping all other parameters equal. Top: stacked histograms of the number of genome transmission events per year of the different circulating repertoires, each represented by a different color. All <italic>var</italic> repertoires sampled less than 50 times are pooled and plotted in grey. Bottom: The corresponding number of transmission events of each <italic>var</italic> gene per year (each gene plotted in a different color). As recombination increases, population turnover is more rapid, still showing well-defined population structure. Although dominant genome identities may change in time, the level of transmission per gene is relatively constant and hardly influenced by turnovers on the strain population level. The relative fraction of short-lived genomes increases with recombination (grey area), and although the total number of transmission events per year is not influenced by recombination rate, cases of transmission of de-novo genomes is higher for higher levels of recombination. Parameters: <italic>b</italic> = 18, <italic>G</italic> = 30, <italic>g</italic> = 6, <italic>α</italic> = 15, <italic>H</italic> = 10,000, <italic>ω</italic> = 0.0005, <italic>τ</italic> = 1.</p><p><bold>DOI:</bold> <ext-link ext-link-type="doi" xlink:href="10.7554/eLife.00093.003">http://dx.doi.org/10.7554/eLife.00093.003</ext-link></p></caption><graphic xlink:href="elife00093f001"/></fig></p><p>We find that the parasite population structure exhibits punctuated turnover: brief episodes of restructuring result in a new set of dominant <italic>var</italic> repertoires. Despite the changing identities of the dominant <italic>var</italic> repertoires, the overall diversity of repertoires present and the individual gene frequencies remain remarkably constant (<xref ref-type="fig" rid="fig1">Figure 1</xref>, lower panels). These transient phenomena punctuate periods of stasis with stable population structure. In essence, although there are an effectively infinite number of niches in host immunity space, <italic>var</italic> repertoires appear to exploit this space by partitioning it into a number of discrete and partially overlapping niches. In addition, these repertoires appear to quickly adapt and achieve some optimum after perturbations arising from the stochastic nature of the underlying demographic and transmission processes. The episodes of restructuring become more frequent as recombination rates increase, but the diversity of dominant <italic>var</italic> repertoires remains low throughout these semi-stable states. Indeed, the maintenance of structure is found to be robust even under very high levels of recombination (<xref ref-type="fig" rid="fig1">Figure 1</xref>). The emergence of pathogen population structure is robust to alternative formulations of our multi-locus model that do not consider sequential expression, or formulations that consider randomly ordered sequential expression. In addition, episodes of restructuring can also be observed when expression is not sequential.</p><p>The level of diversity remains orders of magnitude lower than that potentially allowed by the <italic>var</italic> gene pool itself. However, as transmission intensity increases, the overlap between distinct dominant <italic>var</italic> repertoires also increases, with completely discordant genomes only appearing at the lower end of the spectrum (see <xref ref-type="fig" rid="fig2">Figure 2</xref>). To capture the characteristic features of different population compositions we defined four metrics: <italic>N*</italic>, measuring the average number of successful transmission events per year, <italic>V*</italic>, measuring the average number of de-novo genomes transmitted per year, <italic>R*</italic>, measuring the diversity of <italic>var</italic> repertoires, and <italic>F*</italic>, measuring the degree of <italic>var</italic> overlap between distinct repertoires (see ‘Materials and methods’). We find that as transmission intensity (biting rate) increases, all four measures increase as well, and that epidemiological dynamics clearly constrain <italic>var</italic> repertoire diversity and structure parasite populations, with the degree of overlap determined by epidemiological parameters (<xref ref-type="fig" rid="fig3">Figure 3A–D</xref>). Our findings are robust to different host population sizes (from 1,000 to 100,000 individuals), different gene pools sizes (from 10 to 500), and different repertoire lengths (from 2 to 30) (<xref ref-type="fig" rid="fig3">Figure 3</xref>).<fig id="fig2" position="float"><object-id pub-id-type="doi">10.7554/eLife.00093.004</object-id><label>Figure 2.</label><caption><p>Different degrees of distinct <italic>var</italic> repertoire overlap with transmission intensity. The number of genome transmission events per year for the different circulating repertoires are represented by different colors as stacked histograms similar to those of <xref ref-type="fig" rid="fig1">Figure 1</xref>. Emerging populations are typically characterized for low transmission intensities (<bold>A</bold>), by a low number of dominating genomes with a low level of antigenic overlap (<italic>R</italic>* = 9.2, <italic>F</italic>* = 1.2, see ‘Materials and methods’); and for high transmission intensities (<bold>B</bold>), by higher diversity and higher antigenic similarity (<italic>R</italic>* = 17.5, <italic>F</italic>* = 2.1). The fraction of long-lived genomes dominating transmission events is labeled by A in both figures, and the fraction of short-lived genomes, by B (these are grouped into one single number and plotted in gray). Parameters: <italic>b</italic> = 8.5 and <italic>b</italic> = 9.5, <italic>G</italic> = 50, <italic>g</italic> = 6, <italic>α</italic> = 15, <italic>H</italic> = 20,000, <italic>ω</italic> = 0.0005, ρ=0.01, <italic>τ</italic> = 1, <italic>κ</italic> = 1 year.</p><p><bold>DOI:</bold> <ext-link ext-link-type="doi" xlink:href="10.7554/eLife.00093.004">http://dx.doi.org/10.7554/eLife.00093.004</ext-link></p></caption><graphic xlink:href="elife00093f002"/></fig><fig id="fig3" position="float"><object-id pub-id-type="doi">10.7554/eLife.00093.005</object-id><label>Figure 3.</label><caption><p>Top four panels: the metrics characterizing population structure for three host population sizes as a function of transmission intensity (see ‘Materials and methods’). Green, blue and purple represent <italic>H</italic> = 5,000, <italic>H</italic> = 10,000, and <italic>H</italic> = 25,000, respectively. (<bold>A</bold>) A measure of diversity capturing the number of dominating genomes (<italic>R</italic>*, in the y-axis) as a function of <italic>b</italic>, (<bold>B</bold>), a measure of average antigenic similarity between genomes (<italic>F</italic>*, in the y-axis) as a function of <italic>b</italic>, (<bold>C</bold>) the average number of novel repertoires generated and successfully transmitted each year, and (<bold>D</bold>) the total number of successful transmission events each year. As transmission intensity increases, the number of dominating genomes increases, and in accordance, the degree of antigenic similarity increases as well—however the number of distinct repertoires that are maintained in the system at epidemiologically relevant frequencies remains extremely low relative to the total number of distinct repertoires that can be crated through recombination. Note the differences in magnitude; while the number of de novo repertoires entering the system is 10-fold higher then the observed diversity, the number of successful transmission events that these dominating repertoires are involved in is on the order of 10<sup>6</sup>. For extremely low biting rates, in a narrow window of parameter values, diversity decreases abruptly (<bold>A</bold>). This reflects a different dynamic regime in which dominant strains replace each other in a fluctuating manner and population structure does not apply. Parameters: <italic>G</italic> = 50, <italic>g</italic> = 6, <italic>α</italic> = 15, <italic>ω</italic> = 0.0005, ρ=0.05, <italic>τ</italic> = 1, <italic>κ</italic> = 1 year. Bottom four panels: characteristic time series demonstrating structured parasite populations for larger gene pools (<italic>G</italic>) and longer sequence lengths (<italic>g</italic>): (<bold>A</bold>) <italic>b</italic> = 18, <italic>G</italic> = 100, <italic>g</italic> = 6, <italic>α</italic> = 15, <italic>N</italic> = 20,000, <italic>ω</italic> = 0.0005, ρ=0.001, <italic>τ</italic> = 1. (<bold>B</bold>) <italic>b</italic> = 18, <italic>G</italic> = 200, <italic>g</italic> = 6, <italic>α</italic> = 15, <italic>H</italic> = 20,000, <italic>ω</italic> = 0.0005, ρ=0.001, <italic>τ</italic> = 1. (<bold>C</bold>) <italic>b</italic> = 18, <italic>G</italic> = 300, <italic>g</italic> = 20, <italic>α</italic> = 15, <italic>H</italic> = 20,000, <italic>ω</italic> = 0.0005, ρ=0.001, <italic>τ</italic> = 1. (<bold>D</bold>) <italic>b</italic> = 12, <italic>G</italic> = 120, <italic>g</italic> = 6, <italic>α</italic> = 15, <italic>H</italic> = 10,000, <italic>ω</italic> = 0.0005, ρ=0.005, <italic>τ</italic> = 1, <italic>κ</italic> = 1 year.</p><p><bold>DOI:</bold> <ext-link ext-link-type="doi" xlink:href="10.7554/eLife.00093.005">http://dx.doi.org/10.7554/eLife.00093.005</ext-link></p></caption><graphic xlink:href="elife00093f003"/></fig></p><p>The model suggests that areas that experience different transmission intensities will exhibit ‘characteristic’ epidemiological signatures (<xref ref-type="fig" rid="fig4">Figure 4</xref>). Importantly, the gain of immunity is found to depend on the degree of repertoire overlap (i.e., the number of shared <italic>var</italic> alleles) among the different dominant genomes and not just on total prevalence (<xref ref-type="fig" rid="fig5">Figure 5</xref>). This is an important difference with compartmental transmission models that consider superinfection but have no explicit treatment of <italic>var</italic> genes and repertoire diversity.<fig id="fig4" position="float"><object-id pub-id-type="doi">10.7554/eLife.00093.006</object-id><label>Figure 4.</label><caption><p>Age profiles of immunity and infection: (<bold>A</bold>) In color are the number of hosts immune to a single arbitrary antigen in different age classes superimposed over a histogram representing the entire age distribution of hosts (in gray). The level of immunity in each class is shown for four different transmission intensities (<italic>b</italic> = 2, 4, 8 and 30, where <italic>b</italic> is the average number of biting events per host per year). (<bold>B</bold>) The average level of immunity to the general antigenic pool as a function of age. It can be seen in (<bold>A</bold>) and (<bold>B</bold>), that at higher levels of transmission intensity, exposure to the diversity of antigenic types typically shifts towards the younger age classes, and hosts gain high levels of immunity to a majority of the variants earlier on in life. (<bold>C</bold>) A measure of parasite rate demonstrated by the fraction of infected hosts in different age groups (see also <xref ref-type="bibr" rid="bib31">Gupta and Day, 1994b</xref>) for 2 transmission intensities (<italic>b</italic> = 2 and 8). (<bold>D</bold>) A measure of superinfection demonstrated by the average number of antigens an infected host is naïve in each age class. Under high-transmission regimes, we characteristically observe high levels of superinfection (i.e., relatively long durations of infection) and high parasite rates in the very young age classes, after which immunity is rapidly gained to most of the antigenic variants circulating in the population. In contrast, host populations in regimes of very low transmission, characteristically exhibit similar levels of parasite rates in all age groups, and immunity is gradually gained throughout life, with infection spanning all age classes. Parameters: <italic>G</italic> = 40, <italic>g</italic> = 6, <italic>α</italic> = 15, <italic>H</italic> = 20,000, <italic>ω</italic> = 0.0005, ρ=0.01, <italic>τ</italic> = 1, <italic>κ</italic> = 1 year. Transmission events were sampled at a frequency of 1:100, and the host population was sampled every 10 years at a ratio of 1:100.</p><p><bold>DOI:</bold> <ext-link ext-link-type="doi" xlink:href="10.7554/eLife.00093.006">http://dx.doi.org/10.7554/eLife.00093.006</ext-link></p></caption><graphic xlink:href="elife00093f004"/></fig><fig id="fig5" position="float"><object-id pub-id-type="doi">10.7554/eLife.00093.007</object-id><label>Figure 5.</label><caption><p>Strain specific immunity and transcending immunity. (<bold>A</bold>) Diagram demonstrating the partition of 40 genes from the general pool (represented by circles) between 8 dominating strains (each marked with a unique color, and composed of a subset of 6 genes). Five of these strains are antigenically unique as they have no overlap with any of the other strains, two of these strains share all of their genes with other strains (red and light blue), and one of the strains has a partially unique antigenic profile sharing 66% of its genes with other strains (purple). (<bold>B</bold>) The number of hosts immune to strains 1 and 2 (orange and red, respectively) for each age class superimposed over the host age distribution (grey). Immunity to strain 1 is strain specific and only gained through exposure to this particular strain due to the uniqueness of its antigenic profile. By contrast, immunity to strain 2 is strain ‘transcending’ and acquired also by exposure to other strains with which it shares genes. It follows that hosts are exposed to strain 1 at a higher level and at younger ages, than those for strain 2. Parameters: <italic>b</italic> = 3, <italic>G</italic> = 40, <italic>g</italic> = 6, <italic>α</italic> = 15, <italic>H</italic> = 20,000, <italic>ω</italic> = 0.0005, ρ=0.01, <italic>τ</italic> = 1, <italic>κ</italic> = 1 year.</p><p><bold>DOI:</bold> <ext-link ext-link-type="doi" xlink:href="10.7554/eLife.00093.007">http://dx.doi.org/10.7554/eLife.00093.007</ext-link></p></caption><graphic xlink:href="elife00093f005"/></fig></p><p>Two recent large-scale studies aimed at assessing the extent of local reservoirs of <italic>var</italic> genes in five epidemiologically and geographically distinct <italic>P. falciparum</italic> populations (<xref ref-type="bibr" rid="bib2">Barry et al., 2007</xref>; <xref ref-type="bibr" rid="bib16">Chen et al., 2011</xref>) provide us with new knowledge on the distribution of <italic>var</italic> genes in parasite genomes. These new data clearly show that the frequency distribution of distinct <italic>var</italic> genes, or sequence ‘types’ (defined by the level of sequence identity within the DBLα domain) is significantly different from what we would expect if sequence types were equal in frequency and uncorrelated (<xref ref-type="fig" rid="fig6">Figure 6</xref>). In addition, the data show significant nonrandom associations among many <italic>var</italic> DBLα types within the sampled isolates (<xref ref-type="fig" rid="fig6">Figure 6</xref>).<fig id="fig6" position="float"><object-id pub-id-type="doi">10.7554/eLife.00093.008</object-id><label>Figure 6.</label><caption><p>Nonrandom organization of <italic>var</italic> DBLα types between 30 sampled parasite isolates from Amele, Papua New Guinea as published in (<xref ref-type="bibr" rid="bib16">Chen et al., 2011</xref>). (<bold>A</bold>) Presence–absence matrix showing the distribution of <italic>var</italic> types in isolates: Each row corresponds to an individual parasite isolate and each column to a distinct <italic>var</italic> type. The color bar indicates the number of distinct isolates each <italic>var</italic> type was identified in. (<bold>B</bold>) The frequency distribution of the number of isolates in which each <italic>var</italic> type was identified, obtained by assuming a total <italic>var</italic> richness of ∼369, as estimated in (<xref ref-type="bibr" rid="bib16">Chen et al., 2011</xref>). The observed distribution for the data (red) and the expected distribution when assuming all <italic>var</italic> types circulate at equal frequencies (blue) were found to be significantly different (p<sub>v</sub><0.0001 using a K–S two sample test). Note the enrichment for both very rare and very common <italic>var</italic> types in the data. (<bold>C</bold>) Observed and expected co-occurrence of <italic>var</italic> DBLα types. In each matrix cell (<italic>i</italic>,<italic>j</italic>) is the number of times <italic>var</italic> types <italic>i</italic> and <italic>j</italic> were found in the same isolate. The co-occurrence of <italic>var</italic> types found in multiple isolates is significantly higher than for the null expectation under the assumption of linkage equilibrium among all <italic>var</italic> types (p<sub>v</sub><0.01) (<xref ref-type="bibr" rid="bib1">Artzy-Randrup and Stone, 2005</xref>) (the expected co-occurrence matrix conserves both the observed number of <italic>var</italic> types in each isolate and the observed frequency distribution of different <italic>var</italic> types (<xref ref-type="bibr" rid="bib16">Chen et al., 2011</xref>)). (<bold>D</bold>) A network of allele pairs with both high <italic>D</italic> and <italic>r</italic>. The <italic>D</italic> values are among the highest pair-wise comparisons in the dataset (using a cutoff of <italic>D</italic> > 0.0748), and the <italic>r</italic> values range from 1 to 0.58, and are reflected by the weight of the edges. Based on sequence features (<xref ref-type="bibr" rid="bib12">Bull et al., 2007</xref>), and the fact that genomic organization of <italic>var</italic> sequence groups appear to be conserved across globally distributed isolates (<xref ref-type="bibr" rid="bib37">Kyes et al., 2007</xref>), it is very unlikely that <italic>var</italic> type 22 (being UpsA-like) is physically linked to the other alleles in the network (since they are all UpsB/UpsC-like). (<bold>E</bold>) The relatedness of the <italic>var</italic> DBLα repertoires of an isolate pair as a function of the relatedness of their microsatellite repertoires. Relatedness is defined as the number of <italic>var</italic> types shared between the two isolates, divided by the average number of <italic>var</italic> types identified per isolate for that pair of isolates.</p><p><bold>DOI:</bold> <ext-link ext-link-type="doi" xlink:href="10.7554/eLife.00093.008">http://dx.doi.org/10.7554/eLife.00093.008</ext-link></p></caption><graphic xlink:href="elife00093f006"/></fig></p><p>These patterns in observed <italic>var</italic> repertoires may alternatively result from neutral demographic processes: that is, individual mosquitoes bite discrete hosts, and thus, inevitably sample the host population unevenly. This limits ‘random mating’ and thus recombination between parasite genomes. Hence, even under neutral forces, it is possible for parasites to differ in their relatedness to one another. Under this alternative assumption we expect these neutral demographic processes to shape the diversity at all loci to the same extent (after controlling for differences in physical linkage and recombination rate between loci). Evidence of more extensive ‘strain structure’ at antigenic, immune-selected sites compared to neutral sites suffices as proof that selective forces are at work, and of these, immune selection is the most parsimonious explanation.</p><p>We compare patterns of variation at immune-selected sites to neutral sites in a variety of ways (see ‘Materials and methods’), and we propose this as an effective empirical test of strain theory. Our test is conceptually similar to empirical analyses of strain theory undertaken in the past (<xref ref-type="bibr" rid="bib9">Buckee et al., 2010</xref>), but in this system, there is the opportunity for a more powerful test since the multi-copy nature of <italic>var</italic> genes allows us to examine patterns of variation at many independent (i.e., physically unlinked) genetic sites. Currently, the dataset with the most extensive sampling of diversity at both <italic>var</italic> and microsatellite loci within a local population consists of a set of 30 single infection isolates from a local population in Papua New Guinea for which we have sequences for a portion of the <italic>var</italic> DBLα domain and the alleles for 12 microsatellite loci (<xref ref-type="bibr" rid="bib2">Barry et al., 2007</xref>; <xref ref-type="bibr" rid="bib16">Chen et al., 2011</xref>).</p><p>Because we expect alleles at the same locus to anti-correlate, and because it is unknown which DBLα alleles share a common locus, we only analyze positive correlations. We measure the positive linkage disequilibrium coefficients (<italic>D</italic>) for the presence/absence states for all unique pairs of microsatellite or <italic>var</italic> DBLα alleles. High <italic>D</italic> values indicate a correlation between alleles within isolates, and they are maximized at intermediate allele frequency (see and ‘Materials and methods’). For the <italic>var</italic> DBLα dataset there are 1288 distinct pairs of alleles with positive <italic>D</italic> values that exceed a two-tailed significance threshold of 0.05 (<xref ref-type="bibr" rid="bib34">Hedrick et al., 1978</xref>). Given the number of tests performed, under the null hypothesis of no significant correlations between alleles, we would expect only 310 pairs to exceed this threshold. For the microsatellite dataset there are 146 distinct pairs of alleles with positive <italic>D</italic> values that exceed the significance threshold and under the null hypothesis we would expect only 49. Therefore, both datasets show an enrichment of positive correlations among allele pairs, and thus, significant linkage disequilibrium. The <italic>D</italic> values of the <italic>var</italic> DBLα dataset are higher than those of the microsatellite dataset (p<sub>v</sub><<0.0001 by Mann–Whitney test), and we argue that this cannot easily be explained by allele frequency differences or differences in the extent of physical linkage among sites (see ‘Materials and methods’).</p><p>Another important observation is that, at least at this level of resolution, <italic>var</italic> DBLα repertoire relatedness is not a function of microsatellite repertoire relatedness. <xref ref-type="fig" rid="fig6">Figure 6E</xref> shows the relatedness of the <italic>var</italic> DBLα repertoires of an isolate pair as a function of the relatedness of their microsatellite repertoires. The absence of any correlation suggests the possibility that <italic>var</italic> DBLα variation is shaped by other forces than the neutral demographic forces shaping microsatellite variation.</p><p>We also consider only the most informative <italic>var</italic> types in isolation by identifying highly correlated sets of <italic>var</italic> types. We then tested the relatedness of microsatellite alleles among the isolates containing these networks of correlated <italic>var</italic> types. The networks of correlated <italic>var</italic> types were constructed from pairs of <italic>var</italic> types exhibiting both high linkage disequilibrium and correlation coefficients (i.e., <italic>D</italic> and <italic>r</italic>). <xref ref-type="fig" rid="fig6">Figure 6D</xref> represents one of the largest of such fully connected networks (with <italic>D</italic> > 0.0748 used as the cutoff), however this complete network is only observed in two isolates in the dataset. The microsatellite repertoires of these two isolates are less related than average for the whole dataset, so at least in this case, high microsatellite relatedness does not explain the existence of these highly correlated <italic>var</italic> types. Additionally, smaller subsets of correlated <italic>var</italic> types are often found in isolates with very dissimilar microsatellite alleles. These results suggest that the existence of highly correlated <italic>var</italic> types is not always explained by high levels of underlying genome relatedness. Moreover, when we use the same cutoff <italic>D</italic> value to look for fully connected networks of correlated microsatellite alleles, the largest of such networks comprises only four alleles as opposed to six (six pairwise connections as compared to 15).</p><p>Although the sample size of this dataset is too small to identify anything but very strong correlations between intermediate frequency <italic>var</italic> types (<xref ref-type="bibr" rid="bib3">Brown, 1975</xref>), these analyses support a possible role for immune selective forces in structuring the variation at an important class of antigen-encoding loci in <italic>P. falciparum</italic>. More extensive datasets will be needed for definitive conclusions, but these are now within reach as next generation sequencing methods make it feasible to consider sampling whole communities of parasite genomes to assess <italic>var</italic> population structure.</p></sec><sec id="s3" sec-type="discussion"><title>Discussion</title><p>In accordance with predictions from the original ‘strain theory’, our model constrains total repertoire diversity to levels that are orders of magnitude lower than is potentially possible given the diversity of the gene pool. This reduction in diversity occurs because coexisting parasites are structured into a few variants with largely discordant repertoires. In a departure from previous strain theory, our model predicts that the different dominant repertoires can exhibit partial overlap; the extent of the overlap increases with transmission intensity and this, in turn, influences observed epidemiological patterns (particularly age-serology profiles).</p><p>The specific immune profile of each individual host effectively structures the population into distinct sets of ‘patches’ or ‘resources’ that define an immune environment, ultimately causing immune selection to act on the parasite population. These distinct sets of patches are formed and conserved even when immunity to the <italic>var</italic> alleles is shorter-lived. Observations of individuals becoming susceptible to severe infection at later stages of their life (see for example (<xref ref-type="bibr" rid="bib21">Dhingra et al., 2010</xref>)), may be in part a consequence of short-lived immunity. Under this assumption, hosts in our model regain protection by exposure to one of the dominant strains circulating in the host population at high frequencies, and do so at a sufficiently high rate to preserve strain population structure except at extremely low transmission intensity. In the event that a host is infected by one of the low frequency genomes that are continuously being introduced (and equally quickly vanishing), it is highly unlikely that this successful transmission event is sufficient for invasion or even replacement of the currently dominating strain community.</p><p>Discordant repertoires that exhibit partial immunological/antigenic overlap blur the distinction between the acquisition of strictly strain-specific immunity and the acquisition of strictly strain-transcending immunity (<xref ref-type="bibr" rid="bib30">Gupta and Day, 1994a</xref>, <xref ref-type="bibr" rid="bib31">1994b</xref>) (see caption of <xref ref-type="fig" rid="fig5">Figure 5</xref>). This underscores the role of strain diversity structure, rather than diversity per se, in determining observed epidemiological patterns and their response to intervention. By reducing antigenic overlap between strains, vector control efforts will result in infection at an older age and a more gradual acquisition of protection to infection, even in the absence of changes in <italic>var</italic> gene diversity. The model in its current form does not differentiate infection from clinical disease, thus we cannot explicitly address the impact of control on the severity of symptoms. However, if the number of <italic>var</italic> genes that a host has previously encountered relates to the degree of protection against clinical disease, we would expect more severe symptoms to occur at younger ages under high transmission settings, and in contrast, more homogeneous malaria incidents are likely to occur over a broader range of age-classes when transmission is lowered (<xref ref-type="fig" rid="fig4">Figure 4D</xref>). Investigation of these patterns awaits the formulation of models that include functional, non-antigenic, differences between strains, as well as more empirical understanding of the role played by <italic>var</italic> genes associated with more severe disease. Future work should thus extend our model to consider functional, non-antigen-encoding differences between <italic>var</italic> genes (<xref ref-type="bibr" rid="bib13">Bull et al., 1999</xref>; <xref ref-type="bibr" rid="bib39">Miller et al., 2002</xref>; <xref ref-type="bibr" rid="bib45">Scherf et al., 2008</xref>; <xref ref-type="bibr" rid="bib8">Buckee et al., 2009</xref>; <xref ref-type="bibr" rid="bib17">Claessens et al., 2012</xref>; <xref ref-type="bibr" rid="bib47">Severins et al., 2012</xref> for an example of a recent model applied to questions on the evolution of virulence). Ultimately, ways to represent the effects of pathogen diversity implicitly within a standard epidemiological framework, that might also be more easily parameterized, should also be investigated.</p><p>The goal of malaria eradication is to reduce the reservoir of malaria infection in humans to zero. <xref ref-type="bibr" rid="bib16">Chen et al. (2011)</xref> have pointed to the importance of <italic>var</italic> genes in malaria surveillance, due to their influence on both the duration of infection and the degree of superinfection, and they demonstrated the existence of an immense diversity of <italic>var</italic> genes and limited <italic>var</italic> repertoire overlap in Africa, even in sites with low malaria prevalence. Consequently, they have proposed that <italic>var</italic> typing be used to complement prevalence measures for molecular surveillance of malaria control and elimination efforts. Our models support this proposal as they show that decreasing transmission provokes nonlinear changes in the dominant <italic>var</italic> configurations. Importantly, our results demonstrate that there is not a simple relationship between <italic>var</italic> diversity and repertoire diversity. Indeed, the ‘<italic>var</italic> strain’ model suggests that vector control strategies that reduce transmission will not always drastically reduce <italic>var</italic> gene diversity, because a reservoir of parasite genomes with diverse (highly non-overlapping) <italic>var</italic> repertoires will remain. This insight from the model provides a plausible explanation for why it is so difficult to eliminate malaria: non-overlapping <italic>var</italic> diversity will create significant inherent difficulties in reducing the potential of the malaria parasite to reinfect the same hosts. It also suggests that <italic>var</italic> surveillance might provide a good molecular means of evaluating control. If the end game is to be achieved in malaria control, then the mechanisms creating and maintaining antigenic diversity warrant further investigation in both modeling and empirical studies.</p><p>In conclusion, the results of our model on the dynamics of population structure in <italic>P. falciparum</italic> as defined by the <italic>var</italic> multi-gene family, have broad implications for the possible emergence of similar structure in many important human and animal pathogens that have major surface antigens encoded by multigene families, including bacterial, protozoan and fungal pathogens (<xref ref-type="bibr" rid="bib20">Deitsch et al., 2009</xref>).</p></sec><sec id="s4" sec-type="materials|methods"><title>Materials and methods</title><sec id="s4-1"><title>Epidemiological model</title><p>Each parasite is composed of a set of exactly <italic>g var</italic> genes, and the genomes are distinguishable from each other by their unique <italic>var</italic> combination. The overall diversity of <italic>var</italic> genes circulating in the host population is assumed to originate from a general predefined pool of <italic>G</italic> variants (<xref ref-type="bibr" rid="bib2">Barry et al., 2007</xref>; <xref ref-type="bibr" rid="bib16">Chen et al., 2011</xref>; <xref ref-type="bibr" rid="bib43">Recker et al., 2011</xref>). Hence, the total number of distinct <italic>var</italic> repertoires is <italic>G</italic>!/(G-<italic>g</italic>)!. In the beginning of a simulation we generate five random repertoires by sampling variants from this pool, and we infect 10 random hosts with each of these repertoires. The size of the overall host population is <italic>H</italic>. Throughout the simulation, variants from this pool are sampled, either by the mutation of one <italic>var</italic> gene to another, at probability <italic>ψ</italic>, or through an immigration event, where at rate <italic>ζ</italic> a random host in the population is infected by a <italic>var</italic> repertoire randomly sampled from this pool. While mitotic recombination within <italic>var</italic> genes may play an important role in generating additional <italic>var</italic> diversity, we do not explicitly include this process here, because for the purposes of this model, and given the high levels of diversity already present in the pool, it would play a role essentially equivalent to mutation or immigration. All our results are robust to variation in these two parameters.</p><p>During the course of an infection, a parasite expresses all of its <italic>var</italic> genes, and these are responsible for encoding PfEMP1 variant surface antigens (VSAs) (<xref ref-type="bibr" rid="bib33">Gupta et al., 1994</xref>; <xref ref-type="bibr" rid="bib39">Miller et al., 2002</xref>; <xref ref-type="bibr" rid="bib45">Scherf et al., 2008</xref>; <xref ref-type="bibr" rid="bib51">Tibayrenc and Ayala, 2002</xref>). After the host is exposed to each of these VSAs, it gains life-long immunity that is specific to each of the antigens (<xref ref-type="bibr" rid="bib14">Bull et al., 1998</xref>; <xref ref-type="bibr" rid="bib43">Recker et al., 2011</xref>). We assume that the total duration of infection in a susceptible host lasts a fixed time (<italic>κ</italic><sub>yrs.</sub>), and that in partially immune hosts, the actual duration decreases proportionally to the number of <italic>var</italic> genes that have been expressed in earlier infections (<xref ref-type="bibr" rid="bib6">Bruce et al., 2000a</xref>, <xref ref-type="bibr" rid="bib7">2000b</xref>; <xref ref-type="bibr" rid="bib27">Giha et al., 2000</xref>). It is recognized that the gain of immunity during the course of an infection is gradual (<xref ref-type="bibr" rid="bib23">Ewers, 1972</xref>; <xref ref-type="bibr" rid="bib40">Miller et al., 1994</xref>), and we capture this feature by considering that the <italic>var</italic> genes composing an infecting parasite are mutually and exclusively expressed in a fixed sequential order. Hence, at each stage of an infection, the host has already acquired specific immunity to all the VSA's encoded by <italic>var</italic> genes expressed up to that point in time. As a result, immunity to each infecting parasite is gained gradually. The infection history of each host is tracked in time and determines its immune status (<xref ref-type="bibr" rid="bib13">Bull et al., 1999</xref>; <xref ref-type="bibr" rid="bib6">Bruce et al., 2000a</xref>, <xref ref-type="bibr" rid="bib7">2000b</xref>; <xref ref-type="bibr" rid="bib27">Giha et al., 2000</xref>; <xref ref-type="bibr" rid="bib8">Buckee et al., 2009</xref>; <xref ref-type="bibr" rid="bib22">Doolan et al., 2009</xref>). This effectively structures the population of hosts into distinct sets of individual ‘patches’ or ‘resources’ that define an immune environment, which ultimately causes immune selection to act on the parasite population.</p><p>The specific rules of infection constitute a static within-host sub-model and an implicit representation of within-host dynamics, which allowed us to implement the population transmission model without explicitly representing the mechanisms that give rise to the sequential expression of different VSAs within the host. As addressed in the main text, these mechanisms remain poorly understood, although multiple within-host models for sequential waves of parasitaemia have been developed (<xref ref-type="bibr" rid="bib24">Frank, 1999</xref>; <xref ref-type="bibr" rid="bib44">Recker et al., 2004</xref>; <xref ref-type="bibr" rid="bib25">Frank and Barbour, 2006</xref>).</p><p>An infected host can harbor multiple simultaneously co-infecting parasite genomes, and each has the potential of being transmitted to another host through a mosquito biting event. When such an event takes place, each of the infecting parasites has a probability, <italic>τ</italic>, of successfully being transmitted from the infected host to the mosquito, making it possible for several different genomes to be transmitted in a single biting event (see <xref ref-type="fig" rid="fig7">Figure 7A</xref>). However, in our model we assume that the actual transmission probability of each of the genomes, is divided by the total number of co-infecting genomes at the time of the biting event. Therefore, in effect, there is a cost to co-infection that is consistent with empirical evidence for a density-dependent regulating mechanism on parasite abundance within the host (<xref ref-type="bibr" rid="bib6">Bruce et al., 2000a</xref>, <xref ref-type="bibr" rid="bib7">2000b</xref>; <xref ref-type="bibr" rid="bib4">Bruce and Day, 2002</xref>, <xref ref-type="bibr" rid="bib5">2003</xref>) (see <xref ref-type="fig" rid="fig7">Figure 7B</xref>). To demonstrate the robustness of our results under different assumptions of the within-host representation, we also considered four alternative rules governing the dynamics of co-infection. For these different rules we find similar results to those presented here. The alternative rules for within host dynamics of multiple infections are: (1) <italic>Co-infection, no cost</italic>: during the course of co-infection, there is no cost on the transmission probability of each of the infecting genomes, and hence the transmissibility of each remains, <italic>τ</italic>, identical to what it would be, had there been no other infecting genomes. (2) <italic>Co-infection, full cost</italic>: during the course of co-infection, the transmissibility of the earliest infecting genome is not compromised by the later infections and stands at <italic>τ</italic>, all later infections are not transmissible. When the earliest infection is cleared it is the next one that becomes fully transmissible. (3) <italic>Mutually exclusive infections</italic>: here, co-infections are not permitted; while a host is infected with one infection, it is not susceptible to any other. (4) <italic>Delayed super-infection</italic>: a host can harbor multiple parasite genomes, but only one actively infects the host, with transmissibility <italic>τ</italic>, while the rest remain latent until the active parasite genome is cleared. After that, one of the latent parasite genomes begins its active state until it is cleared, and so on.<fig id="fig7" position="float"><object-id pub-id-type="doi">10.7554/eLife.00093.009</object-id><label>Figure 7.</label><caption><p>Diagrams showing processes that take place during the course of a simulation: (<bold>A</bold>) in a biting event, there is likeliness that multiple parasite genomes will be transmitted simultaneously. In these events, at probability ρ, the genomes recombine to create new parasite genome variants, which then infect the receiving host. (<bold>B</bold>) A sketch of the rules governing the dynamics of infection and co-infection. By sequentially expressing different <italic>var</italic> genes during the course of an infection, host immunity is gradually gained to the PfEMP1 variants (VSA's) associated with the infecting parasite genome. When the host is exposed to an additional genome, this parasite begins expressing its <italic>var</italic> genes sequentially, as it would, had it been infecting the host on its own. Transmissibility of each of the infecting parasites during such periods of co-infection decreases according to the multiplicity of infection at the time.</p><p><bold>DOI:</bold> <ext-link ext-link-type="doi" xlink:href="10.7554/eLife.00093.009">http://dx.doi.org/10.7554/eLife.00093.009</ext-link></p></caption><graphic xlink:href="elife00093f007"/></fig></p><p>Because the model is stochastic and formulated in continuous time, the implementation of the numerical simulations relies on the well-known Gillespie algorithm (<xref ref-type="bibr" rid="bib28">Gillespie, 1977</xref>) for three of the processes; biting (responsible for transmission), host death, and immigration of new parasite genomes, whose respective rates are <italic>b</italic>, <italic>α</italic>, and <italic>ζ</italic>. The algorithm considers that these processes are Poisson and determines, based on these rates, the timing of each of these events. We further consider that the population size is constant in time, such that in the case of a death, a new susceptible host is born, replacing the previous host that died. We assume that this new host has no history of exposure, nor any acquired immunity. At a ‘biting event’, a vector bites two randomly chosen hosts sequentially, if the first host is actively infected by one or several parasite genomes at that time, there is a probability for each of these to be transmitted to the second host. As noted earlier, this probability depends on transmission probability, <italic>τ</italic>, and on the number of co-infecting parasite genomes. A parasite genome that is transmitted from one host to another, has a probability <italic>ψ</italic> of mutating, such that one of its randomly chosen <italic>var</italic> genes is replaced by a randomly chosen variant from the pool. This new genome is then the one transmitted to the second host. When two or more parasite genomes are successfully transmitted from the first host to a mosquito, there is a given probability, ρ, that recombination occurs, resulting in a new <italic>var</italic> repertoire that is then transmitted from the mosquito to the second host. In this case, the novel combination is formed by randomly sampling a subset of <italic>var</italic> genes from each of the parent repertoires. Hence, when ρ>0, this effectively leads to a continuous reshuffling of <italic>var</italic> repertoires circulating in the host population. Given the extensive number of possible <italic>var</italic> combinations, these recombination events often introduce de novo parasite genomes not yet present in the infected host population. Epidemiologically, after the introduction of a de novo genome, this parasite may successfully be transmitted multiple times, possibly leading to an epidemic, and persisting in the host population for extended periods of time. Alternatively, however, it may be unsuccessful in its transmission, persisting only for a short duration of time before stochastically going extinct.</p><p>In our numerical experiments, we consider different levels of transmission intensity by specifically varying the biting rate. Thus, throughout the paper, variation in transmission intensity refers to variation in this parameter (and therefore, in the so-called entomological inoculation rate, or EIR).</p></sec><sec id="s4-2"><title>A measure of diversity</title><p><italic>R*</italic> is calculated using Simpson's Diversity index, <inline-formula><mml:math id="inf1"><mml:mrow><mml:mi mathvariant="italic">R</mml:mi><mml:mo>*</mml:mo><mml:mo>=</mml:mo><mml:mrow><mml:mn>1</mml:mn><mml:mo>/</mml:mo><mml:mrow><mml:mstyle displaystyle="true"><mml:munderover><mml:mo>∑</mml:mo><mml:mrow><mml:mi mathvariant="italic">i</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi mathvariant="italic">S</mml:mi></mml:munderover><mml:mrow><mml:msubsup><mml:mi mathvariant="italic">p</mml:mi><mml:mi mathvariant="italic">i</mml:mi><mml:mn>2</mml:mn></mml:msubsup></mml:mrow></mml:mstyle></mml:mrow></mml:mrow><mml:mo>,</mml:mo></mml:mrow></mml:math></inline-formula> where <italic>S</italic> is the number of unique genomes responsible for transmission events in a window of time, and <italic>p</italic><sub><italic>i</italic></sub> is their relative proportion. The benefit of using Simpson's index over alternative diversity indices is that it has low sensitivity to species at low abundance (in this case genomes), and gives most weight to the most abundant ones. This is appropriate in our case as we are aiming to identify the number of dominating unique genomes, and are not interested in the general richness (<italic>S</italic>), which in our case can be immense.</p></sec><sec id="s4-3"><title>A measure of antigenic overlap</title><p>The calculation of <italic>F*</italic> is also based on Simpson's Diversity index, with a focus on the distribution of genes between transmission events, such that: <inline-formula><mml:math id="inf2"><mml:mrow><mml:mi mathvariant="italic">F</mml:mi><mml:mo>*</mml:mo><mml:mo>=</mml:mo><mml:mrow><mml:mrow><mml:mstyle displaystyle="true"><mml:munderover><mml:mo>∑</mml:mo><mml:mrow><mml:mi mathvariant="italic">j</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi mathvariant="italic">G</mml:mi></mml:munderover><mml:mrow><mml:mrow><mml:mo>(</mml:mo><mml:mrow><mml:mrow><mml:mn>1</mml:mn><mml:mo>/</mml:mo><mml:mrow><mml:mstyle displaystyle="true"><mml:munderover><mml:mo>∑</mml:mo><mml:mrow><mml:mi mathvariant="italic">i</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi mathvariant="italic">S</mml:mi></mml:munderover><mml:mrow><mml:msubsup><mml:mi mathvariant="italic">p</mml:mi><mml:mi mathvariant="italic">i</mml:mi><mml:mn>2</mml:mn></mml:msubsup></mml:mrow></mml:mstyle></mml:mrow></mml:mrow></mml:mrow><mml:mo>)</mml:mo></mml:mrow></mml:mrow></mml:mstyle></mml:mrow><mml:mo>/</mml:mo><mml:mi mathvariant="italic">G</mml:mi></mml:mrow><mml:mo>.</mml:mo></mml:mrow></mml:math></inline-formula> As before, <italic>S</italic> is the number of unique genomes responsible for transmission events in a window of time, and for each gene <italic>i</italic> from the gene pool, <italic>p</italic><sub><italic>i</italic></sub> is its relative frequency in each of the transmitted genomes. Hence, a gene that is not shared between dominating genomes will be represented at high frequency at a single genome (and the diversity will be close to 1). In contrast, the frequency of a gene that is shared by two dominating genomes will be split between both those two (and the diversity will be close to 2). We then average the degree of overlap between all genes.</p></sec><sec id="s4-4"><title>Molecular marker of <italic>var</italic> diversity</title><p>Because DBLα is the only domain found in nearly all PfEMP1 variants (<xref ref-type="bibr" rid="bib39">Miller et al., 2002</xref>), the sequence encoding the central portion of this domain provides the most informative molecular marker of <italic>var</italic> gene diversity (<xref ref-type="bibr" rid="bib26">Freitas-Junior et al., 2000</xref>; <xref ref-type="bibr" rid="bib49">Taylor et al., 2000</xref>; <xref ref-type="bibr" rid="bib2">Barry et al., 2007</xref>; <xref ref-type="bibr" rid="bib16">Chen et al., 2011</xref>). Two DBLα tags are considered to represent two distinct <italic>var</italic> ‘types’ if their nucleotide sequence identity is less than 96%.</p></sec><sec id="s4-5"><title>Microsatellites as neutral markers</title><p>Microsatellites offer an ideal and practical means to construct a null hypothesis reflecting the demographic forces shaping diversity because these sites are predominantly neutral, and their diversity can be explained by a mechanism unrelated to immune selection (i.e., slippage). In contrast, single nucleotide polymorphisms or single feature polymorphisms, because they are predominantly found in multi-copy antigenic genes in <italic>P. falciparum</italic> (<xref ref-type="bibr" rid="bib36">Jiang et al., 2008</xref>), do not offer a good basis for a null hypothesis.</p></sec><sec id="s4-6"><title>Relatedness</title><p>Relatedness is defined as the number of <italic>var</italic> types shared between two isolates, divided by the average number of <italic>var</italic> types identified per isolate for that pair of isolates.</p></sec><sec id="s4-7"><title>Linkage disequilibrium coefficient <italic>D</italic></title><p><italic>D</italic> is maximized when allele frequencies are 0.5, so <italic>D</italic> also indicates the amount of information upon which the coefficient is based (e.g., if two alleles appear only once and in the same isolate, their <italic>D</italic> will be low despite the fact that they are in perfect correlation with one another). The higher <italic>D</italic> values for <italic>var</italic> DBLα alleles versus microsatellite alleles cannot be attributed to differences in allele frequencies since the <italic>var</italic> DBLα alleles have lower frequencies than the microsatellite alleles, and thus, <italic>D</italic> values biased to lower magnitudes. While the higher <italic>D</italic> values from the <italic>var</italic> DBLα dataset could be due to the influence of the close physical linkage of a small subset of pairs of <italic>var</italic> loci (<xref ref-type="bibr" rid="bib19">Deitsch and Hviid, 2004</xref>), it seems somewhat unlikely because the great majority of <italic>var</italic> loci are located very far from other <italic>var</italic> loci in the 3D7 genome (<xref ref-type="bibr" rid="bib19">Deitsch and Hviid, 2004</xref>), and <italic>var</italic> loci have been shown to coincide with recombination hotspots (<xref ref-type="bibr" rid="bib41">Mu et al., 2010</xref>; <xref ref-type="bibr" rid="bib35">Jiang et al., 2011</xref>) in a genome that is already characterized by remarkably high underlying rates of recombination (<xref ref-type="bibr" rid="bib18">Conway et al., 1999</xref>; <xref ref-type="bibr" rid="bib53">Volkman et al., 2006</xref>).</p></sec></sec></body><back><ack id="ack"><title>Acknowledgements</title><p>We thank Sunetra Gupta and Caroline Buckee for discussions on the subject, and Daniel Zinder for implementation of the simulation code. YAR and MMR are Howard Hughes Medical Institute postdoctoral Associates and MP is an Howard Hughes Medical Institute Investigator.</p></ack><sec sec-type="additional-information"><title>Additional information</title><fn-group content-type="competing-interest"><title>Competing interests</title><fn fn-type="conflict" id="conf1"><p>MP: Reviewing Editor, <italic>eLife</italic>.</p></fn><fn fn-type="conflict" id="conf2"><p>The remaining authors have declared that no competing interests exist.</p></fn></fn-group><fn-group content-type="author-contribution"><title>Author contributions</title><fn fn-type="con" id="con1"><p>YAR: Conception and design, Analysis and interpretation of data, Drafting or revising the article</p></fn><fn fn-type="con" id="con2"><p>MMR: Conception and design, Analysis and interpretation of data, Drafting or revising the article</p></fn><fn fn-type="con" id="con3"><p>KD: Generated and provided the expertise on the empirical data, Drafting or revising the article</p></fn><fn fn-type="con" id="con4"><p>DC: Generated and provided the expertise on the empirical data</p></fn><fn fn-type="con" id="con5"><p>APD: Conception and design, Drafting or revising the article</p></fn><fn fn-type="con" id="con6"><p>MP: Conception and design, Drafting or revising the article</p></fn></fn-group></sec><ref-list><title>References</title><ref id="bib1"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Artzy-Randrup</surname><given-names>Y</given-names></name><name><surname>Stone</surname><given-names>L</given-names></name></person-group><year>2005</year><article-title>Generating uniformaly distributed networks</article-title><source>Physical Review E</source><volume>72</volume></element-citation></ref><ref id="bib2"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Barry</surname><given-names>AE</given-names></name><name><surname>Leliwa-Syteck</surname><given-names>A</given-names></name><name><surname>Tavul</surname><given-names>L</given-names></name><name><surname>Imrie</surname><given-names>H</given-names></name><name><surname>Migot-Nabias</surname><given-names>F</given-names></name><name><surname>Brown</surname><given-names>SM</given-names></name><etal/></person-group><year>2007</year><article-title>Population genomics of the immune evasion (var) genes of Plasmodium falciparum</article-title><source>PLoS Pathog</source><volume>3</volume><fpage>e34</fpage></element-citation></ref><ref id="bib3"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Brown</surname><given-names>AHD</given-names></name></person-group><year>1975</year><article-title>Sample sizes required to detect linkage disequilibrium between two or three loci</article-title><source>Theor Popul Biol</source><volume>8</volume><fpage>184</fpage><lpage>201</lpage></element-citation></ref><ref id="bib4"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Bruce</surname><given-names>MC</given-names></name><name><surname>Day</surname><given-names>KP</given-names></name></person-group><year>2002</year><article-title>Cross-species regulation of malaria parasitaemia in the human host</article-title><source>Curr Opin Microbiol</source><volume>5</volume><fpage>431</fpage><lpage>7</lpage></element-citation></ref><ref id="bib5"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Bruce</surname><given-names>MC</given-names></name><name><surname>Day</surname><given-names>KP</given-names></name></person-group><year>2003</year><article-title>Cross-species regulation of Plasmodium parasitemia in semi-immune children from Papua New Guinea</article-title><source>Trends Parasitol</source><volume>19</volume><fpage>271</fpage><lpage>7</lpage></element-citation></ref><ref id="bib6"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Bruce</surname><given-names>MC</given-names></name><name><surname>Donnelly</surname><given-names>CA</given-names></name><name><surname>Alpers</surname><given-names>MP</given-names></name><name><surname>Galinski</surname><given-names>MR</given-names></name><name><surname>Barnwell</surname><given-names>JW</given-names></name><name><surname>Walliker</surname><given-names>D</given-names></name><etal/></person-group><year>2000a</year><article-title>Cross-species interactions between malaria parasites in humans</article-title><source>Science</source><volume>287</volume><fpage>845</fpage><lpage>8</lpage></element-citation></ref><ref id="bib7"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Bruce</surname><given-names>MC</given-names></name><name><surname>Donnelly</surname><given-names>CA</given-names></name><name><surname>Packer</surname><given-names>M</given-names></name><name><surname>Lagog</surname><given-names>M</given-names></name><name><surname>Gibson</surname><given-names>N</given-names></name><name><surname>Narara</surname><given-names>A</given-names></name><etal/></person-group><year>2000b</year><article-title>Age- and species-specific duration of infection in asymptomatic malaria infections in Papua New Guinea</article-title><source>Parasitology</source><volume>121</volume><fpage>247</fpage><lpage>56</lpage></element-citation></ref><ref id="bib8"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Buckee</surname><given-names>CO</given-names></name><name><surname>Bull</surname><given-names>PC</given-names></name><name><surname>Gupta</surname><given-names>S</given-names></name></person-group><year>2009</year><article-title>Inferring malaria parasite population structure from serological networks</article-title><source>Proc Biol Sci</source><volume>276</volume><fpage>477</fpage><lpage>85</lpage></element-citation></ref><ref id="bib9"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Buckee</surname><given-names>CO</given-names></name><name><surname>Gupta</surname><given-names>S</given-names></name><name><surname>Kriz</surname><given-names>P</given-names></name><name><surname>Maiden</surname><given-names>MC</given-names></name><name><surname>Jolley</surname><given-names>KA</given-names></name></person-group><year>2010</year><article-title>Long-term evolution of antigen repertoires among carried meningococci</article-title><source>Proc Biol Sci</source><volume>277</volume><fpage>1635</fpage><lpage>41</lpage></element-citation></ref><ref id="bib10"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Buckee</surname><given-names>CO</given-names></name><name><surname>Jolley</surname><given-names>KA</given-names></name><name><surname>Recker</surname><given-names>M</given-names></name><name><surname>Penman</surname><given-names>B</given-names></name><name><surname>Kriz</surname><given-names>P</given-names></name><name><surname>Gupta</surname><given-names>S</given-names></name><etal/></person-group><year>2008</year><article-title>Role of selection in the ermergence of lineages and the evolution of virulence in Neisseria meningitidis</article-title><source>Proc Natl Acad Sci USA</source><volume>105</volume><fpage>15082</fpage><lpage>7</lpage></element-citation></ref><ref id="bib11"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Buckee</surname><given-names>CO</given-names></name><name><surname>Recker</surname><given-names>M</given-names></name><name><surname>Watkins</surname><given-names>ER</given-names></name><name><surname>Gupta</surname><given-names>S</given-names></name></person-group><year>2011</year><article-title>Role of stochastic processes in maintaining discrete strain structure in antigenically diverse pathogen populations</article-title><source>Proc Natl Acad Sci USA</source><volume>108</volume><fpage>15504</fpage><lpage>9</lpage></element-citation></ref><ref id="bib12"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Bull</surname><given-names>PC</given-names></name><name><surname>Kyes</surname><given-names>S</given-names></name><name><surname>Buckee</surname><given-names>CO</given-names></name><name><surname>Montgomery</surname><given-names>J</given-names></name><name><surname>Kortok</surname><given-names>MM</given-names></name><name><surname>Newbold</surname><given-names>CI</given-names></name><name><surname>Marsh</surname><given-names>K</given-names></name></person-group><year>2007</year><article-title>An approach to classifying sequence tags sampled from Plasmodium falciparum var genes</article-title><source>Molecular Biochemistry Parasitology</source><volume>154</volume><fpage>98</fpage><lpage>102</lpage></element-citation></ref><ref id="bib13"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Bull</surname><given-names>PC</given-names></name><name><surname>Lowe</surname><given-names>BS</given-names></name><name><surname>Kortok</surname><given-names>M</given-names></name><name><surname>Marsh</surname><given-names>K</given-names></name></person-group><year>1999</year><article-title>Antibody recognition of plasmodium falciparum erythrocyte surface antigens in Kenya: evidence for rare and prevalent variants</article-title><source>Infect Immun</source><volume>67</volume><fpage>733</fpage><lpage>9</lpage></element-citation></ref><ref id="bib14"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Bull</surname><given-names>PC</given-names></name><name><surname>Lowe</surname><given-names>BS</given-names></name><name><surname>Kortok</surname><given-names>M</given-names></name><name><surname>Molyneux</surname><given-names>CS</given-names></name><name><surname>Newbold</surname><given-names>CI</given-names></name><name><surname>Marsh</surname><given-names>K</given-names></name></person-group><year>1998</year><article-title>Parasite antigens on the infected red cell surface are targets for naturally acquired immunity to malaria</article-title><source>Nat Med</source><volume>4</volume><fpage>358</fpage><lpage>60</lpage></element-citation></ref><ref id="bib15"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Chan</surname><given-names>JA</given-names></name><name><surname>Howell</surname><given-names>KB</given-names></name><name><surname>Reiling</surname><given-names>L</given-names></name><name><surname>Ataide</surname><given-names>R</given-names></name><name><surname>Mackintosh</surname><given-names>CL</given-names></name><name><surname>Fowkes</surname><given-names>FJ</given-names></name><etal/></person-group><year>2012</year><article-title>Targets of antibodies against Plasmodium falciparum-infected erythrocytes in malaria immunity</article-title><source>J Clin Invest</source><volume>122</volume><fpage>3227</fpage><lpage>38</lpage></element-citation></ref><ref id="bib16"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Chen</surname><given-names>DS</given-names></name><name><surname>Barry</surname><given-names>AE</given-names></name><name><surname>Leliwa-Syteck</surname><given-names>A</given-names></name><name><surname>Smith</surname><given-names>T</given-names></name><name><surname>Peterson</surname><given-names>I</given-names></name><name><surname>Brown</surname><given-names>SM</given-names></name><etal/></person-group><year>2011</year><article-title>A molecular epidemiological study of var gene diversity to characterize the reservoir of Plasmodium falciparum in humans in Africa</article-title><source>PLoS One</source><volume>6</volume><fpage>e16629</fpage></element-citation></ref><ref id="bib17"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Claessens</surname><given-names>A</given-names></name><name><surname>Adams</surname><given-names>Y</given-names></name><name><surname>Ghumra</surname><given-names>A</given-names></name><name><surname>Lindergard</surname><given-names>G</given-names></name><name><surname>Buchan</surname><given-names>C</given-names></name><name><surname>Andisi</surname><given-names>C</given-names></name><etal/></person-group><year>2012</year><article-title>A subset of group A-like var genes encodes the malaria parasite ligands for binding to human brain endothelial cells</article-title><source>Proc Natl Acad Sci USA</source><volume>109</volume><fpage>E1772</fpage><lpage>81</lpage></element-citation></ref><ref id="bib18"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Conway</surname><given-names>DJ</given-names></name><name><surname>Roper</surname><given-names>C</given-names></name><name><surname>Oduola</surname><given-names>AMJ</given-names></name><name><surname>Arnots</surname><given-names>DE</given-names></name><name><surname>Kremsner</surname><given-names>PG</given-names></name><name><surname>Grobusch</surname><given-names>MP</given-names></name><etal/></person-group><year>1999</year><article-title>High recombination rate in natural populations of Plasmodium falciparum</article-title><source>Proc Natl Acad Sci USA</source><volume>96</volume><fpage>4506</fpage><lpage>11</lpage></element-citation></ref><ref id="bib19"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Deitsch</surname><given-names>KW</given-names></name><name><surname>Hviid</surname><given-names>L</given-names></name></person-group><year>2004</year><article-title>Variant surface antigens, virulence genes and pathogenesis of malaria</article-title><source>Trends Parasitol</source><volume>20</volume><fpage>562</fpage><lpage>6</lpage></element-citation></ref><ref id="bib20"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Deitsch</surname><given-names>KW</given-names></name><name><surname>Lukehart</surname><given-names>SA</given-names></name><name><surname>Stringer</surname><given-names>JR</given-names></name></person-group><year>2009</year><article-title>Common strategies for antigenic variation by bacterial, fungal and protozoan pathogens</article-title><source>Nat Rev Microbiol</source><volume>7</volume><fpage>493</fpage><lpage>503</lpage></element-citation></ref><ref id="bib21"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Dhingra</surname><given-names>N</given-names></name><name><surname>Jha</surname><given-names>P</given-names></name><name><surname>Sharma</surname><given-names>VP</given-names></name><name><surname>Cohen</surname><given-names>AA</given-names></name><name><surname>Jotkar</surname><given-names>RM</given-names></name><name><surname>Rodriguez</surname><given-names>PS</given-names></name><etal/></person-group><year>2010</year><article-title>Adult and child malaria mortality in India: a nationally representative mortality survey</article-title><source>Lancet</source><volume>376</volume><fpage>1768</fpage><lpage>74</lpage></element-citation></ref><ref id="bib22"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Doolan</surname><given-names>DL</given-names></name><name><surname>Dobaño</surname><given-names>C</given-names></name><name><surname>Baird</surname><given-names>JK</given-names></name></person-group><year>2009</year><article-title>Acquired immunity to malaria</article-title><source>Clin Microbiol Rev</source><volume>22</volume><fpage>13</fpage><lpage>36</lpage></element-citation></ref><ref id="bib23"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Ewers</surname><given-names>W</given-names></name></person-group><year>1972</year><article-title>Robert Koch, his work in New Guinea and his contribution to malariology</article-title><source>PNG Med J</source><volume>15</volume><fpage>117</fpage><lpage>24</lpage></element-citation></ref><ref id="bib24"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Frank</surname><given-names>SA</given-names></name></person-group><year>1999</year><article-title>A model for the sequential dominance of antigenic variants in African trypanosome infections</article-title><source>Proc Biol Sci</source><volume>266</volume><fpage>1397</fpage><lpage>401</lpage></element-citation></ref><ref id="bib25"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Frank</surname><given-names>SA</given-names></name><name><surname>Barbour</surname><given-names>AG</given-names></name></person-group><year>2006</year><article-title>Within-host dynamics of antigenic variation</article-title><source>Infect Genet Evol</source><volume>6</volume><fpage>141</fpage><lpage>6</lpage></element-citation></ref><ref id="bib26"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Freitas-Junior</surname><given-names>LH</given-names></name><name><surname>Bottius</surname><given-names>E</given-names></name><name><surname>Pirrit</surname><given-names>LA</given-names></name><name><surname>Deitsch</surname><given-names>KW</given-names></name><name><surname>Scheidig</surname><given-names>C</given-names></name><name><surname>Guinet</surname><given-names>F</given-names></name><etal/></person-group><year>2000</year><article-title>Frequent ectopic recombination of virulence factor genes in telomeric chromosome clusters of P. falciparum</article-title><source>Nature</source><volume>407</volume><fpage>1018</fpage><lpage>22</lpage></element-citation></ref><ref id="bib27"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Giha</surname><given-names>HA</given-names></name><name><surname>Staalsoe</surname><given-names>T</given-names></name><name><surname>Dodoo</surname><given-names>D</given-names></name><name><surname>Roper</surname><given-names>C</given-names></name><name><surname>Satti</surname><given-names>GM</given-names></name><name><surname>Arnot</surname><given-names>DE</given-names></name><etal/></person-group><year>2000</year><article-title>Antibodies to variable Plasmodium falciparum-infected erythrocyte surface antigens are associated with protection from novel malaria infections</article-title><source>Immunol Lett</source><volume>71</volume><fpage>117</fpage><lpage>26</lpage></element-citation></ref><ref id="bib28"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Gillespie</surname><given-names>DT</given-names></name></person-group><year>1977</year><article-title>Exact stochastic simulation of coupled chemical reactions</article-title><source>Journal of Physical Chemistry</source><volume>81</volume><fpage>2340</fpage><lpage>61</lpage></element-citation></ref><ref id="bib29"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Gupta</surname><given-names>S</given-names></name><name><surname>Anderson</surname><given-names>RM</given-names></name></person-group><year>1999</year><article-title>Population structure of pathogens: the role of immune selection</article-title><source>Parasitol Today</source><volume>12</volume><fpage>497</fpage><lpage>501</lpage></element-citation></ref><ref id="bib30"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Gupta</surname><given-names>S</given-names></name><name><surname>Day</surname><given-names>KP</given-names></name></person-group><year>1994a</year><article-title>A strain theory of malaria transmission</article-title><source>Parasitol Today</source><volume>10</volume><fpage>476</fpage><lpage>81</lpage></element-citation></ref><ref id="bib31"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Gupta</surname><given-names>S</given-names></name><name><surname>Day</surname><given-names>KP</given-names></name></person-group><year>1994b</year><article-title>A theoretical framework for the immunoepidemiology of Plasmodium falciparum malaria</article-title><source>Parasite Immunol</source><volume>16</volume><fpage>361</fpage><lpage>70</lpage></element-citation></ref><ref id="bib32"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Gupta</surname><given-names>S</given-names></name><name><surname>Maiden</surname><given-names>MC</given-names></name><name><surname>Feavers</surname><given-names>IM</given-names></name><name><surname>Nee</surname><given-names>S</given-names></name><name><surname>May</surname><given-names>RM</given-names></name><name><surname>Anderson</surname><given-names>RM</given-names></name></person-group><year>1996</year><article-title>The maintenance of strain structure in populations of recombining infectious agents</article-title><source>Nat Med</source><volume>2</volume><fpage>437</fpage><lpage>42</lpage></element-citation></ref><ref id="bib33"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Gupta</surname><given-names>S</given-names></name><name><surname>Trenholme</surname><given-names>K</given-names></name><name><surname>Anderson</surname><given-names>RM</given-names></name><name><surname>Day</surname><given-names>KP</given-names></name></person-group><year>1994</year><article-title>Antigenic diversity and the transmission dynamics of Plasmodium falciparum</article-title><source>Science</source><volume>263</volume><fpage>961</fpage><lpage>3</lpage></element-citation></ref><ref id="bib34"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Hedrick</surname><given-names>P</given-names></name><name><surname>Jain</surname><given-names>S</given-names></name><name><surname>Holden</surname><given-names>L</given-names></name></person-group><year>1978</year><article-title>Multilocus systems in evolution</article-title><source>Evolutionary Biology</source><volume>11</volume><fpage>101</fpage><lpage>84</lpage></element-citation></ref><ref id="bib35"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Jiang</surname><given-names>H</given-names></name><name><surname>Li</surname><given-names>N</given-names></name><name><surname>Gopalan</surname><given-names>V</given-names></name><name><surname>Zilversmit</surname><given-names>MM</given-names></name><name><surname>Varma</surname><given-names>S</given-names></name><name><surname>Nagarajan</surname><given-names>V</given-names></name><etal/></person-group><year>2011</year><article-title>High recombination rates and hotspots in a Plasmodium falciparum genetic cross</article-title><source>Genome Biol</source><volume>12</volume><fpage>R33</fpage></element-citation></ref><ref id="bib36"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Jiang</surname><given-names>H</given-names></name><name><surname>Yi</surname><given-names>M</given-names></name><name><surname>Mu</surname><given-names>J</given-names></name><name><surname>Zhang</surname><given-names>L</given-names></name><name><surname>Ivens</surname><given-names>A</given-names></name><name><surname>Klimczak</surname><given-names>L</given-names></name><etal/></person-group><year>2008</year><article-title>Detection of genome-wide polymorphisms in the AT-rich Plasmodium falciparum genome using a high-density microarray</article-title><source>BMC Genomics</source><volume>9</volume><fpage>398</fpage></element-citation></ref><ref id="bib37"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Kyes</surname><given-names>SA</given-names></name><name><surname>Kraemer</surname><given-names>SM</given-names></name><name><surname>Smith</surname><given-names>JD</given-names></name></person-group><year>2007</year><article-title>Antigenic variation in Plasmodium falciparum: gene organization and regulation of the var multigene family</article-title><source>Eukaryotic Cell</source><volume>6</volume><fpage>1511</fpage><lpage>20</lpage></element-citation></ref><ref id="bib38"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Lavstsen</surname><given-names>T</given-names></name><name><surname>Turner</surname><given-names>L</given-names></name><name><surname>Saguti</surname><given-names>F</given-names></name><name><surname>Magistrado</surname><given-names>P</given-names></name><name><surname>Rask</surname><given-names>TS</given-names></name><name><surname>Jespersen</surname><given-names>JS</given-names></name><etal/></person-group><year>2012</year><article-title>Plasmodium falciparum erythrocyte membrane protein 1 domain cassettes 8 and 13 are associated with severe malaria in children</article-title><source>Proc Natl Acad Sci USA</source><volume>109</volume><fpage>E1791</fpage><lpage>800</lpage></element-citation></ref><ref id="bib39"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Miller</surname><given-names>LH</given-names></name><name><surname>Baruch</surname><given-names>DI</given-names></name><name><surname>Marsh</surname><given-names>K</given-names></name><name><surname>Doumbo</surname><given-names>OK</given-names></name></person-group><year>2002</year><article-title>The pathogenic basis of malaria</article-title><source>Nature</source><volume>415</volume><fpage>673</fpage><lpage>9</lpage></element-citation></ref><ref id="bib40"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Miller</surname><given-names>LH</given-names></name><name><surname>Good</surname><given-names>MF</given-names></name><name><surname>Milon</surname><given-names>G</given-names></name></person-group><year>1994</year><article-title>Malaria pathogenesis</article-title><source>Science</source><volume>264</volume><fpage>1878</fpage><lpage>83</lpage></element-citation></ref><ref id="bib41"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Mu</surname><given-names>J</given-names></name><name><surname>Myers</surname><given-names>RA</given-names></name><name><surname>Jiang</surname><given-names>H</given-names></name><name><surname>Liu</surname><given-names>S</given-names></name><name><surname>Ricklefs</surname><given-names>S</given-names></name><name><surname>Waisberg</surname><given-names>M</given-names></name><etal/></person-group><year>2010</year><article-title>Plasmodium falciparum genome-wide scans for positive selection, recombination hot spots and resistance to antimalarial drugs</article-title><source>Nat Genet</source><volume>42</volume><fpage>268</fpage><lpage>71</lpage></element-citation></ref><ref id="bib42"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Paul</surname><given-names>RE</given-names></name><name><surname>Packer</surname><given-names>MJ</given-names></name><name><surname>Walmsley</surname><given-names>M</given-names></name><name><surname>Lagog</surname><given-names>M</given-names></name><name><surname>Ranford-Cartwright</surname><given-names>LC</given-names></name><name><surname>Paru</surname><given-names>R</given-names></name><etal/></person-group><year>1995</year><article-title>Mating patterns in malaria parasite populations of Papua New Guinea</article-title><source>Science</source><volume>269</volume><fpage>1709</fpage><lpage>11</lpage></element-citation></ref><ref id="bib43"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Recker</surname><given-names>M</given-names></name><name><surname>Buckee</surname><given-names>CO</given-names></name><name><surname>Serazin</surname><given-names>A</given-names></name><name><surname>Kyes</surname><given-names>S</given-names></name><name><surname>Pinches</surname><given-names>R</given-names></name><name><surname>Christodoulou</surname><given-names>Z</given-names></name><etal/></person-group><year>2011</year><article-title>Antigenic variation in Plasmodium falciparum malaria involves a highly structured switching pattern</article-title><source>PLoS Pathog</source><volume>7</volume><fpage>e1001306</fpage></element-citation></ref><ref id="bib44"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Recker</surname><given-names>M</given-names></name><name><surname>Nee</surname><given-names>S</given-names></name><name><surname>Bull</surname><given-names>PC</given-names></name><name><surname>Kinyanjui</surname><given-names>S</given-names></name><name><surname>Marsh</surname><given-names>K</given-names></name><name><surname>Newbold</surname><given-names>C</given-names></name><etal/></person-group><year>2004</year><article-title>Transient cross-reactive immune responses can orchestrate antigenic variation in malaria</article-title><source>Nature</source><volume>429</volume><fpage>555</fpage><lpage>8</lpage></element-citation></ref><ref id="bib45"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Scherf</surname><given-names>A</given-names></name><name><surname>Lopez-Rubio</surname><given-names>JJ</given-names></name><name><surname>Riviere</surname><given-names>L</given-names></name></person-group><year>2008</year><article-title>Antigenic variation in Plasmodium falciparum</article-title><source>Annu. Rev. Microbiol</source><volume>62</volume><fpage>445</fpage><lpage>70</lpage></element-citation></ref><ref id="bib46"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Selander</surname><given-names>RK</given-names></name><name><surname>Musser</surname><given-names>JM</given-names></name><name><surname>Caugant</surname><given-names>DA</given-names></name><name><surname>Gilmour</surname><given-names>MN</given-names></name><name><surname>Whittam</surname><given-names>TS</given-names></name></person-group><year>1987</year><article-title>Population genetics of pathogenic bacteria</article-title><source>Microb Pathog</source><volume>3</volume><fpage>1</fpage><lpage>7</lpage></element-citation></ref><ref id="bib47"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Severins</surname><given-names>M</given-names></name><name><surname>Klinkenberg</surname><given-names>D</given-names></name><name><surname>Heesterbeck</surname><given-names>H</given-names></name></person-group><year>2012</year><article-title>How selection forces dictate the variant surface antigens used by malaria parasites</article-title><source>J R Soc Interface</source><volume>9</volume><fpage>246</fpage><lpage>60</lpage></element-citation></ref><ref id="bib48"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Smith</surname><given-names>M</given-names></name><name><surname>Smith</surname><given-names>NH</given-names></name><name><surname>O'Rourke</surname><given-names>M</given-names></name><name><surname>Spratt</surname><given-names>BG</given-names></name></person-group><year>1993</year><article-title>How clonal are bacteria?</article-title><source>Proc Natl Acad Sci USA</source><volume>90</volume><fpage>4384</fpage><lpage>8</lpage></element-citation></ref><ref id="bib49"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Taylor</surname><given-names>HM</given-names></name><name><surname>Kyes</surname><given-names>SA</given-names></name><name><surname>Newbold</surname><given-names>CI</given-names></name></person-group><year>2000</year><article-title>Var gene diversity in Plasmodium falciparum is generated by frequent recombination events</article-title><source>Mol Biochem Parasitol</source><volume>110</volume><fpage>391</fpage><lpage>7</lpage></element-citation></ref><ref id="bib50"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Tibayrenc</surname><given-names>M</given-names></name></person-group><year>1994</year><article-title>Antigenic diversity and the transmission dynamics of Plasmodium falciparum: the clonality/sexuality debate revisited</article-title><source>Parasitol Today</source><volume>10</volume><fpage>456</fpage><lpage>7</lpage></element-citation></ref><ref id="bib51"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Tibayrenc</surname><given-names>M</given-names></name><name><surname>Ayala</surname><given-names>FJ</given-names></name></person-group><year>2002</year><article-title>The clonal theory of parasitic protozoa: 12 years on</article-title><source>Trends Parasitol</source><volume>18</volume><fpage>405</fpage><lpage>10</lpage></element-citation></ref><ref id="bib52"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Tibayrenc</surname><given-names>M</given-names></name><name><surname>Kjellberg</surname><given-names>F</given-names></name><name><surname>Ayala</surname><given-names>FJ</given-names></name></person-group><year>1990</year><article-title>A clonal theory of parasitic protozoa: the population structures of Entamoeba, Giardia, Leishmania, Naegleria, Plasmodium, Trichomonas, and Trypanosoma and their medical and taxonomical consequences</article-title><source>Proc Natl Acad Sci USA</source><volume>87</volume><fpage>2414</fpage><lpage>8</lpage></element-citation></ref><ref id="bib53"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Volkman</surname><given-names>S</given-names></name><name><surname>Sabeti</surname><given-names>PC</given-names></name><name><surname>DeCaprio</surname><given-names>D</given-names></name><name><surname>Neafsey</surname><given-names>DE</given-names></name><name><surname>Schaffner</surname><given-names>SF</given-names></name><name><surname>Milner</surname><given-names>J</given-names></name><etal/></person-group><year>2006</year><article-title>A genome-wide map of diversity in Plasmodium falciparum</article-title><source>Nat Genet</source><volume>39</volume><fpage>113</fpage><lpage>9</lpage></element-citation></ref><ref id="bib54"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Warimwe</surname><given-names>GM</given-names></name><name><surname>Fegan</surname><given-names>G</given-names></name><name><surname>Musyoki</surname><given-names>JN</given-names></name><name><surname>Newton</surname><given-names>CR</given-names></name><name><surname>Opiyo</surname><given-names>M</given-names></name><name><surname>Githinji</surname><given-names>G</given-names></name><etal/></person-group><year>2012</year><article-title>Prognostic indicators of life-threatening malaria are associated with distinct parasite variant antigen profiles</article-title><source>Sci Transl Med</source><volume>4</volume><fpage>129ra145</fpage><pub-id pub-id-type="doi">10.1126/scitranslmed.3003247</pub-id></element-citation></ref></ref-list></back><sub-article article-type="article-commentary" id="SA1"><front-stub><article-id pub-id-type="doi">10.7554/eLife.00093.010</article-id><title-group><article-title>Decision letter</article-title></title-group><contrib-group content-type="section"><contrib contrib-type="editor"><name><surname>Bergstrom</surname><given-names>Carl T</given-names></name><role>Reviewing editor</role><aff><institution>University of Washington</institution><country>United States</country></aff></contrib></contrib-group></front-stub><body><boxed-text><p>eLife posts the editorial decision letter and author response on a selection of the published articles (subject to the approval of the authors). An edited version of the letter sent to the authors after peer review is shown, indicating the substantive concerns or comments; minor concerns are not usually shown. Reviewers have the opportunity to discuss the decision before the letter is sent (see <ext-link ext-link-type="uri" xlink:href="http://www.elifesciences.org/the-journal/review-process">review process</ext-link>). Similarly, the author response typically shows only responses to the major concerns raised by the reviewers.</p></boxed-text><p>Thank you for choosing to send your work entitled “Population structuring of multi-copy, antigen-encoding genes in <italic>Plasmodium falciparum</italic>” for consideration at <italic>eLife</italic>. Your article has been evaluated by a Senior Editor and 3 reviewers, one of whom is a member of <italic>eLife's</italic> Board of Reviewing Editors.</p><p>The Reviewing Editor, Carl Bergstrom, and the other reviewers discussed their comments before we reached this decision, and the Reviewing Editor has assembled the following comments based on the reviewers' reports.</p><p>Strain theory reveals how immune selection interacts with patterns of transmission to determine the population-genetic structure of pathogen populations. This paper extends strain theory to treat the malaria parasite, by demonstrating the effects on immune selection upon a multi-gene system with sequential expression, as characteristic of the <italic>var</italic> gene family, which is central to the within-host antigenic variation of <italic>Plasmodium falciparum</italic>. On the theoretical side, the authors have answered the question of whether immune selection can cause the parasite population to self-organise into a finite number of strains with non-overlapping <italic>var</italic> repertoires even when the genes are expressed sequentially. They have further shown that the degree of structuring depends on transmission intensity: partially overlapping repertoires can arise when transmission levels are high. On the empirical side, the paper presents an analysis of microsatellite and <italic>var</italic> DBLα sequence data, revealing that linkage disequilibrium among the latter cannot be attributed to demographic forces alone. The following comments should be addressed before acceptance:</p><p>1) The Introduction could be expanded to provide more thorough background for non-specialist readers. Please provide a more detailed paragraph on the biology of the <italic>var</italic> genes, including their domain structure (as it will help the reader understand the data section more easily), before explaining what the model does. We would recommend expanding and clarifying the background sentences “Individual <italic>Plasmodium</italic> genomes…among <italic>var</italic> loci”, before describing the model and its findings.</p><p>2) The authors observe episodes of restructuring leading to punctuated turnover. It is clear from the exposition that this is a dynamically different process to the cyclical strain structure exhibited by the deterministic model under intermediate levels of immune selection. If possible without extensive further analysis, are the authors able to comment on the following? To what degree does the sequential expression itself contribute to this phenomenon? In other words, is this behavior likely to be observed in a stochastic multi-locus model without sequential expression? Or is the instability inextricably linked to sequential expression?</p><p>3) It is not obvious that “This important insight provides a plausible explanation for why it is so difficult to eliminate malaria”. However, the predicted failure of transmission control strategies to reduce <italic>var</italic> diversity may have important ramifications for the reduction of disease, given that PfEMP1 is now firmly established as the principal target of clinical immunity. Would the authors feel comfortable speculating on the differential effects of reducing transmission on disease and infection?</p><p>4) Please provide some explanation on how well the model works under the assumption that immunity is not life long given recent evidence that malaria may well kill adults as well as children (Dhingra et al, Lancet 2010). This needs to be addressed only in the Discussion.</p><p>5) Parts of the Materials and methods are difficult to follow and parameters such as nh are not always clearly defined. Please make an effort to clarify. Two-letter parameter names, e.g., gp, sl, nh, can look like products. Please consider changing these. Why is the total number of distinct <italic>var</italic> repertoires given by gp!/sl! instead of gp!/((gp-sl)! sl!)?</p></body></sub-article><sub-article article-type="reply" id="SA2"><front-stub><article-id pub-id-type="doi">10.7554/eLife.00093.011</article-id><title-group><article-title>Author response</article-title></title-group></front-stub><body><p><italic>1) The Introduction could be expanded to provide more thorough background for non-specialist readers. Please provide a more detailed paragraph on the biology of the var genes, including their domain structure (as it will help the reader understand the data section more easily), before explaining what the model does. We would recommend expanding and clarifying the background sentences “Individual Plasmodium genomes…among var loci”, before describing the model and its findings</italic>.</p><p>We have now expanded the background information on the <italic>var</italic> genes in the Introduction.</p><p><italic>2) The authors observe episodes of restructuring leading to punctuated turnover. It is clear from the exposition that this is a dynamically different process to the cyclical strain structure exhibited by the deterministic model under intermediate levels of immune selection. If possible without extensive further analysis, are the authors able to comment on the following? To what degree does the sequential expression itself contribute to this phenomenon? In other words, is this behavior likely to be observed in a stochastic multi-locus model without sequential expression? Or is the instability inextricably linked to sequential expression</italic>?</p><p>In extensions of our work we have shown that episodes of restructuring with punctuated turnover do not depend on sequential expression. This phenomenon was observed in stochastic multi-locus models, both with, and without, sequential expression. However, we cannot yet say if these episodes are more likely to occur when expression is ordered.</p><p>We should also note that the likeliness of these episodes may vary when considering different within host rules, but nonetheless, in all the cases we discussed here, episodes of restructuring did take place.</p><p>We have reported the robustness of this phenomenon to relaxing the assumption of sequential expression in the Results section (see end of the third paragraph in this section).</p><p><italic>3) It is not obvious that “This important insight provides a plausible explanation for why it is so difficult to eliminate malaria”. However, the predicted failure of transmission control strategies to reduce var diversity may have important ramifications for the reduction of disease, given that PfEMP1 is now firmly established as the principal target of clinical immunity. Would the authors feel comfortable speculating on the differential effects of reducing transmission on disease and infection</italic>?</p><p>We have rewritten that sentence in the Discussion to better clarify what we meant. We have also added a paragraph in the Discussion on the effect of control. We have only briefly speculated on the consequences for disease vs. infection with respect to their age distribution. To better support this paragraph, we have replaced one of the plots in Figure 4 to illustrate age distributions, and added Figure 5 to better illustrate the results that were already in the text regarding the change in the overlap of repertoires with transmission intensity.</p><p><italic>4) Please provide some explanation on how well the model works under the assumption that immunity is not life long given recent evidence that malaria may well kill adults as well as children (Dhingra et al, Lancet 2010). This needs to be addressed only in the Discussion</italic>.</p><p>We have added a discussion on short-lived immunity and the reference by Dhingra et al. in the second paragraph of the Discussion to indicate that our results are robust to modifying the assumption of lifelong immunity.</p><p><italic>5) Parts of the Materials and methods are difficult to follow and parameters such as nh are not always clearly defined. Please make an effort to clarify. Two-letter parameter names, e.g., gp, sl, nh, can look like products. Please consider changing these. Why is the total number of distinct var repertoires given by gp!/sl! instead of gp!/((gp-sl)! sl!)</italic>?</p><p>We have replaced these parameter names with the following: G represents the general gene pool size, g is the number of genes in each parasite genome, and H is the total population size. We think this new notation helps to make this section clearer.</p><p>The total number of distinct <italic>var</italic> repertoires should be G!/(G-g)! (earlier this was gp!/sl!). This is because in our model we assume the order of expression is fixed and this order matters when counting the different repertoires. Hence, for a group of g genes there are exactly g! different strain types. These different strains are composed of identical genes, but the particular order of expression of each of these can have significance, particularly in the presence of other strain types that have partially overlapping genes. More generally, we are considering the number of ordered arrangements of n objects taken from N different objects; this is given by N!/(N-n)!</p><p>Note that fixed order is not a necessary condition for our results. We simulated cases where for each infection event, the order of expression of the particular genome being transmitted would be reshuffled with a certain probability. In the extreme case when this probability is 1, for a group of g genes there would effectively be exactly 1 strain type because the particular order of expression would not matter any more. For these different cases, structuring of the parasite population was also seen to emerge.</p></body></sub-article></article> |