<?xml version="1.0" encoding="UTF-8"?><!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Archiving and Interchange DTD v1.1d1 20130915//EN" "JATS-archivearticle1.dtd"><article article-type="research-article" dtd-version="1.1d1" xmlns:xlink="http://www.w3.org/1999/xlink"><front><journal-meta><journal-id journal-id-type="nlm-ta">elife</journal-id><journal-id journal-id-type="hwp">eLife</journal-id><journal-id journal-id-type="publisher-id">eLife</journal-id><journal-title-group><journal-title>eLife</journal-title></journal-title-group><issn publication-format="electronic">2050-084X</issn><publisher><publisher-name>eLife Sciences Publications, Ltd</publisher-name></publisher></journal-meta><article-meta><article-id pub-id-type="publisher-id">03198</article-id><article-id pub-id-type="doi">10.7554/eLife.03198</article-id><article-categories><subj-group subj-group-type="display-channel"><subject>Research article</subject></subj-group><subj-group subj-group-type="heading"><subject>Genomics and evolutionary biology</subject></subj-group><subj-group subj-group-type="heading"><subject>Plant biology</subject></subj-group></article-categories><title-group><article-title>Natural epigenetic polymorphisms lead to intraspecific variation in Arabidopsis gene imprinting</article-title></title-group><contrib-group><contrib contrib-type="author" id="author-8995"><name><surname>Pignatta</surname><given-names>Daniela</given-names></name><xref ref-type="aff" rid="aff1"/><xref ref-type="fn" rid="con1"/><xref ref-type="fn" rid="conf1"/><xref ref-type="other" rid="dataro1"/></contrib><contrib contrib-type="author" id="author-13583"><name><surname>Erdmann</surname><given-names>Robert M</given-names></name><xref ref-type="aff" rid="aff1"/><xref ref-type="aff" rid="aff2"/><xref ref-type="other" rid="par-3"/><xref ref-type="fn" rid="con3"/><xref ref-type="fn" rid="conf1"/><xref ref-type="other" rid="dataro1"/></contrib><contrib contrib-type="author" 
id="author-13584"><name><surname>Scheer</surname><given-names>Elias</given-names></name><xref ref-type="aff" rid="aff1"/><xref ref-type="fn" rid="con4"/><xref ref-type="fn" rid="conf1"/><xref ref-type="other" rid="dataro1"/></contrib><contrib contrib-type="author" id="author-13585"><name><surname>Picard</surname><given-names>Colette L</given-names></name><xref ref-type="aff" rid="aff1"/><xref ref-type="aff" rid="aff3"/><xref ref-type="other" rid="par-3"/><xref ref-type="fn" rid="con5"/><xref ref-type="fn" rid="conf1"/></contrib><contrib contrib-type="author" id="author-8998"><name><surname>Bell</surname><given-names>George W</given-names></name><xref ref-type="aff" rid="aff1"/><xref ref-type="fn" rid="con6"/><xref ref-type="fn" rid="conf1"/><xref ref-type="other" rid="dataro1"/></contrib><contrib contrib-type="author" corresp="yes" id="author-8476"><name><surname>Gehring</surname><given-names>Mary</given-names></name><xref ref-type="aff" rid="aff1"/><xref ref-type="aff" rid="aff2"/><xref ref-type="aff" rid="aff3"/><xref ref-type="corresp" rid="cor1">*</xref><xref ref-type="other" rid="par-1"/><xref ref-type="other" rid="par-2"/><xref ref-type="fn" rid="con2"/><xref ref-type="fn" rid="conf1"/><xref ref-type="other" rid="dataro1"/><xref ref-type="other" rid="dataro2"/></contrib><aff id="aff1"><institution>Whitehead Institute for Biomedical Research</institution>, <addr-line><named-content content-type="city">Cambridge</named-content></addr-line>, <country>United States</country></aff><aff id="aff2"><institution content-type="dept">Department of Biology</institution>, <institution>Massachusetts Institute of Technology</institution>, <addr-line><named-content content-type="city">Cambridge</named-content></addr-line>, <country>United States</country></aff><aff id="aff3"><institution content-type="dept">Computational and Systems Biology Graduate Program</institution>, <institution>Massachusetts Institute of Technology</institution>, <addr-line><named-content 
content-type="city">Cambridge</named-content></addr-line>, <country>United States</country></aff></contrib-group><contrib-group content-type="section"><contrib contrib-type="editor"><name><surname>Weigel</surname><given-names>Detlef</given-names></name><role>Reviewing editor</role><aff><institution>Max Planck Institute for Developmental Biology</institution>, <country>Germany</country></aff></contrib></contrib-group><author-notes><corresp id="cor1"><label>*</label>For correspondence: <email>mgehring@wi.mit.edu</email></corresp></author-notes><pub-date date-type="pub" publication-format="electronic"><day>03</day><month>07</month><year>2014</year></pub-date><pub-date pub-type="collection"><year>2014</year></pub-date><volume>3</volume><elocation-id>e03198</elocation-id><history><date date-type="received"><day>25</day><month>04</month><year>2014</year></date><date date-type="accepted"><day>02</day><month>07</month><year>2014</year></date></history><permissions><copyright-statement>© 2014, Pignatta et al</copyright-statement><copyright-year>2014</copyright-year><copyright-holder>Pignatta et al</copyright-holder><license xlink:href="http://creativecommons.org/licenses/by/4.0/"><license-p>This article is distributed under the terms of the <ext-link ext-link-type="uri" xlink:href="http://creativecommons.org/licenses/by/4.0/">Creative Commons Attribution License</ext-link>, which permits unrestricted use and redistribution provided that the original author and source are credited.</license-p></license></permissions><self-uri content-type="pdf" xlink:href="elife03198.pdf"/><abstract><object-id pub-id-type="doi">10.7554/eLife.03198.001</object-id><p>Imprinted gene expression occurs during seed development in plants and is associated with differential DNA methylation of parental alleles, particularly at proximal transposable elements (TEs). Imprinting variability could contribute to observed parent-of-origin effects on seed development. 
We investigated intraspecific variation in imprinting, coupled with analysis of DNA methylation and small RNAs, among three Arabidopsis strains with diverse seed phenotypes. The majority of imprinted genes were parentally biased in the same manner among all strains. However, we identified several examples of allele-specific imprinting correlated with intraspecific epigenetic variation at a TE. We successfully predicted imprinting in additional strains based on methylation variability. We conclude that there is standing variation in imprinting even in recently diverged genotypes due to intraspecific epiallelic variation. Our data demonstrate that epiallelic variation and genomic imprinting intersect to produce novel gene expression patterns in seeds.</p><p><bold>DOI:</bold> <ext-link ext-link-type="doi" xlink:href="10.7554/eLife.03198.001">http://dx.doi.org/10.7554/eLife.03198.001</ext-link></p></abstract><abstract abstract-type="executive-summary"><object-id pub-id-type="doi">10.7554/eLife.03198.002</object-id><title>eLife digest</title><p>When animals or plants reproduce sexually, the DNA in a sperm or pollen is combined with that in an egg cell to generate an offspring that inherits two copies of each gene, one from each parent. For a very small number of genes, the copy from one of the parents is consistently turned off. This process—called imprinting—means that the same gene can have different effects depending on if it is inherited from the mother or the father. In plants, imprinting is vital for the production of seeds and typically occurs in the endosperm: the tissue within a seed that provides nourishment to the plant embryo.</p><p>One way genes can be imprinted is by adding small chemical marks—called methyl groups—on to the DNA that makes up the gene or nearby sequences. These marks can either switch on, or switch off, the expression of the gene. 
DNA methylation also immobilises stretches of DNA called transposable elements, stopping them from moving from one location to another in the genome. These stretches of DNA are identified and targeted for methylation by small molecules of RNA that match their DNA sequences.</p><p>Genes that are imprinted in the endosperm of the model plant Arabidopsis are often associated with transposable elements, which can be methylated differently in the naturally occurring varieties, or strains, of Arabidopsis. However, it is unclear how many genes are differently imprinted between these different strains.</p><p>Pignatta et al. looked for differences in gene imprinting, DNA methylation and small RNA production in the seeds, embryos and endosperm tissue from three strains of Arabidopsis. They also examined seeds from crosses between these three strains.</p><p>While most genes had the same imprinting pattern in all strains and crosses examined, 12 genes were imprinted differently depending on whether they were inherited from the male or female of a given strain. For example, for some genes the copy inherited from the male parent is always turned off, unless it is inherited via the pollen of one specific Arabidopsis strain. Half of this variation could be explained by a transposable element near to each gene that was methylated differently among the strains.</p><p>By comparing the differentially methylated regions in the genomes of 140 Arabidopsis strains, Pignatta et al. 
found that differences in methylation may affect 11% of imprinted genes—and went on to confirm variable imprinting in some Arabidopsis strains based on the presence or absence of DNA methylation.</p><p>Future work is needed to understand how variation in gene imprinting might affect the traits of hybrid seeds, and how it might affect the evolution of new traits in hybrid plants.</p><p><bold>DOI:</bold> <ext-link ext-link-type="doi" xlink:href="10.7554/eLife.03198.002">http://dx.doi.org/10.7554/eLife.03198.002</ext-link></p></abstract><kwd-group kwd-group-type="author-keywords"><title>Author keywords</title><kwd>genomic imprinting</kwd><kwd>DNA methylation</kwd><kwd>natural variation</kwd><kwd>epialleles</kwd><kwd>transposable elements</kwd><kwd>seeds</kwd></kwd-group><kwd-group kwd-group-type="research-organism"><title>Research organism</title><kwd>Arabidopsis</kwd></kwd-group><funding-group><award-group id="par-1"><funding-source><institution-wrap><institution-id institution-id-type="FundRef">http://dx.doi.org/10.13039/100000001</institution-id><institution>National Science Foundation</institution></institution-wrap></funding-source><award-id>MCB 1121952</award-id><principal-award-recipient><name><surname>Gehring</surname><given-names>Mary</given-names></name></principal-award-recipient></award-group><award-group id="par-2"><funding-source><institution-wrap><institution-id institution-id-type="FundRef">http://dx.doi.org/10.13039/100000875</institution-id><institution>Pew Charitable Trusts</institution></institution-wrap></funding-source><award-id>Pew Scholars Program in the Biomedical Sciences</award-id><principal-award-recipient><name><surname>Gehring</surname><given-names>Mary</given-names></name></principal-award-recipient></award-group><award-group id="par-3"><funding-source><institution-wrap><institution-id institution-id-type="FundRef">http://dx.doi.org/10.13039/100000001</institution-id><institution>National Science 
Foundation</institution></institution-wrap></funding-source><award-id>Graduate Research Fellowship</award-id><principal-award-recipient><name><surname>Erdmann</surname><given-names>Robert M</given-names></name><name><surname>Picard</surname><given-names>Colette L</given-names></name></principal-award-recipient></award-group><funding-statement>The funders had no role in study design, data collection and interpretation, or the decision to submit the work for publication.</funding-statement></funding-group><custom-meta-group><custom-meta><meta-name>elife-xml-version</meta-name><meta-value>2</meta-value></custom-meta><custom-meta specific-use="meta-only"><meta-name>Author impact statement</meta-name><meta-value>By examining natural variation in DNA methylation for effects on parent-of-origin specific expression, it is demonstrated that epiallelic variation intersects with genomic imprinting mechanisms to produce novel gene expression patterns in seeds.</meta-value></custom-meta></custom-meta-group></article-meta></front><body><sec id="s1" sec-type="intro"><title>Introduction</title><p>Diploid sexually reproducing organisms inherit an allele of each gene from both parents, which masks deleterious effects of recessive mutations. However, a subset of genes in flowering plants and mammals are subject to imprinting, whereby genes are expressed predominantly from one allele in a parent-of-origin dependent manner, such that traits controlled by these genes reflect the genotype of only one parent. Imprinted gene expression affects fetal growth regulation and postnatal behavior in mammals and the formation of viable seeds and the inhibition of interspecies hybridization in plants (<xref ref-type="bibr" rid="bib54">Tycko and Morison, 2002</xref>; <xref ref-type="bibr" rid="bib25">Jiang and Köhler, 2012</xref>; <xref ref-type="bibr" rid="bib31">Kradolfer et al., 2013</xref>). 
Imprinting is primarily restricted to the endosperm in plants, the triploid tissue that develops alongside the embryo and is necessary for normal embryo patterning and growth. Genome-wide surveys for imprinted expression have identified several dozen to hundreds of imprinted genes in rice, maize, Arabidopsis, mice, mules, and hinnies (<xref ref-type="bibr" rid="bib13">Gehring et al., 2011</xref>; <xref ref-type="bibr" rid="bib20">Hsieh et al., 2011</xref>; <xref ref-type="bibr" rid="bib37">Luo et al., 2011</xref>; <xref ref-type="bibr" rid="bib61">Wolff et al., 2011</xref>; <xref ref-type="bibr" rid="bib64">Zhang et al., 2011</xref>; <xref ref-type="bibr" rid="bib8">DeVeale et al., 2012</xref>; <xref ref-type="bibr" rid="bib60">Waters et al., 2012</xref>; <xref ref-type="bibr" rid="bib62">Xin et al., 2013</xref>; <xref ref-type="bibr" rid="bib58">Wang et al., 2013b</xref>). Differential DNA methylation and histone modifications between maternally-inherited and paternally-inherited alleles are important regulators of imprinted gene expression (<xref ref-type="bibr" rid="bib30">Köhler et al., 2012</xref>). Endosperm DNA is maternally hypomethylated at thousands of discrete loci (<xref ref-type="bibr" rid="bib11">Gehring et al., 2009</xref>; <xref ref-type="bibr" rid="bib19">Hsieh et al., 2009</xref>; <xref ref-type="bibr" rid="bib23">Ibarra et al., 2012</xref>) in a process dependent on the 5-methylcytosine DNA glycosylase DME (<xref ref-type="bibr" rid="bib12">Gehring et al., 2006</xref>, <xref ref-type="bibr" rid="bib11">2009</xref>; <xref ref-type="bibr" rid="bib19">Hsieh et al., 2009</xref>; <xref ref-type="bibr" rid="bib23">Ibarra et al., 2012</xref>). 
Maintenance and de novo methylation pathways also appear to be compromised in the central cell and during early endosperm development (<xref ref-type="bibr" rid="bib26">Jullien et al., 2012</xref>; <xref ref-type="bibr" rid="bib5">Belmonte et al., 2013</xref>; <xref ref-type="bibr" rid="bib55">Vu et al., 2013</xref>), which might further contribute to loss of methylation from the maternally inherited genome. Endosperm DMRs (differentially methylated regions) are enriched for TE sequences, although not all imprinted genes are associated with a neighboring TE (<xref ref-type="bibr" rid="bib11">Gehring et al., 2009</xref>).</p><p>TE methylation dynamics during reproduction appear to be an important driver of imprinted gene expression, yet the epigenetic modification of TEs and their presence or absence in genomes can be variable on short evolutionary timescales. Although very few TEs are presently active in <italic>Arabidopsis thaliana</italic>, most differences between genomic sequences of Arabidopsis strains are due to variation in TEs (<xref ref-type="bibr" rid="bib7">Cao et al., 2011</xref>). Many euchromatic TEs and related sequences are targeted for RNA-directed DNA methylation (RdDM), an active process through which 24-nt small RNAs derived from longer non-coding RNA transcripts direct DNA methyltransferases to cognate sequences (<xref ref-type="bibr" rid="bib35">Law and Jacobsen, 2010</xref>). RdDM is important for maintaining transcriptional silencing of TEs. Gene expression is negatively correlated with the proximity of TEs targeted by small RNAs and methylated TEs are under stronger purifying selection when they are near genes (<xref ref-type="bibr" rid="bib17">Hollister and Gaut, 2009</xref>; <xref ref-type="bibr" rid="bib57">Wang et al., 2013a</xref>). 
TE methylation is quite stable, although loss of methylation at TEs can occur spontaneously at very low frequency (<xref ref-type="bibr" rid="bib4">Becker et al., 2011</xref>; <xref ref-type="bibr" rid="bib43">Schmitz et al., 2011</xref>). However, a quarter of TEs in Arabidopsis are not methylated (<xref ref-type="bibr" rid="bib1">Ahmed et al., 2011</xref>) and only 68% are associated with small RNAs (<xref ref-type="bibr" rid="bib18">Hollister et al., 2011</xref>). Thus the epigenetic modification status of TEs can be variable within the species, between different classes of elements, or even among elements of the same family.</p><p>The potential role of TEs in establishing or maintaining imprinted expression coupled with the evolutionary forces that select for parent-of-origin specific expression suggest that substantial intraspecific variation in imprinting could exist. Indeed, the first imprinted gene described, the maize <italic>R</italic> gene (<xref ref-type="bibr" rid="bib27">Kermicle, 1970</xref>), is an example of allele-specific imprinting; only alleles that have a <italic>Doppia</italic> TE inserted in the promoter are imprinted (<xref ref-type="bibr" rid="bib28">Kermicle, 1978</xref>; <xref ref-type="bibr" rid="bib56">Walker, 1998</xref>; <xref ref-type="bibr" rid="bib2">Alleman and Doctor, 2000</xref>). Once imprinted gene expression arises, the kinship or parental conflict theory of imprinting (<xref ref-type="bibr" rid="bib16">Haig, 2013</xref>) posits that it could be evolutionarily selected because asymmetrically related kin (e.g., half-siblings that have the same mother but different fathers) compete for maternal resources. Thus, maternally and paternally inherited alleles of genes that influence maternal resource transfer to offspring have different optima for total gene expression levels. Plants adopt a range of different strategies with regards to maternal resource transfer to offspring—producing a few large seeds, or many small seeds. 
Intraspecific variation in this trait could potentially be linked to differences in the set of genes subject to imprinting in each strain. To systematically evaluate whether gene imprinting varies on short evolutionary time scales and to further understand the role of genetic and epigenetic polymorphisms in this process, we have investigated the conservation and variability of imprinting, DNA methylation, and small RNA production in reciprocal crosses among three strains of Arabidopsis. Arabidopsis is an ideal system in which to ask these questions because of the availability of genotyped and epigenotyped strains that have diverged for only a few thousand years.</p><p>Here we discovered 12 examples of allele-specific imprinting, about half of which were associated with endosperm demethylation of a TE that was variably methylated within the strains we examined. We further evaluated intraspecific methylation variability at regions targeted for CG DNA demethylation during female reproductive development for 140 strains where vegetative methylation patterns are known (<xref ref-type="bibr" rid="bib44">Schmitz et al., 2013</xref>). Approximately 11% of imprinted genes are associated with an endosperm DMR that is variably methylated among strains. From this analysis we predicted and experimentally validated allele-specific imprinting in additional strains for two genes. The ability to predict imprinting status based on strain-to-strain variation in vegetative methylation patterns suggests that these genes are strong candidates for allelic variation in imprinting due to epigenetic differences at TEs, and thus act as epialleles. Our data demonstrate that epiallelic variation and genomic imprinting intersect to produce novel gene expression patterns in seeds. 
Thus, naturally occurring epialleles could have the strongest phenotypic effect during the reproductive phase of plant development, when patterns of methylation are altered.</p></sec><sec id="s2" sec-type="results"><title>Results</title><p>We analyzed genome-wide DNA methylation, small RNA, and gene expression patterns in whole seeds, embryo, and endosperm of three different <italic>Arabidopsis thaliana</italic> strains and in reciprocal crosses among them to investigate imprinting variation within the species and to assess the role of epigenetic polymorphisms in this process. We focused on the commonly used strains Col and Ler and the more polymorphic strain Cvi (<xref ref-type="bibr" rid="bib40">Nordborg et al., 2005</xref>). Cvi produces larger seeds than Col or Ler (<xref ref-type="fig" rid="fig1s1">Figure 1—figure supplement 1</xref>) due to increased and prolonged endosperm and integument growth (<xref ref-type="bibr" rid="bib3">Alonso-Blanco et al., 1999</xref>), an effect that is even more pronounced when Cvi is pollinated by Col or Ler (<xref ref-type="fig" rid="fig1s1">Figure 1—figure supplement 1</xref>). In our experimental design the Col, Ler and Cvi alleles for each gene were represented twice as the maternally or paternally inherited allele, allowing us to draw conclusions about the activity of an allele independent of the genotype of the other parent in the cross.</p><sec id="s2-1"><title>Allele-specific expression analysis identifies genes imprinted among all strains</title><p>We first identified genes with consistent parentally biased expression in embryo and endosperm using mRNA-seq data from six different crosses representing three sets of reciprocals: Col-Ler, Col-Cvi, and Ler-Cvi (<xref ref-type="fig" rid="fig1">Figure 1</xref>, <xref ref-type="supplementary-material" rid="SD1-data">Figure 1—source data 1</xref>). 
Imprinting could be evaluated for 16,646 loci in at least one set of reciprocal crosses and 8088 loci in all three sets of reciprocal crosses based on SNPs and sequencing depth. As previously, we implemented a series of filters to define imprinted genes (<xref ref-type="bibr" rid="bib13">Gehring et al., 2011</xref>) ('Materials and methods') except that we added an additional filtering step to require endosperm maternally biased genes to have at least 85% maternal reads in each direction of the cross and paternally biased genes to have at least 50% paternal reads in each direction of the cross (the maternal and paternal cutoffs in the embryo were 70%) (<xref ref-type="fig" rid="fig1">Figure 1</xref>). In the endosperm between 122 and 145 maternally expressed imprinted genes (MEGs) were identified for each pair of reciprocal crosses (Col-Ler, Col-Cvi, or Ler-Cvi) along with between 43 and 52 paternally expressed imprinted genes (PEGs) for a total of 285 possible MEGs (including 5 TEs) and 103 PEGs in the union of all crosses (<xref ref-type="fig" rid="fig1">Figure 1B</xref>, <xref ref-type="supplementary-material" rid="SD2-data">Figure 1—source data 2</xref>). Many of these genes have previously been identified as imprinted genes (<xref ref-type="supplementary-material" rid="SD4-data">Figure 1—source data 4</xref>). Consistent with previous results (<xref ref-type="bibr" rid="bib13">Gehring et al., 2011</xref>; <xref ref-type="bibr" rid="bib20">Hsieh et al., 2011</xref>), very few potential imprinted genes were detected in the embryo (<xref ref-type="fig" rid="fig1">Figure 1C</xref>, <xref ref-type="supplementary-material" rid="SD3-data">Figure 1—source data 3</xref>). 
Imprinting calls based on whole-genome mRNA-seq were validated by sequencing or performing CAPs digestion on RT-PCR amplicons of 29 genes from independently isolated embryo and endosperm RNA samples (<xref ref-type="fig" rid="fig1s2">Figure 1—figure supplement 2</xref>, <xref ref-type="supplementary-material" rid="SD5-data">Figure 1—source data 5</xref>); results were mostly consistent with the mRNA-seq data.<fig-group><fig id="fig1" position="float"><object-id pub-id-type="doi">10.7554/eLife.03198.003</object-id><label>Figure 1.</label><caption><title>mRNA-seq identifies genes with biased expression.</title><p>(<bold>A</bold>) Proportion of maternal (m) and paternal (p) reads for all three sets of reciprocal crosses in the endosperm. One replicate of each reciprocal cross is shown. Biases represented by each quadrant are depicted for Col-Ler endosperm crosses but apply to all graphs. Orange and pink dots represent MEGs (pink dots are MEGs in all three sets of reciprocal crosses), blue and green dots represent PEGs (blue dots are PEGs in all three sets of reciprocal crosses). Crosshairs indicate the expected log ratio for genes that lack biased expression. (<bold>B</bold>) Overlap of MEGs and PEGs in the endosperm among three sets of reciprocal crosses. Pink and blue circles: Col-Ler; brown and purple circles: Col-Cvi; yellow and gray circles: Ler-Cvi. (<bold>C</bold>) Proportion of maternal (m) and paternal (p) reads for Col-Cvi and Cvi-Ler reciprocal crosses in the embryo. Colored dots as in part <bold>A</bold>. <xref ref-type="fig" rid="fig1s1">Figure 1—figure supplement 1</xref> shows seeds used in the experiment. <xref ref-type="fig" rid="fig1s2">Figure 1—figure supplement 2</xref> shows validation of an imprinted gene. <xref ref-type="fig" rid="fig1s3">Figure 1—figure supplement 3</xref> examines maternal:paternal ratios of imprinted genes identified in one set of crosses in the other two sets of reciprocal crosses. 
<xref ref-type="fig" rid="fig1s4">Figure 1—figure supplement 4</xref> examines overall expression levels of imprinted genes at other stages of development. Information on mRNA-seq library metrics is in <xref ref-type="supplementary-material" rid="SD1-data">Figure 1—source data 1</xref> and allele-specific expression information for all genes in endosperm and embryo is in <xref ref-type="supplementary-material" rid="SD2-data">Figure 1—source data 2</xref> and <xref ref-type="supplementary-material" rid="SD3-data">Figure 1—source data 3</xref>, respectively. <xref ref-type="supplementary-material" rid="SD4-data">Figure 1—source data 4</xref> shows the overlap among imprinted genes identified in this study and those identified in previous efforts and <xref ref-type="supplementary-material" rid="SD5-data">Figure 1—source data 5</xref> includes independent validation of imprinted genes.</p><p><bold>DOI:</bold> <ext-link ext-link-type="doi" xlink:href="10.7554/eLife.03198.003">http://dx.doi.org/10.7554/eLife.03198.003</ext-link></p><p><supplementary-material id="SD1-data"><object-id pub-id-type="doi">10.7554/eLife.03198.004</object-id><label>Figure 1—source data 1.</label><caption><title>mRNA-seq libraries generated in this study.</title><p><bold>DOI:</bold> <ext-link ext-link-type="doi" xlink:href="10.7554/eLife.03198.004">http://dx.doi.org/10.7554/eLife.03198.004</ext-link></p></caption><media mime-subtype="xlsx" mimetype="application" xlink:href="elife03198s001.xlsx"/></supplementary-material></p><p><supplementary-material id="SD2-data"><object-id pub-id-type="doi">10.7554/eLife.03198.005</object-id><label>Figure 1—source data 2.</label><caption><title>Endosperm imprinting data for all genes.</title><p><bold>DOI:</bold> <ext-link ext-link-type="doi" xlink:href="10.7554/eLife.03198.005">http://dx.doi.org/10.7554/eLife.03198.005</ext-link></p></caption><media mime-subtype="xlsx" mimetype="application" 
xlink:href="elife03198s002.xlsx"/></supplementary-material></p><p><supplementary-material id="SD3-data"><object-id pub-id-type="doi">10.7554/eLife.03198.006</object-id><label>Figure 1—source data 3.</label><caption><title>Embryo imprinting data for all genes.</title><p><bold>DOI:</bold> <ext-link ext-link-type="doi" xlink:href="10.7554/eLife.03198.006">http://dx.doi.org/10.7554/eLife.03198.006</ext-link></p></caption><media mime-subtype="xlsx" mimetype="application" xlink:href="elife03198s003.xlsx"/></supplementary-material></p><p><supplementary-material id="SD4-data"><object-id pub-id-type="doi">10.7554/eLife.03198.007</object-id><label>Figure 1—source data 4.</label><caption><title>Overlap among published imprinted gene lists.</title><p><bold>DOI:</bold> <ext-link ext-link-type="doi" xlink:href="10.7554/eLife.03198.007">http://dx.doi.org/10.7554/eLife.03198.007</ext-link></p></caption><media mime-subtype="xlsx" mimetype="application" xlink:href="elife03198s004.xlsx"/></supplementary-material></p><p><supplementary-material id="SD5-data"><object-id pub-id-type="doi">10.7554/eLife.03198.008</object-id><label>Figure 1—source data 5.</label><caption><title>Validation of imprinted genes.</title><p><bold>DOI:</bold> <ext-link ext-link-type="doi" xlink:href="10.7554/eLife.03198.008">http://dx.doi.org/10.7554/eLife.03198.008</ext-link></p></caption><media mime-subtype="xlsx" mimetype="application" xlink:href="elife03198s005.xlsx"/></supplementary-material></p></caption><graphic xlink:href="elife03198f001"/></fig><fig id="fig1s1" position="float" specific-use="child-fig"><object-id pub-id-type="doi">10.7554/eLife.03198.009</object-id><label>Figure 1—figure supplement 1.</label><caption><title>Seed development in the crosses used in this study.</title><p>(<bold>A</bold>) Seeds cleared with chloral hydrate and imaged 6 days after pollination. Scale bar = 100 microns for all panels. (<bold>B</bold>) Mature seeds. 
Scale bar = 500 microns.</p><p><bold>DOI:</bold> <ext-link ext-link-type="doi" xlink:href="10.7554/eLife.03198.009">http://dx.doi.org/10.7554/eLife.03198.009</ext-link></p></caption><graphic xlink:href="elife03198fs001"/></fig><fig id="fig1s2" position="float" specific-use="child-fig"><object-id pub-id-type="doi">10.7554/eLife.03198.010</object-id><label>Figure 1—figure supplement 2.</label><caption><title>Validation of AT4G00750 allele-specific imprinting by RT-PCR and CAPs digestion.</title><p>Endosperm cDNA from the indicated crosses (female in cross listed first) was amplified using intron-spanning primers that flank a C&gt;G polymorphism between Col and Ler or Cvi and then restriction digested with Hpy188I. The PCR amplifies a 324 bp product. After digestion with Hpy188I, Col remains uncut but Ler or Cvi alleles are digested to 209 and 115 bp. Consistent with the RNA-seq data, AT4G00750 expression is primarily from the maternally inherited allele except when Ler is the male parent. AT4G00750 is a MEG in both directions of the cross for Col-Cvi.</p><p><bold>DOI:</bold> <ext-link ext-link-type="doi" xlink:href="10.7554/eLife.03198.010">http://dx.doi.org/10.7554/eLife.03198.010</ext-link></p></caption><graphic xlink:href="elife03198fs002"/></fig><fig id="fig1s3" position="float" specific-use="child-fig"><object-id pub-id-type="doi">10.7554/eLife.03198.011</object-id><label>Figure 1—figure supplement 3.</label><caption><title>Consistency of imprinting among different sets of reciprocal crosses.</title><p>Allele-specific expression ratios of imprinted genes identified in one set of reciprocal crosses in the other two sets of reciprocal crosses. Pink dots, MEGs in both sets of crosses being compared; orange dots, MEGs not shared with the dataset being plotted; blue dots, PEGs in both sets of crosses being compared; green dots, PEGs not shared with the dataset being plotted. 
Most pink and orange dots are in the upper right quadrant and most blue and green in the lower left, indicating consistent parental bias. m, maternal; p, paternal.</p><p><bold>DOI:</bold> <ext-link ext-link-type="doi" xlink:href="10.7554/eLife.03198.011">http://dx.doi.org/10.7554/eLife.03198.011</ext-link></p></caption><graphic xlink:href="elife03198fs003"/></fig><fig id="fig1s4" position="float" specific-use="child-fig"><object-id pub-id-type="doi">10.7554/eLife.03198.012</object-id><label>Figure 1—figure supplement 4.</label><caption><title>Imprinted genes are expressed at multiple stages of development.</title><p>(<bold>A</bold>) Expression of 199 MEGs and 82 PEGs in leaves, shoot apex (Sh), flowers, roots (R), pollen (P), and seeds at various stages of development. Tissue series data was downloaded using the e-Northern expression tool from the Bio-Analytic Resource (<xref ref-type="bibr" rid="bib52">Toufighi et al., 2005</xref>). (<bold>B</bold>) Expression of MEGs and PEGs in whole seeds (WS), embryo proper (EP), suspensor (S), micropylar endosperm (MCE), peripheral endosperm (PEN), chalazal endosperm (CZE), general seed coat (SC) and chalazal seed coat (CSC). Data is from <xref ref-type="bibr" rid="bib5">Belmonte et al., 2013</xref>. Each tissue is organized by increasing developmental age from pre-globular to mature green. Data was clustered and visualized using GENE-E. Gene order is the same between <bold>A</bold> and <bold>B</bold>.</p><p><bold>DOI:</bold> <ext-link ext-link-type="doi" xlink:href="10.7554/eLife.03198.012">http://dx.doi.org/10.7554/eLife.03198.012</ext-link></p></caption><graphic xlink:href="elife03198fs004"/></fig></fig-group></p><p>We concluded that most genes that show strong evidence for imprinting in one cross have evidence for the same parental bias in other crosses (<xref ref-type="fig" rid="fig1s3">Figure 1—figure supplement 3</xref>). 
The intersection of the endosperm datasets revealed 28 MEGs and 6 PEGs in common among all three pairs of reciprocal crosses (<xref ref-type="fig" rid="fig1">Figure 1B</xref>). An additional 53 MEGs and 23 PEGs were identified in two of three sets of reciprocal crosses. Most MEGs and PEGs that were identified in only one set of reciprocal crosses lacked sufficient data to assess imprinting in the other crosses, due to an absence of SNPs or because of low read counts, rather than because they were clearly not parentally biased. For example, of the 73 Col-Cvi MEGs that were not among the Col-Ler MEGs, 62 lacked sufficient allele-specific data to be assessed for imprinting in Col-Ler. Of the remaining 11 genes, 8 showed strong evidence for maternal bias but did not meet all criteria for imprinting (usually failing to meet the requirement for 85% maternal reads in both directions of the cross).</p><p>We also examined the expression of imprinted genes at other stages of the plant life cycle (<xref ref-type="fig" rid="fig1s4">Figure 1—figure supplement 4</xref>). Analysis of published microarray expression data (<xref ref-type="bibr" rid="bib52">Toufighi et al., 2005</xref>) showed that in Arabidopsis most imprinted genes are expressed at other stages of plant development (<xref ref-type="fig" rid="fig1s4">Figure 1—figure supplement 4</xref>). Within seeds, imprinted genes are most commonly expressed in chalazal endosperm (<xref ref-type="fig" rid="fig1s4">Figure 1—figure supplement 4</xref>), consistent with previous findings from individual loci (<xref ref-type="bibr" rid="bib24">Ingouff et al., 2005</xref>). 
Several PEGs and MEGs are most highly expressed in mature pollen (<xref ref-type="fig" rid="fig1s4">Figure 1—figure supplement 4</xref>), probably reflecting expression in the pollen vegetative nucleus, which also undergoes active DNA demethylation (<xref ref-type="bibr" rid="bib45">Schoft et al., 2011</xref>; <xref ref-type="bibr" rid="bib6">Calarco et al., 2012</xref>; <xref ref-type="bibr" rid="bib23">Ibarra et al., 2012</xref>).</p><p>Consistent with our previous study (<xref ref-type="bibr" rid="bib13">Gehring et al., 2011</xref>), compared to all genes that could be assessed for imprinting, the PEGs identified in any of the three sets of reciprocal crosses (n = 103) were enriched for genes encoding proteins with a SRA-YDG domain (65.6-fold; p value=3.3E−6), genes involved in the biological processes regulation of RNA metabolic processes (4.1-fold; p value=4.7E−4), DNA-dependent regulation of transcription (4.1-fold, p value=8.5E−4), and DNA binding proteins (2.6-fold; p=2.5E−4). Overall, PEGs consisted of many genes known or predicted to be involved in transcription and epigenome regulation. Maize PEGs are also enriched for chromatin modifiers (<xref ref-type="bibr" rid="bib59">Waters et al., 2013</xref>). The Arabidopsis MEGs were not enriched for any particular class of genes except for a slight enrichment for transcription factor activity (2.1-fold; p=0.035), particularly of the MYB and homeodomain types.</p></sec><sec id="s2-2"><title>A small number of genes exhibit allele-specific imprinting</title><p>We identified 9 PEGs and 3 MEGs that exhibited allele-specific imprinting (<xref ref-type="supplementary-material" rid="SD6-data">Figure 2—source data 1</xref>). Our method to identify imprinted genes explicitly relies on agreement between reciprocal crosses (‘Materials and methods’). 
However, genes that exhibit allele-specific imprinting will only be parentally biased when a particular strain is the male or female parent; for example a gene could be a PEG in all crosses except when Cvi is the male parent (<xref ref-type="fig" rid="fig2">Figure 2</xref>). From the ratio of maternal/paternal mRNA-seq reads in each cross we identified those loci that were potentially biased in one direction of the cross but not the other (‘Materials and methods’). Because each allele was included twice as the maternal or paternal parent in our experimental design, we were able to identify loci that consistently showed maternal or paternal bias when a particular strain was the male or female parent (<xref ref-type="fig" rid="fig2">Figure 2</xref>). These lists were then compared to the union of all MEGs and PEGs (<xref ref-type="fig" rid="fig1">Figure 1</xref>) to identify genes that are imprinted in one set of reciprocal crosses, but only in one direction in the other two sets of reciprocal crosses (<xref ref-type="fig" rid="fig2">Figure 2</xref>). We performed CAPs analysis or sequenced RT-PCR amplicons for 7 of the 12 allele-specific imprinted genes and further confirmed that they exhibited allele-specific imprinting with few exceptions (<xref ref-type="fig" rid="fig1s2">Figure 1—figure supplement 2</xref>, <xref ref-type="supplementary-material" rid="SD5-data">Figure 1—source data 5</xref>, <xref ref-type="supplementary-material" rid="SD6-data">Figure 2—source data 1</xref>).<fig id="fig2" position="float"><object-id pub-id-type="doi">10.7554/eLife.03198.013</object-id><label>Figure 2.</label><caption><title>A subset of genes is only imprinted when a certain strain is the male or female parent.</title><p>Process for identifying allele-specific imprinted genes that are PEGs except when Cvi is the male parent. Genes that are paternally biased in Cvi x Col but not Col x Cvi (blue dots) were identified. 
These genes were overlapped with the Ler-Cvi maternal/paternal log ratios for the same genes (green dots) to generate a list of candidate loci that are not PEGs when Cvi is the male parent. Intersection with Col-Ler PEGs (pink dots) identifies strain-specific imprinted genes that are PEGs except when Cvi is the male parent, including AT2G32370 and AT3G14205. All candidate allele-specific imprinted genes are in <xref ref-type="supplementary-material" rid="SD6-data">Figure 2—source data 1</xref>. m, maternal; p, paternal.</p><p><bold>DOI:</bold> <ext-link ext-link-type="doi" xlink:href="10.7554/eLife.03198.013">http://dx.doi.org/10.7554/eLife.03198.013</ext-link></p><p><supplementary-material id="SD6-data"><object-id pub-id-type="doi">10.7554/eLife.03198.014</object-id><label>Figure 2—source data 1.</label><caption><title>Candidate allele-specific imprinted genes.</title><p><bold>DOI:</bold> <ext-link ext-link-type="doi" xlink:href="10.7554/eLife.03198.014">http://dx.doi.org/10.7554/eLife.03198.014</ext-link></p></caption><media mime-subtype="xlsx" mimetype="application" xlink:href="elife03198s006.xlsx"/></supplementary-material></p></caption><graphic xlink:href="elife03198f002"/></fig></p></sec><sec id="s2-3"><title>Embryo-endosperm DMRs are largely distinct from strain DMRs</title><p>To explore the potential relationship between DNA methylation and conserved and allele-specific imprinting, libraries for single base resolution DNA methylation profiling by bisulfite sequencing (BS-seq) were prepared from embryo and endosperm DNA (<xref ref-type="supplementary-material" rid="SD7-data">Figure 3—source data 1</xref>). All BS-seq libraries had a high cytosine to thymine conversion rate (at least 99.70%), indicating efficient bisulfite treatment (<xref ref-type="supplementary-material" rid="SD7-data">Figure 3—source data 1</xref>). Methylation profiles were generated from non-redundant uniquely mapping reads (‘Materials and methods’). 
Endosperm DNA was consistently less methylated compared to embryo DNA in all sequence contexts (<xref ref-type="supplementary-material" rid="SD7-data">Figure 3—source data 1</xref>), as shown previously (<xref ref-type="bibr" rid="bib11">Gehring et al., 2009</xref>; <xref ref-type="bibr" rid="bib19">Hsieh et al., 2009</xref>; <xref ref-type="bibr" rid="bib23">Ibarra et al., 2012</xref>). Embryo tissue from crosses between strains primarily displayed additive total DNA methylation (<xref ref-type="supplementary-material" rid="SD7-data">Figure 3—source data 1</xref>). In the endosperm, total methylation was more closely aligned with the methylation level of the female parent, consistent with the 2:1 ratio of maternal to paternal genomic DNA in the endosperm (<xref ref-type="supplementary-material" rid="SD7-data">Figure 3—source data 1</xref>). Interestingly, CHH methylation was not substantially reduced on a global scale in Cvi x Col endosperm (3.0%) compared to the embryo (3.1%) (<xref ref-type="supplementary-material" rid="SD7-data">Figure 3—source data 1</xref>).</p><p>Our analysis revealed an unusual methylation profile in Cvi. CG methylation in Cvi embryos (16.3%) was lower than in Col and Ler embryos (28.1% and 22.4%, respectively) (<xref ref-type="supplementary-material" rid="SD7-data">Figure 3—source data 1</xref>). We further investigated the nature of CG hypomethylation in Cvi to determine whether it was specific to certain classes of sequences or whether CG methylation was uniformly reduced across the genome. Of the three strains, Cvi had the lowest median CG methylation levels in both genes and TEs in embryos (<xref ref-type="fig" rid="fig3">Figure 3</xref>), but was largely unaffected in those sequences in either the CHG or CHH contexts (<xref ref-type="fig" rid="fig3">Figure 3C</xref>, <xref ref-type="fig" rid="fig3s1">Figure 3—figure supplement 1</xref>). 
Analysis of Cvi CG methylation data from leaves (<xref ref-type="bibr" rid="bib44">Schmitz et al., 2013</xref>) confirmed that hypomethylation was not specific to embryo and endosperm but is a general property of this strain (<xref ref-type="fig" rid="fig3s1">Figure 3—figure supplement 1</xref>). Loss of CG methylation was most pronounced in gene bodies (<xref ref-type="fig" rid="fig3">Figure 3B,C</xref>, <xref ref-type="fig" rid="fig3s1">Figure 3—figure supplement 1</xref>), where it was 50% lower in Cvi compared to either Ler or Col (<xref ref-type="supplementary-material" rid="SD8-data">Figure 3—source data 2</xref>). CG methylation in TEs was 14% lower in Cvi than in Col, but at the same level as in Ler (<xref ref-type="supplementary-material" rid="SD8-data">Figure 3—source data 2</xref>). Reduced gene body methylation in Cvi is unlikely to be a technical artifact of mapping biases: gene bodies have fewer SNPs and indels than TEs and thus mapping efficiency is better to genes than to TEs. All of our locus-specific bisulfite sequencing confirmed the whole-genome BS data. In Arabidopsis, gene body methylation is primarily in the CG context and is maintained after DNA replication by the maintenance methyltransferase MET1 (<xref ref-type="bibr" rid="bib36">Lister et al., 2008</xref>). Therefore, non-CG methylation pathways seem to operate normally in Cvi, but maintenance methylation appears to be compromised.<fig-group><fig id="fig3" position="float"><object-id pub-id-type="doi">10.7554/eLife.03198.015</object-id><label>Figure 3.</label><caption><title>Cvi is hypomethylated in CG contexts.</title><p>(<bold>A</bold>) Box and whiskers plots of CG DNA methylation levels of genes and TEs in Col, Ler, and Cvi embryos. Line: median; gray dots: outliers. (<bold>B</bold>) Average CG DNA methylation profiles of genes (blue colors) and TEs (orange colors) in Col, Ler, and Cvi embryos. 
Relative to Col, mean Cvi methylation level was decreased by 56% in genes (p=0.00, Tukey's HSD test) and by 14% in TEs (p=0.00, Tukey's HSD test). (<bold>C</bold>) DNA methylation in Col, Ler and Cvi embryos at a representative genomic region that includes genes and TEs. CG (red), CHG (blue) and CHH (green) methylation. Tick marks below the line indicate cytosines for which data was present but no methylation was detected. <xref ref-type="fig" rid="fig3s1">Figure 3—figure supplement 1</xref> contains additional analyses, <xref ref-type="supplementary-material" rid="SD7-data">Figure 3—source data 1</xref> has statistics on BS-libraries and <xref ref-type="supplementary-material" rid="SD8-data">Figure 3—source data 2</xref> shows the complete statistical analysis of methylation in Cvi compared to other strains.</p><p><bold>DOI:</bold> <ext-link ext-link-type="doi" xlink:href="10.7554/eLife.03198.015">http://dx.doi.org/10.7554/eLife.03198.015</ext-link></p><p><supplementary-material id="SD7-data"><object-id pub-id-type="doi">10.7554/eLife.03198.016</object-id><label>Figure 3—source data 1.</label><caption><title>BS-Seq libraries generated in this study.</title><p><bold>DOI:</bold> <ext-link ext-link-type="doi" xlink:href="10.7554/eLife.03198.016">http://dx.doi.org/10.7554/eLife.03198.016</ext-link></p></caption><media mime-subtype="xlsx" mimetype="application" xlink:href="elife03198s007.xlsx"/></supplementary-material></p><p><supplementary-material id="SD8-data"><object-id pub-id-type="doi">10.7554/eLife.03198.017</object-id><label>Figure 3—source data 2.</label><caption><title>Statistical analysis of strain differential methylation in genes and TEs.</title><p><bold>DOI:</bold> <ext-link ext-link-type="doi" xlink:href="10.7554/eLife.03198.017">http://dx.doi.org/10.7554/eLife.03198.017</ext-link></p></caption><media mime-subtype="xlsx" mimetype="application" xlink:href="elife03198s008.xlsx"/></supplementary-material></p></caption><graphic 
xlink:href="elife03198f003"/></fig><fig id="fig3s1" position="float" specific-use="child-fig"><object-id pub-id-type="doi">10.7554/eLife.03198.018</object-id><label>Figure 3—figure supplement 1.</label><caption><title>Cvi is hypomethylated in CG contexts regardless of tissue type but is not as hypomethylated in CHG and CHH contexts.</title><p>Box and whisker plots of DNA methylation levels of genes (left) and TEs (right). (<bold>A</bold>) CHG methylation in Col, Ler, and Cvi embryos. Relative to Col, mean Cvi methylation level was decreased by 22% in genes (p&lt;0.05, Tukey's HSD test) and by 2% in TEs (p&gt;0.05, Tukey's HSD test). (<bold>B</bold>) CHH methylation in Col, Ler, and Cvi embryos. Relative to Col, mean Cvi methylation level was decreased by 26% in genes (p&lt;0.05, Tukey's HSD test) and by 9% in TEs (p&lt;0.05, Tukey's HSD test). (<bold>C</bold>) Box and whisker plots of % CG DNA methylation of genes (left) and TEs (right) in Col and Cvi embryos in comparison to Col and Cvi leaves, using methylation data from <xref ref-type="bibr" rid="bib44">Schmitz et al. (2013)</xref>. Relative to Col, mean Cvi methylation level was decreased by 56% (embryo) and 54% (leaf) in genes and by 14% in TEs in both tissues (p&lt;0.05, Tukey's HSD test). Line: median; gray dots: outliers. Statistics are in <xref ref-type="supplementary-material" rid="SD8-data">Figure 3—source data 2</xref>.</p><p><bold>DOI:</bold> <ext-link ext-link-type="doi" xlink:href="10.7554/eLife.03198.018">http://dx.doi.org/10.7554/eLife.03198.018</ext-link></p></caption><graphic xlink:href="elife03198fs005"/></fig></fig-group></p><p>Genomic regions that are subject to active DNA demethylation during endosperm development in at least one strain but are variably methylated among other strains could be important contributors to an epigenetic mechanism for allele-specific imprinting. 
To identify embryo-endosperm DMRs and strain DMRs, we calculated weighted methylation levels (<xref ref-type="bibr" rid="bib47">Schultz et al., 2012</xref>) in overlapping 300 nucleotide windows across the entire genome, requiring each cytosine to have at least five reads coverage to be included in the analysis (‘Materials and methods’). We then ran pairwise comparisons between all windows with sufficient coverage for embryo libraries and their matching endosperm libraries (embryo-endosperm DMRs) and for Col-0, Ler and Cvi embryo libraries against one another (strain DMRs). The distribution of differences highlighted global differences in methylation (<xref ref-type="fig" rid="fig4s1">Figure 4—figure supplement 1</xref>). To identify DMRs the analysis was restricted to differences in weighted methylation fraction of at least 35% for CG or CHG methylation, with a minimum overlap of three informative Cs between windows (i.e., at least 3 Cs at the exact same positions had sufficient coverage in both embryo and endosperm), and 10% for CHH methylation, with a minimum overlap of 10 informative Cs. We retained DMRs that had a FDR corrected p-value&lt;0.01, reflecting whether the fraction of methylated/unmethylated counts was the same for both samples. From 365,000 to 500,000 informative 300 bp windows, 12,000–14,000 Col-Cvi and Col-Ler positive CG strain DMRs were identified, corresponding to approximately 8000 features. Most strain DMRs were in genes (<xref ref-type="fig" rid="fig4">Figure 4A</xref>). In Col-Ler comparisons we also identified 7453 features where Ler was more methylated than Col, but only 1749 features where Cvi was more methylated than Col because of the overall reduction of CG gene body methylation in Cvi (<xref ref-type="fig" rid="fig3">Figure 3</xref>, <xref ref-type="fig" rid="fig4">Figure 4</xref>, <xref ref-type="fig" rid="fig4s1">Figure 4—figure supplement 1</xref>). 
In contrast to CG DMRs, strain CHH DMRs mostly mapped to TEs and intergenic regions (<xref ref-type="fig" rid="fig4">Figure 4B</xref>), which are the sequences most likely to contain non-CG methylation. Similar results were obtained for Ler-Cvi comparisons (<xref ref-type="fig" rid="fig4s2">Figure 4—figure supplement 2</xref>). Independent validation by methylation-sensitive PCR or locus-specific BS-PCR of six loci confirmed our genome-wide analyses (<xref ref-type="fig" rid="fig4s3">Figure 4—figure supplement 3</xref>).<fig-group><fig id="fig4" position="float"><object-id pub-id-type="doi">10.7554/eLife.03198.023</object-id><label>Figure 4.</label><caption><title>Strain DMRs and embryo-endosperm DMRs are in distinct genomic regions.</title><p>(<bold>A</bold>) Number of features overlapping strain DMRs between Col and Ler or Col and Cvi embryos. (<bold>B</bold>) Number of features overlapping embryo-endosperm DMRs in Col x Cvi and Cvi x Col crosses. (<bold>C</bold> and <bold>D</bold>) 24 nt small RNA quantities (reads per million) corresponding to Col-Cvi strain (<bold>C</bold>) and Col x Cvi or Cvi x Col embryo-endosperm DMRs (<bold>D</bold>). (<bold>E</bold>) Overlap between Col-Cvi strain positive CG DMRs (more methylated in Col than Cvi) and the union of Col x Cvi and Cvi x Col embryo-endosperm CG DMRs (embryo more methylated than endosperm) corresponding to genes, TEs, and intergenic regions. 
<xref ref-type="fig" rid="fig4s1">Figure 4—figure supplement 1</xref> shows the distribution of all methylation differences; <xref ref-type="fig" rid="fig4s2">Figure 4—figure supplement 2</xref> shows DMR analysis in Ler-Cvi crosses and other datasets; <xref ref-type="fig" rid="fig4s3">Figure 4—figure supplement 3</xref> validates DMRs identified in this analysis; <xref ref-type="fig" rid="fig4s4">Figure 4—figure supplement 4</xref> examines small RNAs at TEs and <xref ref-type="fig" rid="fig4s5">Figure 4—figure supplement 5</xref> shows the overlap of embryo-endosperm CpG DMRs with previous studies. sRNA-seq library metrics are in <xref ref-type="supplementary-material" rid="SD9-data">Figure 4—source data 1</xref>.</p><p><bold>DOI:</bold> <ext-link ext-link-type="doi" xlink:href="10.7554/eLife.03198.023">http://dx.doi.org/10.7554/eLife.03198.023</ext-link></p><p><supplementary-material id="SD9-data"><object-id pub-id-type="doi">10.7554/eLife.03198.024</object-id><label>Figure 4—source data 1.</label><caption><title>Whole seed sRNA-seq libraries generated in this study.</title><p><bold>DOI:</bold> <ext-link ext-link-type="doi" xlink:href="10.7554/eLife.03198.024">http://dx.doi.org/10.7554/eLife.03198.024</ext-link></p></caption><media mime-subtype="xlsx" mimetype="application" xlink:href="elife03198s009.xlsx"/></supplementary-material></p></caption><graphic xlink:href="elife03198f004"/></fig><fig id="fig4s1" position="float" specific-use="child-fig"><object-id pub-id-type="doi">10.7554/eLife.03198.025</object-id><label>Figure 4—figure supplement 1.</label><caption><title>Distribution of endosperm-embryo and strain CG DNA methylation differences.</title><p>Histograms showing the distribution of all the 300 nt comparisons irrespective of the associated p-value. 
x axis: difference in weighted methylation; y axis: number of windows.</p><p><bold>DOI:</bold> <ext-link ext-link-type="doi" xlink:href="10.7554/eLife.03198.025">http://dx.doi.org/10.7554/eLife.03198.025</ext-link></p></caption><graphic xlink:href="elife03198fs006"/></fig><fig id="fig4s2" position="float" specific-use="child-fig"><object-id pub-id-type="doi">10.7554/eLife.03198.026</object-id><label>Figure 4—figure supplement 2.</label><caption><title>Ler and Cvi strain DMRs and embryo-endosperm DMRs in additional datasets.</title><p>(<bold>A</bold>) Number of features overlapping strain DMRs between Ler and Cvi embryos. (<bold>B</bold>) Number of features overlapping embryo-endosperm DMRs in Cvi x Ler and Ler x Cvi crosses. (<bold>C</bold>) Number of features overlapping embryo-endosperm DMRs in Ler x Col and Col x Ler crosses (analysis of dataset from <xref ref-type="bibr" rid="bib23">Ibarra et al., 2012</xref>).</p><p><bold>DOI:</bold> <ext-link ext-link-type="doi" xlink:href="10.7554/eLife.03198.026">http://dx.doi.org/10.7554/eLife.03198.026</ext-link></p></caption><graphic xlink:href="elife03198fs007"/></fig><fig id="fig4s3" position="float" specific-use="child-fig"><object-id pub-id-type="doi">10.7554/eLife.03198.027</object-id><label>Figure 4—figure supplement 3.</label><caption><title>Validation of BS-seq results with locus-specific BS-PCR or McrBC-PCR.</title><p>(<bold>A</bold>) AT4G21430. (<bold>B</bold>) AT5G17320. (<bold>C</bold>) AT1G65330. Top: CG, CHG and CHH methylation profiles of Col, Ler, and Cvi embryos and strain DMRs selected for validation. Bottom: methylation of individual sequenced clones from locus-specific BS-PCR. Filled circles indicate methylation, whereas unmethylated positions remain unfilled. 
(<bold>D</bold>) McrBC digestion of leaf genomic DNA followed by PCR of AT2G34880 and AT1G48910.</p><p><bold>DOI:</bold> <ext-link ext-link-type="doi" xlink:href="10.7554/eLife.03198.027">http://dx.doi.org/10.7554/eLife.03198.027</ext-link></p></caption><graphic xlink:href="elife03198fs008"/></fig><fig id="fig4s4" position="float" specific-use="child-fig"><object-id pub-id-type="doi">10.7554/eLife.03198.028</object-id><label>Figure 4—figure supplement 4.</label><caption><title>Distribution of TE superfamilies and small RNAs within embryo-endosperm DMRs.</title><p>(<bold>A</bold>) TE superfamilies overlapped by CG or CHH DMRs (embryo &gt; endosperm methylation in Cvi x Cvi) in comparison to the whole genome TE representation. TE superfamilies are as defined by TAIR10. (<bold>B</bold>) Box plots depicting the number of 21–24 nt small RNAs (reads per million) overlapping: all TEs of the designated class (black), CG DMRs (red) or CHH DMRs (green). p-values were calculated using the Wilcoxon-Mann-Whitney test, followed by a Bonferroni correction. *p&lt;0.05; **p&lt;0.01; ***p&lt;0.001; ****p&lt;0.0001.</p><p><bold>DOI:</bold> <ext-link ext-link-type="doi" xlink:href="10.7554/eLife.03198.028">http://dx.doi.org/10.7554/eLife.03198.028</ext-link></p></caption><graphic xlink:href="elife03198fs009"/></fig><fig id="fig4s5" position="float" specific-use="child-fig"><object-id pub-id-type="doi">10.7554/eLife.03198.029</object-id><label>Figure 4—figure supplement 5.</label><caption><title>Overlap of embryo-endosperm CG DMRs with previous studies.</title><p>This study: DMRs identified from all matched comparisons, <xref ref-type="bibr" rid="bib11">Gehring et al., 2009</xref>: Col-glxCol-gl and LerxLer DMRs, <xref ref-type="bibr" rid="bib23">Ibarra et al., 2012</xref>: ColxLer and LerxCol DMRs combined. To identify the DMRs, this study and <xref ref-type="bibr" rid="bib23">Ibarra et al. 
(2012)</xref> datasets were analyzed with the same analysis pipeline described in ‘Materials and methods’. Minimum overlap required between DMRs = 100 nt.</p><p><bold>DOI:</bold> <ext-link ext-link-type="doi" xlink:href="10.7554/eLife.03198.029">http://dx.doi.org/10.7554/eLife.03198.029</ext-link></p></caption><graphic xlink:href="elife03198fs010"/></fig></fig-group></p><p>We identified fewer embryo-endosperm DMRs than strain DMRs, although lower BS-seq coverage in the endosperm was likely a major contributing factor (<xref ref-type="fig" rid="fig4">Figure 4B</xref>, <xref ref-type="supplementary-material" rid="SD7-data">Figure 3—source data 1</xref>). From 23,000 informative windows in the Col x Cvi embryo-endosperm comparison we identified 2305 positive CG DMRs, corresponding to 1100 features where the embryo was more methylated than the endosperm (<xref ref-type="fig" rid="fig4">Figure 4B</xref>). In contrast to strain DMRs and consistent with previous findings (<xref ref-type="bibr" rid="bib11">Gehring et al., 2009</xref>; <xref ref-type="bibr" rid="bib23">Ibarra et al., 2012</xref>), most regions hypomethylated in the endosperm in both the CG and CHH contexts correspond to intergenic regions and annotated transposable element fragments. Helitron and Mu elements were most commonly represented among demethylated TEs overlapped by a DMR, reflecting their abundance in the genome (<xref ref-type="fig" rid="fig4s4">Figure 4—figure supplement 4</xref>; <xref ref-type="bibr" rid="bib11">Gehring et al., 2009</xref>). It is important to note that although Cvi has a global methylation profile distinct from Col and Ler (<xref ref-type="fig" rid="fig3">Figure 3</xref>, <xref ref-type="supplementary-material" rid="SD7-data">Figure 3—source data 1</xref>), endosperm demethylation dynamics appear to be the same. 
This reflects the fact that regions targeted for active DNA demethylation are depleted of genes, which is where most strain-specific methylation differences in Cvi reside.</p><p>Using our analysis pipeline we also identified embryo-endosperm DMRs from published BS-seq data from Col x Ler and Ler x Col embryo and endosperm isolated at a slightly later developmental stage (<xref ref-type="bibr" rid="bib23">Ibarra et al., 2012</xref>). These datasets have higher endosperm coverage and slightly lower embryo coverage than our datasets. 40% of DMRs were in common when our union set of DMRs (identified in any matching embryo-endosperm comparison among our datasets; n = 21,973) was compared to the Ibarra embryo-endosperm DMRs (<xref ref-type="fig" rid="fig4s5">Figure 4—figure supplement 5</xref>). 61% of the embryo-endosperm DMRs we previously identified in Col-<italic>gl</italic> and Ler seeds by meDIP-seq (<xref ref-type="bibr" rid="bib11">Gehring et al., 2009</xref>) were identified in our current study (<xref ref-type="fig" rid="fig4s5">Figure 4—figure supplement 5</xref>), indicating a high degree of overlap between this study and others.</p></sec><sec id="s2-4"><title>Embryo-endosperm DMRs are enriched for whole seed small RNAs</title><p>Because methylation of TEs and other repetitive sequences is often associated with small RNAs and because small RNAs are abundant in seeds (<xref ref-type="bibr" rid="bib39">Mosher et al., 2009</xref>), we sequenced small RNAs from whole seeds at 6 DAP, obtaining 20–30 million high-quality reads for biological replicates of each sample (<xref ref-type="supplementary-material" rid="SD9-data">Figure 4—source data 1</xref>). 
Data from whole seeds cannot distinguish among small RNAs from the seed coat, embryo, or endosperm, but at 6 DAP RdDM pathway genes are expressed in both embryo and endosperm (<xref ref-type="bibr" rid="bib26">Jullien et al., 2012</xref>; <xref ref-type="bibr" rid="bib5">Belmonte et al., 2013</xref>), suggesting that both tissues have the ability to produce small RNAs. Strain specific CG DMRs have very low levels of small RNAs, consistent with these DMRs residing mainly in genes, which are not targeted by the RdDM pathway (<xref ref-type="fig" rid="fig4">Figure 4C</xref>). In contrast, CG DMRs where the embryo is more methylated than the endosperm are enriched for small RNAs compared to strain DMRs (Wilcoxon-Mann-Whitney test, p&lt;0.0001) or compared to a set of random genomic loci (<xref ref-type="fig" rid="fig4">Figure 4D</xref>). TEs overlapping embryo-endosperm CG DMRs have on average higher levels of small RNAs in whole seeds than do all TEs on average from that family (<xref ref-type="fig" rid="fig4s4">Figure 4—figure supplement 4</xref>). Both strain and embryo-endosperm CHH DMRs are associated with small RNAs (<xref ref-type="fig" rid="fig4">Figure 4C,D</xref>).</p></sec><sec id="s2-5"><title>Correspondence between imprinted genes, differential methylation, and small RNAs</title><p>We examined the overlap of the union set of imprinted genes (including within the gene and 2 kb from the 5′ and 3′ ends) and the CG and/or CHH embryo-endosperm DMRs. Over 40% of the MEGs (121/285) overlapped a CG DMR within these regions, but this was not a significant enrichment compared to a random set of the same number of genes (Fisher's exact test p-value=0.3477), nor was the overlap (176/285) when Ibarra et al. CG DMRs were also included in the analysis. In contrast, PEGs were significantly enriched for CG DMRs (64/103; p=0.0174) (<xref ref-type="fig" rid="fig5">Figure 5</xref>). 
Furthermore, of the 29 PEGs that are in common among at least two of three sets of reciprocal crosses (<xref ref-type="fig" rid="fig1">Figure 1B</xref>), 22 are associated with a proximal TE, primarily within 1 kb 5′ of the transcription start site (<xref ref-type="fig" rid="fig5">Figure 5</xref>). Fewer MEGs exhibit a correlation with presence of a TE (40/85), consistent with the lower correlation between DNA demethylation and imprinted expression for MEGs (<xref ref-type="fig" rid="fig5">Figure 5</xref>).<fig-group><fig id="fig5" position="float"><object-id pub-id-type="doi">10.7554/eLife.03198.030</object-id><label>Figure 5.</label><caption><title>Correspondence between DNA methylation, TEs, and sRNAs for imprinted genes.</title><p>(<bold>A</bold>) Average CG methylation in embryo and endosperm for the union set of PEGs, MEGs and all genes. (<bold>B</bold>) Percentage of genes with TE at indicated position. (<bold>C</bold>) Distribution of TEs and 24 nt small RNAs around endosperm imprinted MEGs (n = 85) and PEGs (n = 29) identified in at least two of three sets of reciprocal crosses. TE heatmap indicates the presence or absence of TEs according to TAIR10 annotation. 24 nt small RNA data is from ColxCvi whole seeds. Other libraries showed the same overall small RNA profile. Values were calculated in 200 nt windows extending 2 kb upstream and downstream from the 5′ and 3′ ends of the gene and 1 kb into the gene body. White indicates the absence of data. <xref ref-type="fig" rid="fig5s1">Figure 5—figure supplement 1</xref> shows H3K27me3 profiles around imprinted genes in vegetative tissues. 
<xref ref-type="fig" rid="fig5s2">Figure 5—figure supplement 2</xref> and <xref ref-type="fig" rid="fig5s3">Figure 5—figure supplement 3</xref> further explore the distribution and allelic contribution of small RNAs associated with imprinted genes.</p><p><bold>DOI:</bold> <ext-link ext-link-type="doi" xlink:href="10.7554/eLife.03198.030">http://dx.doi.org/10.7554/eLife.03198.030</ext-link></p></caption><graphic xlink:href="elife03198f005"/></fig><fig id="fig5s1" position="float" specific-use="child-fig"><object-id pub-id-type="doi">10.7554/eLife.03198.031</object-id><label>Figure 5—figure supplement 1.</label><caption><title>Histone H3 lysine 27 trimethylation (H3K27me3) profiles of PEGs and MEGs in vegetative tissues.</title><p>H3K27me3 leaf data from <xref ref-type="bibr" rid="bib33">Lafos et al. (2011)</xref>.</p><p><bold>DOI:</bold> <ext-link ext-link-type="doi" xlink:href="10.7554/eLife.03198.031">http://dx.doi.org/10.7554/eLife.03198.031</ext-link></p></caption><graphic xlink:href="elife03198fs011"/></fig><fig id="fig5s2" position="float" specific-use="child-fig"><object-id pub-id-type="doi">10.7554/eLife.03198.032</object-id><label>Figure 5—figure supplement 2.</label><caption><title>Small RNA levels around imprinted genes.</title><p>Box plots depicting 24 nt sRNAs in reads per million reads (RPM) within 1 kb windows associated with MEGs, PEGs, or all genes that could be evaluated for imprinted expression within that cross. Asterisks indicate significance when compared to all genes analyzed. p-values were calculated using the Wilcoxon-Mann-Whitney test, followed by a Bonferroni correction. 
*p&lt;0.05; **p&lt;0.01; ***p&lt;0.001.</p><p><bold>DOI:</bold> <ext-link ext-link-type="doi" xlink:href="10.7554/eLife.03198.032">http://dx.doi.org/10.7554/eLife.03198.032</ext-link></p></caption><graphic xlink:href="elife03198fs012"/></fig><fig id="fig5s3" position="float" specific-use="child-fig"><object-id pub-id-type="doi">10.7554/eLife.03198.033</object-id><label>Figure 5—figure supplement 3.</label><caption><title>Fraction of maternal small RNAs near the 5′ end of imprinted genes.</title><p>Boxplots illustrating the fraction of classified 24 nt sRNA reads identified as derived from the maternally inherited genome for the set of all genes that were analyzed for imprinting, the union of all identified MEGs, and the union of all identified PEGs (<xref ref-type="fig" rid="fig1">Figure 1B</xref>). Windows had to exceed a threshold of five classified reads (i.e., reads that could be assigned to the maternal or paternal genome based on SNPs) to be included in the analysis. p-values were calculated using the Wilcoxon-Mann-Whitney test. *p&lt;0.05; **p&lt;0.01; ***p&lt;0.001.</p><p><bold>DOI:</bold> <ext-link ext-link-type="doi" xlink:href="10.7554/eLife.03198.033">http://dx.doi.org/10.7554/eLife.03198.033</ext-link></p></caption><graphic xlink:href="elife03198fs013"/></fig></fig-group></p><p>We also examined the distribution of total and allele-specific small RNAs around MEGs and PEGs. The highest average levels of small RNAs are found at the 5′ end of the gene (<xref ref-type="fig" rid="fig5s2">Figure 5—figure supplement 2</xref>). Despite the lack of DMR enrichment, MEGs are enriched for small RNAs within the first kilobase of the gene in all crosses examined and in the first kb 5′ of the gene in a subset of the samples (<xref ref-type="fig" rid="fig5s2">Figure 5—figure supplement 2</xref>). 
Small RNAs associated with PEGs are enriched in the first kb 5′ of the gene—where most PEG-associated TEs are located (<xref ref-type="fig" rid="fig5">Figure 5</xref>)—and in the gene body, although levels 5′ of the gene are much higher (<xref ref-type="fig" rid="fig5s2">Figure 5—figure supplement 2</xref>).</p><p>We examined whether MEGs or PEGs differed in the maternal/paternal fraction of associated small RNAs. Previous data suggested that small RNAs corresponding to TEs associated with MEGs accumulate in sperm cells (<xref ref-type="bibr" rid="bib6">Calarco et al., 2012</xref>); in these instances the silent paternal allele would already be targeted for RdDM in sperm. Paternal small RNAs, which in whole seeds must be derived from the endosperm or embryo genomes, constituted 6–24% of RNAs that could be assigned to a specific allele, depending on the cross (<xref ref-type="supplementary-material" rid="SD9-data">Figure 4—source data 1</xref>). We calculated the fraction of maternal small RNA reads for the region 1 kb 5′ and 3′ of the transcription start site of imprinted genes, retaining only those regions with at least five allele-specific reads in our analysis. MEGs were enriched for small RNAs derived from the paternally-inherited genome compared to all genes that could be evaluated for imprinting (<xref ref-type="fig" rid="fig5s3">Figure 5—figure supplement 3</xref>). This suggests that silencing of the paternal allele of MEGs is associated with <italic>cis</italic> acting small RNAs produced from those alleles in the endosperm. Small RNA data from specific compartments of the seed will be necessary to conclusively address this question.</p></sec><sec id="s2-6"><title>Allele-specific imprinted genes are associated with variable DMRs</title><p>We identified regions of the genome that are subject to DNA demethylation in endosperm in at least one background but that are variably methylated among strains. 
Overlap between the strain DMRs and embryo-endosperm DMRs ranged from 12% for TEs to 31% for genes (<xref ref-type="fig" rid="fig4">Figure 4E</xref>). This suggests that there are sufficient epigenetic polymorphisms at embryo-endosperm DMRs to facilitate the formation of allele-specific imprinting. Differences in imprinting among alleles tied to differences in DNA methylation could be due to genetic or epigenetic differences (<xref ref-type="fig" rid="fig6s1 fig6s2 fig6s3">Figure 6—figure supplements 1, 2, and 3</xref>). Of the 12 allele-specific imprinted genes we identified (<xref ref-type="fig" rid="fig2">Figure 2</xref>, <xref ref-type="supplementary-material" rid="SD6-data">Figure 2—source data 1</xref>), 10 were associated with coincident CG or CHH embryo-endosperm DMRs and strain DMRs, 6 of which occurred at TEs (<xref ref-type="supplementary-material" rid="SD6-data">Figure 2—source data 1</xref>, <xref ref-type="fig" rid="fig6">Figure 6</xref>, <xref ref-type="fig" rid="fig6s1">Figure 6—figure supplement 1</xref>, <xref ref-type="fig" rid="fig6s2">Figure 6—figure supplement 2</xref>). For all 6 genes we confirmed by sequencing that the TE annotated in Col was present in the same genomic location in Ler and Cvi with no major sequence changes except for a few SNPs. These 6 genes were also included among imprinting validation assays (<xref ref-type="supplementary-material" rid="SD5-data">Figure 1—source data 5</xref>, <xref ref-type="supplementary-material" rid="SD6-data">Figure 2—source data 1</xref>). We more closely investigated three allele-specific imprinted genes with strong differences in the ratio of maternal to paternal transcripts in imprinted and non-imprinted crosses: AT2G32370, AT2G34890, and AT3G14205 (<xref ref-type="fig" rid="fig2">Figure 2</xref>, <xref ref-type="fig" rid="fig6">Figure 6</xref>, <xref ref-type="fig" rid="fig6s2">Figure 6—figure supplement 2</xref>). 
AT2G32370, <italic>HDG3</italic>, was originally identified as a PEG because of its association with a Col and Ler embryo-endosperm DMR and because it was expressed specifically in the endosperm (<xref ref-type="bibr" rid="bib11">Gehring et al., 2009</xref>). Our new data showed that <italic>HDG3</italic> is not a PEG when Cvi is the male parent (<xref ref-type="fig" rid="fig2">Figure 2</xref>, <xref ref-type="fig" rid="fig6">Figure 6</xref>). The embryo-endosperm DMR associated with <italic>HDG3</italic> is located in a Helitron fragment (ATREP10D) 5′ of the gene, and the methylated paternal allele is predominantly expressed. This region is not methylated in Cvi (<xref ref-type="fig" rid="fig6">Figure 6B</xref>, <xref ref-type="fig" rid="fig6s1">Figure 6—figure supplement 1</xref>). In crosses between Cvi females and Col or Ler males, maternal and paternal alleles are differentially methylated and the gene is imprinted (the naturally hypomethylated Cvi maternal allele has the same methylation profile as an actively demethylated maternal allele). But in reciprocal crosses between Col or Ler females and Cvi males, both maternal and paternal alleles are hypomethylated and the gene is biallelically expressed in the expected 2:1 maternal:paternal ratio (<xref ref-type="fig" rid="fig2">Figure 2</xref>, <xref ref-type="fig" rid="fig6">Figure 6</xref>). This suggests that differential methylation of maternal and paternal alleles, rather than simply demethylation of the maternal allele, is required for imprinted expression. A similar logic applies to AT3G14205; the Cvi allele is hypomethylated at a 5′ RC/Helitron fragment (ATREP1) compared to Col and Ler and the gene is not a PEG when it is transmitted through the Cvi male (<xref ref-type="fig" rid="fig2">Figure 2</xref>, <xref ref-type="supplementary-material" rid="SD6-data">Figure 2—source data 1</xref>, <xref ref-type="fig" rid="fig6s2">Figure 6—figure supplement 2</xref>). 
AT2G34890 was a MEG except when Ler is the male parent. The Ler AT2G34890 allele is hypomethylated at a 5′ MuDR element in comparison to Cvi and Col, suggesting that loss of methylation of the paternal allele could lead to its transcription (<xref ref-type="fig" rid="fig6s2">Figure 6—figure supplement 2</xref>). However, consistent with a more ambiguous relationship between DNA demethylation and MEGs (<xref ref-type="fig" rid="fig5">Figure 5</xref>), closer inspection of AT2G34890 shows that at a region 5′ of the TE <italic>both</italic> the Ler and Cvi alleles are hypomethylated compared to Col, suggesting that a clear methylation distinction between imprinted (Col and Cvi) and non-imprinted (Ler) paternal alleles does not exist (<xref ref-type="fig" rid="fig6s2">Figure 6—figure supplement 2</xref>).<fig-group><fig id="fig6" position="float"><object-id pub-id-type="doi">10.7554/eLife.03198.019</object-id><label>Figure 6.</label><caption><title>Expression and methylation analysis of <italic>HDG3</italic>, an allele-specific imprinted gene.</title><p>(<bold>A</bold>) <italic>HDG3</italic> is a PEG except when Cvi is the paternal parent. Blue bars, % paternal allele expression; red bars, % maternal allele expression from combined mRNA-seq data; vertical line, expected percent paternal allele expression for a non-imprinted gene. (<bold>B</bold>) Methylation of <italic>HDG3</italic> 5′ flanking region in Col embryo, Ler embryo and endosperm, and Cvi embryo (additional analysis in <xref ref-type="fig" rid="fig6s1">Figure 6—figure supplement 1</xref>). Red track, CG; green track, CHH. (<bold>C</bold>) Methylation profile of maternal and paternal HDG3 alleles in Col x Cvi and Cvi x Col endosperm as determined by locus-specific bisulfite PCR. Red circles, CG; blue circles, CHG; green circle, CHH. Filled circles indicate methylation, whereas unmethylated positions are unfilled. 
(<bold>D</bold>) Methylation profile of HDG3 in Col, Ler, Cvi, Kz_9 and An_1 in leaves (<ext-link ext-link-type="uri" xlink:href="http://neomorph.salk.edu/1001_epigenomes.html">http://neomorph.salk.edu/1001_epigenomes.html</ext-link>). (<bold>E</bold>) <italic>HDG3</italic> is not imprinted in 6 DAP endosperm when another hypomethylated strain (Kz_9) is the pollen parent, but is a PEG in a cross with another methylated strain (An_1), as determined by sequencing RT-PCR products that span informative SNPs. Blue bars, % paternal allele expression; red bars, % maternal allele expression; vertical line, expected paternal allele expression for a non-imprinted gene. The number of RT-PCR clones sequenced is indicated. p value represents a binomial test of whether the observed maternal:total ratio is less than the expected 2:3 ratio. (<bold>F</bold>) Cartoon representation of results. Expression and methylation results for AT3G14205 and AT2G34890 are in <xref ref-type="fig" rid="fig6s2">Figure 6—figure supplement 2</xref>. Examples of genetic differences causing methylation differences are in <xref ref-type="fig" rid="fig6s3">Figure 6—figure supplement 3</xref>.</p><p><bold>DOI:</bold> <ext-link ext-link-type="doi" xlink:href="10.7554/eLife.03198.019">http://dx.doi.org/10.7554/eLife.03198.019</ext-link></p></caption><graphic xlink:href="elife03198f006"/></fig><fig id="fig6s1" position="float" specific-use="child-fig"><object-id pub-id-type="doi">10.7554/eLife.03198.020</object-id><label>Figure 6—figure supplement 1.</label><caption><title>Methylation analysis of <italic>HDG3</italic>.</title><p>(<bold>A</bold>) Allele-specific CG methylation of maternal and paternal <italic>HDG3</italic> alleles in Cvi x Col and Col x Cvi embryos from whole genome BS-seq data. 
(<bold>B</bold>) Methylation profile of the <italic>HDG3</italic> DMR in different strains and tissues and of maternal and paternal <italic>HDG3</italic> alleles in Col x Cvi and Cvi x Col embryos as determined by locus-specific bisulfite PCR. Filled circles indicate methylation, whereas unmethylated positions remain unfilled.</p><p><bold>DOI:</bold> <ext-link ext-link-type="doi" xlink:href="10.7554/eLife.03198.020">http://dx.doi.org/10.7554/eLife.03198.020</ext-link></p></caption><graphic xlink:href="elife03198fs014"/></fig><fig id="fig6s2" position="float" specific-use="child-fig"><object-id pub-id-type="doi">10.7554/eLife.03198.021</object-id><label>Figure 6—figure supplement 2.</label><caption><title>Expression and methylation analysis of other variably imprinted genes.</title><p>(<bold>A</bold>) AT3G14205 is a PEG except when Cvi is the paternal parent (mRNA-seq data). Blue bars, % paternal allele expression; red bars, % maternal allele expression from combined mRNA-seq data; vertical line, expected % paternal expression for a non-imprinted gene. (<bold>B</bold>) Methylation of AT3G14205 5′ flanking region in Col embryo, Ler embryo and endosperm, and Cvi embryo. Red track, CG; green track, CHH. (<bold>C</bold>) Leaf methylation profile of AT3G14205 in Col, Ler, Kz_9, Cvi and Seattle_0 (<ext-link ext-link-type="uri" xlink:href="http://neomorph.salk.edu/1001_epigenomes.html">http://neomorph.salk.edu/1001_epigenomes.html</ext-link>). (<bold>D</bold>) AT3G14205 is not imprinted when another hypomethylated strain (Seattle_0) is the pollen parent, but is a PEG in a cross with another methylated strain (Kz_9), as determined by sequencing RT-PCR products that span informative SNPs. The number of RT-PCR clones sequenced is indicated. p value, binomial test of whether the observed maternal:total ratio is less than the expected 2:3 ratio. (<bold>E</bold>) AT2G34890 is a MEG except when Ler is the paternal parent (mRNA-seq data). 
Vertical line, expected maternal allele expression for a non-imprinted gene. (<bold>F</bold>) Methylation of AT2G34890 5′ flanking region in Col and Ler embryo and Cvi embryo and endosperm. (<bold>G</bold>) Leaf methylation profile of AT2G34890 in Col, Cvi, Ler and Es_0 (<ext-link ext-link-type="uri" xlink:href="http://neomorph.salk.edu/1001_epigenomes.html">http://neomorph.salk.edu/1001_epigenomes.html</ext-link>). (<bold>H</bold>) AT2G34890 is still imprinted when another hypomethylated strain (Es_0) is the pollen parent. p value: binomial test of whether the observed maternal:total ratio is greater than the expected 2:3 ratio.</p><p><bold>DOI:</bold> <ext-link ext-link-type="doi" xlink:href="10.7554/eLife.03198.021">http://dx.doi.org/10.7554/eLife.03198.021</ext-link></p></caption><graphic xlink:href="elife03198fs015"/></fig><fig id="fig6s3" position="float" specific-use="child-fig"><object-id pub-id-type="doi">10.7554/eLife.03198.022</object-id><label>Figure 6—figure supplement 3.</label><caption><title>Genetic difference between strains can underlie differential methylation.</title><p>Differences in methylation between strains can be due to genetic differences (e.g., absence of a sequence in one strain). To uncover possible genetic differences between Col and Cvi strains, we compared the set of Col-Cvi methylation difference positive windows to regions of the Cvi genome not covered by any reads in the 1001 Genomes resequencing project (<ext-link ext-link-type="uri" xlink:href="http://signal.salk.edu/atg1001/index.php">http://signal.salk.edu/atg1001/index.php</ext-link>). We validated DMRs at one MEG (AT5G17165) and one PEG (AT1G57820) that were polymorphic between the two strains using PCR and sequencing. (<bold>A</bold>) In Cvi, the TE at the 3′ end of AT5G17165 lacks 600 nt, corresponding to a methylated region in Col and Ler. Red track, CG; blue track, CHG; green track, CHH. 
(<bold>B</bold>) In Cvi, the 86 nt long TE at the 5′ end of AT1G57820 has 9 SNPs, and the upstream and downstream intergenic DNA sequences have insertions and deletions compared to Col.</p><p><bold>DOI:</bold> <ext-link ext-link-type="doi" xlink:href="10.7554/eLife.03198.022">http://dx.doi.org/10.7554/eLife.03198.022</ext-link></p></caption><graphic xlink:href="elife03198fs016"/></fig></fig-group></p><p>Allele-specific imprinted genes could represent epialleles whose expression phenotypes are observed in the endosperm. To assess how widespread allele-specific imprinting might be within the species, we determined the strain variability in methylation at regions we identified as being targeted for endosperm demethylation, using the methylation profiling data of leaves or floral buds from 140 strains (<xref ref-type="bibr" rid="bib44">Schmitz et al., 2013</xref>). This allowed us to more broadly estimate the potential for allele-specific imprinting outside of Col-Ler-Cvi strains. We divided regions corresponding to embryo-endosperm DMRs into five classes based on the range of methylation variability across all 140 strains: those with very low variability in methylation (less than 0.2 mean methylation difference across all strains), low variability (between 0.2 and 0.4 mean methylation difference across all strains), a strongly bimodal class (DMRs with a range greater than 0.4 but where most of the density of the distribution is in the outer 50% of the range) and two intermediate classes, weakly bimodal and not bimodal (<xref ref-type="fig" rid="fig7">Figure 7A,B</xref>). DMRs with a high or intermediate methylation range and less strong clustering in the outer 50% of the distribution were considered weakly bimodal. All remaining DMRs were classified as ‘not bimodal’—these regions tend to have a more uniform or unimodal distribution across a large range of scores (<xref ref-type="fig" rid="fig7">Figure 7A,B</xref>). 
The majority of DMRs (69%) were consistently methylated across all strains examined, falling into the very low range, low range, or not bimodal categories (<xref ref-type="fig" rid="fig7">Figure 7A,B</xref>). However, about 16% of DMRs were in the strongly bimodal category, where methylation is consistently high or low across strains except for one or more strong outliers (<xref ref-type="fig" rid="fig7">Figure 7A,B</xref>).<fig id="fig7" position="float"><object-id pub-id-type="doi">10.7554/eLife.03198.034</object-id><label>Figure 7.</label><caption><title>Natural epigenetic variability across strains at embryo-endosperm CG DMRs.</title><p>(<bold>A</bold>) Methylation variability across strains for regions targeted for endosperm demethylation. Classification of methylation range in the <xref ref-type="bibr" rid="bib44">Schmitz et al., 2013</xref> dataset (total of 140 strains) for all embryo-endosperm CG DMRs (n = 10,370) identified in this study. Only DMRs with at least 5 CG sites and a minimum of five reads coverage at each site in the Schmitz et al. dataset were classified. Additionally, only DMRs with at least 70 strains with sufficient data were included. (<bold>B</bold>) Examples of low range (gray), not bimodal (blue), weak bimodal (orange) and strongly bimodal (red) DMRs. (<bold>C</bold>) Association of the classified CG endosperm-embryo DMRs with PEGs. This study: DMRs identified from all pairwise matched endosperm-embryo comparisons from bisulfite datasets in <xref ref-type="supplementary-material" rid="SD7-data">Figure 3—source data 1</xref>; <xref ref-type="bibr" rid="bib23">Ibarra et al., 2012</xref>: ColxLer and LerxCol DMRs combined. Allele-specific PEGs are listed around the pie chart. 
n/a = not classifiable because gene was associated with DMR of more than one type.</p><p><bold>DOI:</bold> <ext-link ext-link-type="doi" xlink:href="10.7554/eLife.03198.034">http://dx.doi.org/10.7554/eLife.03198.034</ext-link></p></caption><graphic xlink:href="elife03198f007"/></fig></p><p>We overlapped our union set of imprinted genes with the classified DMRs. 21 MEGs and 9 PEGs were associated with a very low or low variability DMR within the gene or two kb 5′ or 3′. These include the MEG <italic>FWA</italic>, a locus with high levels of promoter methylation in all strains. We thus expect that in all strains in the endosperm <italic>FWA</italic> will have a demethylated maternal allele and a highly methylated paternal allele, and be consistently imprinted within the species. In contrast, 27 MEGs and 17 PEGs (11% of all imprinted genes) were associated with strongly bimodal DMRs, including four PEGs we identified from our Col, Ler, and Cvi mRNA-seq and BS-seq data as exhibiting allele-specific imprinting and being associated with a shared embryo-endosperm and strain DMR (<xref ref-type="fig" rid="fig7">Figure 7C</xref>, <xref ref-type="supplementary-material" rid="SD6-data">Figure 2—source data 1</xref>). This includes the DMRs associated with the allele-specific imprinted genes <italic>HDG3</italic> and AT3G14205 (<xref ref-type="fig" rid="fig7">Figure 7C</xref>).</p><p>We tested whether the methylation status of the embryo-endosperm DMRs associated with allele-specific imprinted genes was predictive for imprinting. If the difference in imprinting among <italic>HDG3</italic> alleles was due to the <italic>cis</italic> epigenetic difference at the 5′ TE, we predicted that crosses with other male parents carrying naturally hypomethylated alleles would exhibit lack of imprinting in F<sub>1</sub> endosperm. The strain Kz_9 has reduced methylation at the 5′ TE, although it is more methylated than in Cvi (<xref ref-type="fig" rid="fig6">Figure 6D</xref>). 
We performed reciprocal crosses between Col and Kz_9, extracted the RNA from endosperm 6 DAP and performed RT-PCR around a Col/Kz_9 SNP. Cloning and sequencing of the PCR products confirmed that <italic>HDG3</italic> was a PEG when Col was the male parent. In the reciprocal cross, when the hypomethylated <italic>HDG3</italic> allele was inherited from the Kz_9 male, <italic>HDG3</italic> was not imprinted (<xref ref-type="fig" rid="fig6">Figure 6E,F</xref>). <italic>HDG3</italic> remains imprinted in crosses between Col and another strain with methylation, An_1 (<xref ref-type="fig" rid="fig6">Figure 6D–F</xref>). This suggests that the epigenetic state of the <italic>HDG3</italic> allele is sufficient to predict imprinting in other naturally occurring strains and is thus likely causal for lack of imprinting in Cvi. Similarly, the DMR variability analysis (<xref ref-type="fig" rid="fig7">Figure 7</xref>) identified another strain, Seattle_0, where the TE 5′ of AT3G14205 was hypomethylated. Similar to crosses with Cvi males, in crosses where Seattle_0 was the male parent, AT3G14205 was no longer a PEG (<xref ref-type="fig" rid="fig6s2">Figure 6—figure supplement 2</xref>), but was still a PEG when Seattle_0 was the female and Col the male. As expected for AT2G34890, where the methylation state of the 5′ region was variable but did not seem to correlate with whether the allele was imprinted or not among Col, Ler, and Cvi, we found that AT2G34890 is a MEG in crosses with Col regardless of whether Es_0, a strain with a hypomethylated allele like Ler, served as the female or the male parent (<xref ref-type="fig" rid="fig6s2">Figure 6—figure supplement 2</xref>).</p><p>As we have shown for <italic>HDG3</italic> and AT3G14205, crosses involving a methylated allele and a naturally hypomethylated allele can result in allele-specific imprinting in one direction of the cross. 
Thus, in addition to the allele-specific imprinted genes we identified based on our mRNA-seq data, the additional MEGs and PEGs associated with embryo-endosperm DMRs that are strongly bimodal for methylation within the population might not be imprinted in strains where the allele is naturally hypomethylated. This suggests that 11% of imprinted genes have the potential to be variably imprinted when a particular strain is the male or female parent.</p></sec></sec><sec id="s3" sec-type="discussion"><title>Discussion</title><p>By examining crosses among three of the thousands of Arabidopsis strains, we were able to identify genes imprinted among all crosses and a small number of strong candidates for allele-specific imprinting caused by a <italic>cis</italic> methylation difference at a proximal transposable element. We found that most imprinted genes identified in reciprocal crosses between two strains are imprinted in crosses between other strains, or have some evidence for parental bias even if all imprinting criteria were not met. Arabidopsis allele-specific imprinted genes represent a small fraction of all possible imprinted genes, approximately 6% in our mRNA-seq datasets. These results are consistent with the extent of allele-specific imprinting in maize, where around 12% of imprinted genes fall into this category (<xref ref-type="bibr" rid="bib59">Waters et al., 2013</xref>). Allele-specific imprinting could represent genes that have recently come under the control of a TE and may or may not have an endosperm function, or genes that are imprinted specifically in one strain and not the other due to differences in control over endosperm growth and development. Under the conflict theory (<xref ref-type="bibr" rid="bib16">Haig, 2013</xref>), differences in seed size could reflect strains that have reached different optima for imprinting—strains producing small seeds could be considered more maternalized and those producing larger seeds more paternalized. 
Arabidopsis allele-specific imprinted genes encode multiple types of proteins, including a putative transcription factor (<italic>HDG3</italic>), a heat shock protein, a phosphoinositide phosphatase (AT3G14205), three chromatin proteins, and a gene required for normal levels of phytic acid accumulation in seeds (<xref ref-type="bibr" rid="bib29">Kim and Tai, 2010</xref>). Further experimentation exploring the function of these genes during seed development in each genetic background will be required to determine if differences in imprinting among strains contribute to seed phenotypes.</p><p>By considering population methylation variation at regions demethylated during reproductive development, we were able to estimate the possible extent of allele-specific imprinting within the species. Of the set of 388 imprinted genes we identified, 11% were associated with embryo-endosperm DMRs that are variably methylated in vegetative tissues in at least one of 140 strains (the strongly bimodal DMRs). Based on their methylation patterns, these genes have the potential to act as epialleles and exhibit allele-specific imprinting, as we demonstrated for <italic>HDG3</italic> and AT3G14205. However, we caution that imprinted genes associated with a strongly bimodal DMR do not always exhibit allele-specific imprinting when alleles with different methylation patterns are combined in F<sub>1</sub> endosperm. For example, we originally identified AT4G23110 as a candidate imprinted gene because it was associated with an embryo-endosperm DMR and only expressed in seeds (<xref ref-type="bibr" rid="bib11">Gehring et al., 2009</xref>), which was later confirmed by mRNA-seq (<xref ref-type="bibr" rid="bib13">Gehring et al., 2011</xref>). In this study we find that the embryo-endosperm DMR in the 5′ region of the gene is strongly bimodal within the population, with 118 strains exhibiting 60–100% CG methylation in a 500 bp 5′ region, and 10 strains with no methylation. 
However, when we performed reciprocal crosses between one of the hypomethylated strains and Col, a methylated strain, imprinting was maintained in both directions of the cross. Thus, we expect that 11% is the maximal fraction of genes that would exhibit allele-specific imprinting due to strain-to-strain differences in methylation, with the actual number being less than this.</p><p>The predictive power for whether a gene will exhibit allele-specific imprinting is greater for PEGs than for MEGs. PEGs were more often associated with embryo-endosperm DMRs than MEGs, and showed stronger correlation with the presence of a TE, and the presence of H3K27me3 in vegetative tissues (<xref ref-type="fig" rid="fig5s1">Figure 5—figure supplement 1</xref>; <xref ref-type="bibr" rid="bib33">Lafos et al., 2011</xref>). Our data and that of many others (<xref ref-type="bibr" rid="bib30">Köhler et al., 2012</xref>; <xref ref-type="bibr" rid="bib10">Gehring, 2013</xref>; <xref ref-type="bibr" rid="bib63">Zhang et al., 2014</xref>) suggest that the mechanism of imprinting for PEGs in Arabidopsis and maize is that the methylated paternal allele is expressed while the hypomethylated maternal allele is silenced by the PRC2 complex. Thus, the imprinting state of PEGs is much easier to predict based on known genetic and epigenetic characteristics. MEGs represent a more diverse class of genes, and their imprinting status is more difficult to predict based on DNA methylation or TE presence, although we do find that MEGs are enriched for small RNAs in seeds.</p><p>The RC/Helitron class of TEs, the most abundant type in euchromatin, is prevalent among DMRs. RC/Helitrons are also one of the most variably methylated TEs, with more than half being poorly or unmethylated in Col (<xref ref-type="bibr" rid="bib1">Ahmed et al., 2011</xref>). 
The susceptibility of Helitrons to loss of methylation coupled with their overabundance among embryo-endosperm DMRs further suggests that imprinting could be highly dynamic if considered on a population scale. McClintock described the ability of TEs to cycle in nature and between active and inactive epigenetic states (<xref ref-type="bibr" rid="bib38">McClintock, 1965</xref>; <xref ref-type="bibr" rid="bib49">Slotkin and Martienssen, 2007</xref>). A conceptually similar phenomenon could cause imprinting to vary between closely related genotypes.</p><p>Our study also yielded several unanticipated findings. We discovered that the Cvi strain is globally hypomethylated, and primarily loses CG methylation in gene bodies. Despite its ubiquity, the function of CG gene body methylation in plants and animals is still unclear, although it may be important for regulating alternative splicing or preventing spurious transcription (<xref ref-type="bibr" rid="bib65">Zilberman et al., 2007</xref>; <xref ref-type="bibr" rid="bib48">Shukla et al., 2011</xref>). Mutations that reduce CG gene body methylation (e.g., mutations in the maintenance DNA methyltransferase) affect CG methylation in all genomic contexts. Because Cvi has little gene body methylation but nearly normal levels of CG methylation in other genomic features, Cvi could serve as a model genotype to further explore the function of gene body methylation in relation to gene expression or chromatin structure. Cytologically, Cvi has reduced heterochromatin and dispersed 45S rDNA repeats and DNA methylation compared to Col and Ler (<xref ref-type="bibr" rid="bib50">Tessadori et al., 2007</xref>, <xref ref-type="bibr" rid="bib51">2009</xref>). Decondensed chromatin might facilitate increased production of small RNAs (<xref ref-type="bibr" rid="bib46">Schoft et al., 2009</xref>), and Cvi x Col endosperm showed little reduction in CHH methylation compared to the embryo. 
Consistent with this, small RNAs produced from the maternal allele represented a greater fraction of small RNAs when Cvi was the female parent in a cross (<xref ref-type="supplementary-material" rid="SD9-data">Figure 4—source data 1</xref>). We also observed, in contrast to a previous study (<xref ref-type="bibr" rid="bib39">Mosher et al., 2009</xref>), that small RNAs derived from the paternally inherited genome were readily detected in seed tissue from all crosses. As expected, maternal small RNAs were much more abundant than paternal small RNAs, but because we could not distinguish the three components of the seed (embryo, endosperm, and seed coat), it is unknown whether this was due to predominantly maternal expression in the endosperm, or reflective of the overall maternal bias expected in whole seeds. However, the fraction of paternal small RNAs (6–24%) was comparable to the fraction of paternal reads when mRNAs were sequenced from whole seeds (15–20%) (<xref ref-type="supplementary-material" rid="SD1-data">Figure 1—source data 1</xref>, <xref ref-type="supplementary-material" rid="SD9-data">Figure 4—source data 1</xref>), perhaps suggesting that small RNAs in seeds reflect the ratio of maternal:paternal genomes in each tissue. Our analysis of the previously published data from Col x Ler and Ler x Col siliques (<xref ref-type="bibr" rid="bib39">Mosher et al., 2009</xref>) also revealed the presence of paternally derived small RNAs, although at lower levels than in our whole seed datasets (<xref ref-type="supplementary-material" rid="SD9-data">Figure 4—source data 1</xref>). Recent analysis of small RNAs in rice inter-strain crosses detected maternally and paternally derived small RNAs in the endosperm and suggested rice might be different from <italic>A. thaliana</italic> in this regard (<xref ref-type="bibr" rid="bib42">Rodrigues et al., 2013</xref>). 
Our data instead suggest that rice and Arabidopsis are likely similar in terms of parental small RNA composition in the endosperm, although endosperm-specific Arabidopsis profiles will be necessary to conclusively evaluate this. Interestingly, at 6 DAP the largest subunit of <italic>Pol IV</italic>, <italic>NRPD1a</italic>, was paternally biased in all crosses. <italic>NRPD1a</italic> has a 5′ embryo-endosperm DMR associated with small RNAs, further suggesting that there may be a complex interplay and crosstalk between active DNA demethylation and the small RNA production pathway. Other genes that promote DNA methylation were also primarily paternally expressed in all crosses (e.g., the <italic>VIM</italic> family genes). A major unsolved question is how the maternal alleles of genes that are demethylated before fertilization remain hypomethylated several days after fertilization, in spite of the presence of small RNAs that normally target DNA methylation to these sequences. It is possible that changes to maternal endosperm chromatin structure could alter the efficacy of RNA-directed DNA methylation.</p><p>In conclusion, our study demonstrates that epiallelic variation and genomic imprinting mechanisms intersect to produce novel gene expression patterns in seeds. We propose that the phenotypic impact of epialleles is likely to be most pronounced in the endosperm because changes in DNA methylation are a programmed part of endosperm development. Epialleles naturally circulating in plant populations might significantly impact seed development and lead to the production of novel phenotypes in hybrids.</p></sec><sec id="s4" sec-type="materials|methods"><title>Materials and methods</title><sec id="s4-1"><title>Plant material</title><p>Plants were grown in a greenhouse with 16-hr days at ∼21°C. Flowers were emasculated 2 days before pollination. 
Seeds were dissected at 6 DAP, which corresponds to the torpedo stage of embryogenesis under our growth conditions (<xref ref-type="fig" rid="fig1s1">Figure 1—figure supplement 1</xref>).</p></sec><sec id="s4-2"><title>mRNA-seq library construction</title><p>RNA was isolated from endosperm, embryo, and whole seeds 6 days after pollination as described (<xref ref-type="bibr" rid="bib13">Gehring et al., 2011</xref>) using either the RNAqueous kit with Plant RNA Isolation Aid or the RNAqueous Micro Kit (Ambion, Life Technologies Corporation, Carlsbad, CA). At least 600 ng of DNAse I-treated RNA (Invitrogen, Life Technologies Corporation, Carlsbad, CA) was used to prepare mRNA-Seq libraries as described (<xref ref-type="bibr" rid="bib13">Gehring et al., 2011</xref>), except that Illumina TruSeq primers were used in the final amplification step. Amplification was for 12 cycles. Strand-specific RNA-seq libraries were generated from at least 100 ng of total RNA using the Integenex PolyA prep protocol (Wafergen Biosystems, Fremont, CA) with 15 cycles of amplification. See <xref ref-type="supplementary-material" rid="SD1-data">Figure 1—source data 1</xref> for details of library prep for specific samples.</p></sec><sec id="s4-3"><title>mRNA-seq data analysis</title><p>Endosperm mRNA-seq was performed in triplicate (18 samples). Because we previously found little evidence for imprinting in embryos at this stage of development (<xref ref-type="bibr" rid="bib13">Gehring et al., 2011</xref>), embryo mRNA-seq was performed on single samples (<xref ref-type="supplementary-material" rid="SD1-data">Figure 1—source data 1</xref>). Single-end sequencing of mRNA-Seq libraries was performed on an Illumina HiSeq machine. Read length was 40 bp or 80 bp (<xref ref-type="supplementary-material" rid="SD1-data">Figure 1—source data 1</xref>). Sequencing quality was assessed using fastqc, and raw reads were filtered for overrepresented adapter sequences using fastx_clipper. 
Low quality reads were removed with fastq_quality_filter using the options -q 20 and -p 80 (<ext-link ext-link-type="uri" xlink:href="http://hannonlab.cshl.edu/fastx_toolkit/">http://hannonlab.cshl.edu/fastx_toolkit/</ext-link>). Filtered reads were then aligned to the TAIR10 version of the Arabidopsis genome using Tophat v2.0.8 (<xref ref-type="bibr" rid="bib53">Trapnell et al., 2009</xref>). For 40 bp libraries the options --solexa1.3-quals --segment-length 18 --segment-mismatches 1 --max-segment-intron 11000 were used and for 80 bp libraries the options were --solexa1.3-quals --segment-length 30 --max-segment-intron 11000. Read counts for each gene and TE annotated in TAIR10 were quantified using htseq-count (<ext-link ext-link-type="uri" xlink:href="http://www-huber.embl.de/users/anders/HTSeq/doc/index.html">http://www-huber.embl.de/users/anders/HTSeq/doc/index.html</ext-link>) with options -m intersection-strict --stranded=no (for non-strand-specific libraries) or --stranded=yes (for strand-specific libraries). After sorting reads by genome position, single nucleotide polymorphisms (SNPs) (<xref ref-type="supplementary-material" rid="SD11-data">Supplementary file 2</xref>) were used to classify reads by strain using a custom script (<xref ref-type="supplementary-material" rid="SD12-data">Supplementary file 3</xref>). Reads were discarded if classification at two SNP positions within the same read conflicted. Htseq-count with the same options was run on each allele-specific set of mapped reads to generate allele counts for each gene and TE. Libraries ranged in depth from 50 to 160 million high-quality reads per sample, of which approximately 4–10 million reads could be assigned to a specific parental allele (informative reads). 
The highest proportion of informative reads was in crosses between Ler and Cvi, which have the most SNPs (<xref ref-type="supplementary-material" rid="SD1-data">Figure 1—source data 1</xref>).</p></sec><sec id="s4-4"><title>Identifying imprinted genes</title><p>We slightly modified our previously published analysis method (<xref ref-type="bibr" rid="bib13">Gehring et al., 2011</xref>) to identify imprinted genes. We used Fisher's exact test on each set of reciprocal crosses to test the null hypothesis that <italic>p</italic><sub><italic>1</italic></sub> = 2<italic>p</italic><sub><italic>2</italic></sub> = 0.67 (<italic>p</italic><sub><italic>1</italic></sub> = proportion of strain A reads in A female × B male and <italic>p</italic><sub><italic>2</italic></sub> = proportion of strain A reads in B female × A male) for endosperm or <italic>p</italic><sub><italic>1</italic></sub> = <italic>p</italic><sub><italic>2</italic></sub> = 0.5 for embryo. We considered genes with a Benjamini-corrected p value less than 0.01. We further filtered the list by removing genes with an imprinting factor (<xref ref-type="bibr" rid="bib13">Gehring et al., 2011</xref>) less than 2 and by removing genes whose expression was more than twofold higher in the seed coat than in the embryo or endosperm at the linear cotyledon stage, using data from <xref ref-type="bibr" rid="bib5">Belmonte et al. (2013)</xref>. To obtain values from the Belmonte et al. data, for endosperm we averaged the RMA values from the MCE, PEN, and CZE samples and for seed coat we averaged values from the CZSC and SC, all from the linear cotyledon stage. Averaged values were log transformed and genes with a seed coat-endosperm or seed coat-embryo difference <underline>&lt;</underline>1 were retained. 
Finally, for maternally biased genes we required that at least 85% of informative reads were maternal in both directions of the reciprocal cross and for paternally biased genes that at least 50% of informative reads in both directions of the reciprocal cross were paternal. For embryo libraries the final filtering step required at least 70% of reads to be maternal in both directions of the cross for maternally biased genes and less than 30% maternal for paternally biased genes. For each set of endosperm reciprocal crosses we sequenced mRNA from three biological replicates. For a gene to be called imprinted in a particular set of endosperm crosses (Col-Ler, Ler-Cvi, or Col-Cvi), it had to be called imprinted in 2 of 3 reciprocal cross pairs of biological replicates. We chose two of three instead of three of three because of variation in sequencing depth among libraries.</p></sec><sec id="s4-5"><title>Identifying allele-specific imprinting</title><p>We calculated the ratio of (maternal reads<sub>(strain A × strain B)</sub> + 1)/(paternal reads<sub>(strain A × strain B)</sub> + 1) and plotted it against the ratio of (maternal reads<sub>(strain B × strain A)</sub> + 1)/(paternal reads<sub>(strain B × strain A)</sub> + 1) for all loci with &gt;0 informative reads and seed coat-endosperm expression <underline>&lt;</underline>1 (<xref ref-type="bibr" rid="bib5">Belmonte et al., 2013</xref>). The Euclidean distance of every point to the lines x = 2 and y = 2 (no imprinting) was calculated using MATLAB. Loci within a distance of 1 of either line were retained for further analysis. For each locus we also calculated a parental bias factor, b(g) (b(g) = log<sub>2</sub> (maternal reads + 1) − log<sub>2</sub> (2 × paternal reads + 1)) and a normalized parental bias factor b<sub>norm</sub>(g) = (b(g) − mean(b(g)))/stdev(b(g)). For non-imprinted genes the value of b(g) = 0 and b<sub>norm</sub>(g) = 0. 
Loci within 1 of x = 2 or y = 2 that also fell above the 95<sup>th</sup> (maternal bias) or below the 5<sup>th</sup> (paternal bias) percentile distribution of b<sub>norm</sub>(g) values exhibited parental bias in only one set of reciprocal crosses. Loci that showed maternal or paternal preference when a particular strain was the parent were determined by intersecting lists from each cross (e.g., intersect Col-Ler maternal biases with Col-Cvi maternal biases to generate a list of loci that are maternally biased when Col is the female parent). To generate the final list of genes that exhibit potential allele-specific imprinting, the loci described above were intersected with the list of imprinted loci from the reciprocal crosses not involving the strain exhibiting the bias (e.g., intersection of loci maternally biased when Col is the male parent but not when it is the female parent with MEGs in Ler-Cvi reciprocal crosses).</p></sec><sec id="s4-6"><title>Validation of imprinted genes</title><p>Validation of the global RNA-seq analysis was performed by amplicon sequencing of RT-PCR products using MiSeq or Sanger sequencing, or by CAPS digestion. RNA was collected from dissected embryo and endosperm, reverse transcribed, treated with DNase I, and amplified with ExTaq for 30 cycles (PCR primers in <xref ref-type="supplementary-material" rid="SD10-data">Supplementary file 1</xref>). For MiSeq analysis, amplicons from the same cross and tissue type were pooled and libraries were constructed using the Illumina NexteraXT kit (Illumina, Inc., San Diego, CA). Paired-end sequencing of RT-PCR amplicons was performed on an Illumina MiSeq machine, generating 150 bp reads. Raw reads were aligned to a pseudometagenome (see small RNA methods) using Tophat v2.0.8 with the alignment options --read-mismatches 10 --edit-distance 12. 
After sorting reads by genome position, SNPs (<xref ref-type="supplementary-material" rid="SD11-data">Supplementary file 2</xref>) were used to classify reads by strain as for mRNA-seq. A goodness-of-fit binomial exact test was used to test the null hypothesis that the observed fraction of reads derived from the maternal allele for each assayed locus was described well by the binomial distribution parameterized by p = the observed fraction of maternal reads from the combined counts of the RNA-seq libraries analyzed in this study.</p></sec><sec id="s4-7"><title>GO analysis</title><p>GO analysis was performed using the DAVID bioinformatics resource version 6.7 (<xref ref-type="bibr" rid="bib21">Huang et al., 2009a</xref>, <xref ref-type="bibr" rid="bib22">2009b</xref>). Reported p-values are corrected using the Benjamini method.</p></sec><sec id="s4-8"><title>Whole genome bisulfite sequencing library construction</title><p>Seeds from 30 to 40 siliques per sample were dissected and DNA was extracted as described (<xref ref-type="bibr" rid="bib11">Gehring et al., 2009</xref>). At least 1 μg of RNase-treated DNA was used for library preparation (<xref ref-type="supplementary-material" rid="SD6-data">Figure 2—source data 1</xref>). Libraries were made using an Illumina TruSeq kit (Illumina, Inc.), with the following modifications. DNA was sheared using a Covaris instrument (settings: peak power 175 W, duty factor 10, cycles/burst 200, time 6 min, 6°C), purified using Agencourt AMPure beads (1.4× DNA:beads) (Beckman Coulter, Inc., Brea, CA), and resuspended in 50 μl of water followed by end repair and 3′ end adenylation. Illumina TruSeq DNA adapters, which contain 5-methylcytosines instead of cytosines, were ligated in a 50-μl overnight reaction at 16°C with 2.5 μl adapters, 5000 units T4 DNA Ligase (New England BioLabs, Ipswich, MA), and 1 × T4 Ligase buffer with ATP. 
DNA was cleaned twice using Agencourt AMPure beads before bisulfite treatment with the MethylCode Bisulfite Conversion Kit as per manual instructions (Invitrogen, Life Technologies Corporation). Bisulfite-treated DNA was eluted in 10 μl. Three μl were used as a template in each of two PCR reactions with 0.5 units Pfu Turbo Cx Hotstart DNA Polymerase (New England BioLabs), 1 μl 10 mM dNTPs, and 1 × Turbo Cx buffer. PCR conditions were: 95°C for 2 min, 12–15 cycles (95°C for 20 s, 60°C for 30 s, 72°C for 1 min), and 72°C for 7 min. Libraries were subjected to QC on a bioanalyzer before sequencing on an Illumina HiSeq2000 using a single read 80 base pair protocol except for one library which was sequenced using 2 × 100 paired end reads.</p></sec><sec id="s4-9"><title>Whole genome bisulfite sequencing data analysis</title><p>Adapters and low quality reads (less than 75% quality scores above 25) were discarded after running quality control of sequencing reads with fastqc (<ext-link ext-link-type="uri" xlink:href="http://hannonlab.cshl.edu/fastx_toolkit/">http://hannonlab.cshl.edu/fastx_toolkit/</ext-link>). Libraries prepared from Col and Cvi were aligned to the TAIR10 genome using Bismark (<xref ref-type="bibr" rid="bib32">Krueger and Andrews, 2011</xref>) with the following parameters: -n 1 -l 50, where -n is the maximum number of mismatches and -l is the length of seed (first number of nt that are mapped with less than n mismatches). For Cvi, reads that failed to map to TAIR10 were then mapped against the Cvi pseudogenome (TAIR10 genome with Cvi SNP substitutions). All mapped reads were combined. Libraries prepared from Ler were aligned to the Ler-0 genome (<xref ref-type="bibr" rid="bib9">Gan et al., 2011</xref>). After mapping, a 2-strain alignment was used to convert Ler-0 genome coordinates to TAIR10 coordinates, allowing subsequent pairwise comparisons between libraries. 
Redundant mapped reads were eliminated from each library starting from a sorted SAM file, keeping only one sequence per strand that mapped to the same position. To do this, reads were sorted by decreasing prevalence followed by increasing number of mismatches (not counting bisulfite conversions) to the genome. The most prevalent read with the total highest quality string was kept. In the case of a tie, the read with the fewest number of mismatches was retained. Bismark's methylation extractor script was used to calculate a methylation value for each cytosine.</p><p>For F<sub>1</sub> hybrid libraries, we first mapped the reads to one of the parental genomes (Col-Cvi reads to TAIR10 and Ler-Cvi reads to Ler). Reads that failed to map to either the TAIR10 or Ler genomes were mapped against the Cvi pseudogenome using the same alignment parameters (-n 1 -l 50). We discarded redundant reads and combined the remaining Cvi-mapped reads to the ones already mapped against Col-0 (TAIR10) or Ler. To assign reads to a particular strain and to retain as many unique reads as possible, we separated the reads by strand and ignored C&gt;T SNPs for forward reads and G&gt;A SNPs for reverse reads. Reads were classified as maternal, paternal, no evidence for either genome (for reads not overlapping any SNP), or both (conflicting data) based on their sequence at known SNP positions. After classification, redundant reads from each class were eliminated as described above, and methylation extractor was run for each class as well as for all reads combined. 
The mean bisulfite conversion rate for each library was calculated based on the methylation status of each cytosine from reads mapping to the chloroplast genome, which are expected to be unmethylated.</p></sec><sec id="s4-10"><title>Identifying differentially methylated regions (DMRs)</title><p>Bismark's methylation extractor output was summarized by chromosome position by converting the methylation string into unmethylated counts, methylated counts, and percent methylation. The genome was divided into 300 nt windows that overlapped by 100 nt. Using Bismark's methylation extractor output files as input, weighted methylation levels for each window were calculated as described (<xref ref-type="bibr" rid="bib47">Schultz et al., 2012</xref>), with the requirement of at least 5-read coverage at each site. Differential methylation was assayed by calculating the difference (sample 1 − sample 2 of weighted methylation fractions) and confidence (p-value from Fisher's exact test) for each window in all sequence contexts. p values were corrected with the Benjamini and Hochberg false discovery rate (FDR). We defined CG and CHG DMRs as windows with a weighted methylation difference of at least 35, with a minimum overlap of three informative Cs between windows and a corrected p value &lt; 0.01. CHH DMRs had a weighted methylation difference of at least 10, with a minimum 10 overlapping informative cytosines and a p value &lt; 0.01.</p><p>To compare methylation levels between strains, methylation fractions of sites in genes and TEs were scaled relative to the mean level of the Col strain in that context. 
Following analysis by ANOVA, the magnitudes of differences in the normalized methylation levels between strains were calculated using Tukey's HSD test, with alpha set at 0.05 (<xref ref-type="supplementary-material" rid="SD8-data">Figure 3—source data 2</xref>).</p><p>To visualize methylation profiles around imprinted genes, the methylation level of each assayed position (with at least five informative reads) was summarized into a set of bed files and used as input to calculate the average methylation in 200 nt windows spanning extended gene bodies (from 2 kb upstream of the transcription start to 2 kb downstream of the transcription end) of the conserved imprinted genes. We also compared Col, Ler, and Cvi embryo CG average methylation using 50 nt windows spanning extended bodies of genes and TEs. Using a set of genome features of a specific type (e.g., list of genes, TEs), we summarized the methylation level across that set of features. We calculated the weighted mean methylation (wmean) for a particular region (R) containing n sites (i) with the equation: wmean(R) = (Σ[i = 1 to n] me_i)/(Σ[i = 1 to n] tot_i), where me_i is the number of methylated reads and tot_i is the total number of reads at site i. The results of these analyses were displayed using R (<xref ref-type="fig" rid="fig5">Figure 5</xref>). Plots for <xref ref-type="fig" rid="fig3">Figure 3</xref> and <xref ref-type="fig" rid="fig3s1">Figure 3—figure supplement 1</xref> were also generated using R.</p></sec><sec id="s4-11"><title>Validation of BS-Seq results with locus-specific BS-PCR or McrBC-PCR</title><p>DNA from embryo, endosperm and leaves was extracted using a CTAB protocol. Bisulfite treatment was performed using the MethylCode Bisulfite Conversion Kit (Invitrogen, Life Technologies Corporation) following the manufacturer's protocols. PCRs were performed using the primer pairs listed in <xref ref-type="supplementary-material" rid="SD10-data">Supplementary file 1</xref>. PCR products were gel purified, cloned and sequenced. 
Sequences were aligned using SeqMan and methylation was measured using Kismeth (<xref ref-type="bibr" rid="bib15">Gruntman et al., 2008</xref>). For validation using McrBC, approximately 800 ng of genomic DNA were digested overnight at 37°C with 50 U of McrBC (New England Biolabs) in a 30 μl reaction. 5 μl were used as template in PCR along with an untreated DNA sample. Primer pairs are listed in <xref ref-type="supplementary-material" rid="SD10-data">Supplementary file 1</xref>.</p></sec><sec id="s4-12"><title>Assessing DMR variability among 140 strains</title><p>To determine how variably the identified embryo-endosperm DMRs were methylated across various wild-type strains, we downloaded BS-seq data from NCBI GEO accession GSE43857 (<xref ref-type="bibr" rid="bib44">Schmitz et al., 2013</xref>). For strains with both leaf and bud data, only the leaf data was used, resulting in data for 140 different Arabidopsis strains. Methylation data were extracted from the Schmitz et al. data for all of our embryo-endosperm DMRs; contiguous or overlapping DMRs were merged prior to the analysis. For each DMR we assigned a methylation score equal to the weighted mean methylation at each CpG site in the DMR (<xref ref-type="bibr" rid="bib47">Schultz et al., 2012</xref>) for each of the 140 strains. Only CpG sites with at least five reads of support and only strains with five or more CpG sites for a DMR were included in the analysis. DMRs were censored from the analysis if more than 70 of the 140 strains had missing scores. The remaining DMRs (n = 10,370) were classified into five categories that describe the distribution of methylation across the Schmitz et al. strains. DMRs with a low range of methylation scores, defined as a difference of less than 0.4 between the scores of the most and least methylated strains, were considered to have roughly consistent methylation patterns across all strains. 
This was further divided into a ‘very low range’ subcategory consisting of all DMRs with a range of methylation scores less than 0.2 across all strains. These DMRs have very consistent methylation scores across all strains, and tend to correspond to highly methylated transposable elements or regions near centromeres. DMRs with a score range greater than 0.4 were further subdivided according to whether the strain scores tended to be unimodal or uniformly distributed across the range of the data, or whether they tended to be bimodally distributed. This was determined by counting the number of strains whose methylation scores fell in the middle 50% of the data range, and comparing this to the number of strains whose methylation scores fell in the top or bottom 25% of the range. DMRs with a high range but with most of the density of the distribution in outer 50% of the range of the data were considered ‘strongly bimodal’ (range &gt;0.7 and fraction strains in upper or lower 25% of the range ≥0.8). These DMRs include cases where methylation is consistently high or low across strains except for one or two strong outliers. DMRs with high or intermediate range and less strong clustering in the outer 50% of the distribution were considered ‘weakly bimodal’ (range &gt;0.7 and fraction in outer 50% ≥0.5 or 0.7 ≥range ≥0.4 and fraction in outer 50% ≥0.8). All remaining DMRs were classified as ‘not bimodal’—these tend to have a more uniform or unimodal distribution across a large range of scores.</p></sec><sec id="s4-13"><title>Small RNA library construction</title><p>RNAs less than 200 bp were isolated from whole seeds 6 DAP using the miRVana RNA isolation kit (Ambion, Life Technologies Corporation). Libraries for Illumina sequencing were constructed following the method of <xref ref-type="bibr" rid="bib14">Grimson et al. (2008)</xref>, with only minor modifications. 
Instead of <sup>32</sup>P-labelled oligos, 18 nt and 30 nt unlabeled marker RNAs were used in conjunction with SYBR-Gold for size selection and monitoring of ligation reactions. Marker RNAs were kept in separate lanes on the polyacrylamide-urea gels instead of being directly mixed with the RNA samples, but were processed in an identical manner. We enabled multiplexing of libraries by using four different 3′ PCR primers (<xref ref-type="supplementary-material" rid="SD10-data">Supplementary file 1</xref>) during library amplification, each of which was 94 bases in length as opposed to the 44 nt 3′ PCR primer from the referenced protocol. As a result, the sequences obtained in the final gel purification step ranged in size from 135 to 155 nt in length.</p></sec><sec id="s4-14"><title>Small RNA analysis</title><p>Single-end sequencing of sRNA libraries was performed on an Illumina HiSeq machine (four libraries of 40 bases per lane). We trimmed low-quality read ends (with fastq_quality_trimmer –t 20 and –l 25) and removed adapters (fastx_clipper tool –a TCGTATGCCGTCTTCTGCTTG –i 18; <ext-link ext-link-type="uri" xlink:href="http://hannonlab.cshl.edu/fastx_toolkit/">http://hannonlab.cshl.edu/fastx_toolkit/</ext-link>). Reads were aligned using Bowtie 1.0.0 (<xref ref-type="bibr" rid="bib34">Langmead et al., 2009</xref>) using the parameters –v 2 and --best, such that up to two mismatches were allowed and any read mapping to multiple locations was randomly assigned to one of the locations that had the best match to the read. We used the resequenced Ler genome (<xref ref-type="bibr" rid="bib9">Gan et al., 2011</xref>), and TAIR10 for the Col genome. We constructed a Cvi pseudogenome in which Cvi SNPs and 1 bp indels (obtained from <ext-link ext-link-type="uri" xlink:href="http://signal.salk.edu/atg1001/download.php">http://signal.salk.edu/atg1001/download.php</ext-link>) were used to modify the TAIR10 genome at the appropriate positions. 
To facilitate unbiased mapping, sRNA reads from hybrids were aligned to a metagenome composed of the two parental genomes. The reads were then converted to TAIR10 coordinates, regardless of the parent strain of origin, and were classified using the same SNP classification approach described for the mRNA-Seq analysis. All reads that overlapped annotated tRNAs, snRNAs, rRNAs, or snoRNAs were removed. We normalized libraries by converting read values within windows into RPM (reads per million) values. The conversion from reads to RPM used the total number of reads aligning to the genome for each library following the subtraction of structural RNAs.</p></sec><sec id="s4-15"><title>Generating SNP lists</title><p>To generate a Col/Ler SNP list, we used the previously described Col/Ler SNP list (<xref ref-type="bibr" rid="bib13">Gehring et al., 2011</xref>) supplemented with novel SNPs having an unambiguous consensus base (A,C,T,G), PHRED ≥ 25, detection score = 1 from the resequenced Ler genome (<xref ref-type="bibr" rid="bib9">Gan et al., 2011</xref>) (<ext-link ext-link-type="uri" xlink:href="http://mus.well.ox.ac.uk/19genomes/variants.SDI/">http://mus.well.ox.ac.uk/19genomes/variants.SDI/</ext-link>). In total, this yielded a list of 384,612 SNPs. To generate an initial Col/Cvi SNP list, we downloaded the SALK Cvi_0 (accession CS28198) data from <ext-link ext-link-type="uri" xlink:href="http://signal.salk.edu/atg1001/download.php">http://signal.salk.edu/atg1001/download.php</ext-link>. From the quality_variant_filtered_Cvi_0.txt file, we removed SNPs with &lt;0.95 concordance (n = 66,272) as well as 1 bp deletions (n = 11,444). This yielded 579,310 remaining SNPs. 
We derived an initial Ler/Cvi SNP list using the following logic: (1) if the SNP was present in Col/Cvi list but not Col/Ler list, the Col/Cvi SNP was added to the Ler/Cvi list; (2) if the opposite scenario was true (present in Col/Ler but absent from Col/Cvi), the Col/Ler SNP was inverted (e.g., C&gt;T becomes T&gt;C) and added to the Ler/Cvi SNP list; (3) if the same SNP was found in both Col/Ler and Col/Cvi SNP lists, it was not added to the Ler/Cvi list since these SNPs arise from a difference between Col and both Ler and Cvi genomes. This yielded a list of 645,212 SNPs. In order to assess the rates of erroneous read classification using these SNP lists, we used them to classify reads of known origin from mRNA-seq and small RNA-seq libraries made from Col x Col, Ler x Ler, and Cvi x Cvi embryo and endosperm or whole seeds. SNPs that systematically misclassified reads were filtered out by using a one-tailed binomial hypothesis test with the null hypothesis that ‘good SNPs’ have an underlying acceptable error rate of ≤5% (H_0: Percent_misclassified ≤ 5%). SNPs with p&lt;0.05 were removed. 
This filtration method removed 5869 and 24,137 SNPs from the Col/Ler and Col/Cvi SNP lists respectively, after which we regenerated the Ler/Cvi SNP list to create the final lists of 378,743 Col/Ler SNPs, 555,801 Col/Cvi SNPs, and 619,477 Ler/Cvi SNPs (<xref ref-type="supplementary-material" rid="SD11-data">Supplementary file 2</xref>).</p></sec><sec id="s4-16"><title>Data access</title><p>Data is deposited under GEO accession number GSE52814 and is also available from the Dryad Digital Repository: <ext-link ext-link-type="uri" xlink:href="http://dx.doi.org/10.5061/dryad.gv536">http://dx.doi.org/10.5061/dryad.gv536</ext-link>.</p></sec></sec></body><back><ack id="ack"><title>Acknowledgements</title><p>We thank Prat Thiru and Bingbing Yuan for assistance with data analysis, Morgan Moeglein for technical assistance, the Whitehead Genome Technology core for strand-specific RNA-seq library preparation, high-throughput sequencing and sharing of equipment and reagents, Hongcang Gu and Alex Meissner for advice on bisulfite sequencing library preparation, members of the Bartel lab for advice and protocols on small RNA library preparation, and Nathan Springer for extensive discussions and comments on the manuscript. RME and CLP are recipients of NSF Graduate Research Fellowships. 
This work was funded by the NSF (MCB 1121952) and by a Pew Scholars award to MG from The Pew Charitable Trust's Pew Scholars Program in the Biomedical Sciences.</p></ack><sec sec-type="additional-information"><title>Additional information</title><fn-group content-type="competing-interest"><title>Competing interests</title><fn fn-type="conflict" id="conf1"><p>The authors declare that no competing interests exist.</p></fn></fn-group><fn-group content-type="author-contribution"><title>Author contributions</title><fn fn-type="con" id="con1"><p>DP, Conception and design, Acquisition of data, Analysis and interpretation of data, Drafting or revising the article</p></fn><fn fn-type="con" id="con2"><p>MG, Conception and design, Acquisition of data, Analysis and interpretation of data, Drafting or revising the article</p></fn><fn fn-type="con" id="con3"><p>RME, Acquisition of data, Analysis and interpretation of data, Drafting or revising the article</p></fn><fn fn-type="con" id="con4"><p>ES, Acquisition of data, Analysis and interpretation of data, Drafting or revising the article</p></fn><fn fn-type="con" id="con5"><p>CLP, Analysis and interpretation of data, Drafting or revising the article</p></fn><fn fn-type="con" id="con6"><p>GWB, Analysis and interpretation of data, Drafting or revising the article</p></fn></fn-group></sec><sec sec-type="supplementary-material"><title>Additional files</title><supplementary-material id="SD10-data"><object-id pub-id-type="doi">10.7554/eLife.03198.035</object-id><label>Supplementary file 1.</label><caption><p>Primers used in this study.</p><p><bold>DOI:</bold> <ext-link ext-link-type="doi" xlink:href="10.7554/eLife.03198.035">http://dx.doi.org/10.7554/eLife.03198.035</ext-link></p></caption><media mime-subtype="xlsx" mimetype="application" xlink:href="elife03198s010.xlsx"/></supplementary-material><supplementary-material id="SD11-data"><object-id pub-id-type="doi">10.7554/eLife.03198.036</object-id><label>Supplementary file 
2.</label><caption><p>SNPs used in this study.</p><p><bold>DOI:</bold> <ext-link ext-link-type="doi" xlink:href="10.7554/eLife.03198.036">http://dx.doi.org/10.7554/eLife.03198.036</ext-link></p></caption><media mime-subtype="xlsx" mimetype="application" xlink:href="elife03198s011.xlsx"/></supplementary-material><supplementary-material id="SD12-data"><object-id pub-id-type="doi">10.7554/eLife.03198.037</object-id><label>Supplementary file 3.</label><caption><p>Script to classify mRNA-seq reads by strain.</p><p><bold>DOI:</bold> <ext-link ext-link-type="doi" xlink:href="10.7554/eLife.03198.037">http://dx.doi.org/10.7554/eLife.03198.037</ext-link></p></caption><media mime-subtype="pl" mimetype="text" xlink:href="elife03198s012.pl"/></supplementary-material><sec sec-type="datasets"><title>Major datasets</title><p>The following datasets were generated:</p><p><related-object content-type="generated-dataset" document-id="Dataset ID and/or url" document-id-type="dataset" document-type="data" id="dataro1"><name><surname>Gehring</surname><given-names>M</given-names></name>, <name><surname>Pignatta</surname><given-names>D</given-names></name>, <name><surname>Erdmann</surname><given-names>RM</given-names></name>, <name><surname>Bell</surname><given-names>GW</given-names></name>, <name><surname>Scheer</surname><given-names>E</given-names></name>, <year>2013</year><x>, </x><source>Data from: Natural epigenetic polymorphisms lead to intraspecific variation in Arabidopsis gene imprinting</source><x>, </x><ext-link ext-link-type="uri" xlink:href="https://datadryad.org/resource/doi:10.5061/dryad.gv536">https://datadryad.org/resource/doi:10.5061/dryad.gv536</ext-link><x>, </x><comment>Available at Dryad Digital Repository under a CC0 Public Domain Dedication.</comment></related-object></p><p><related-object content-type="generated-dataset" document-id="Dataset ID and/or url" document-id-type="dataset" document-type="data" 
id="dataro2"><name><surname>Gehring</surname><given-names>Mary</given-names></name>, <year>2013</year><x>, </x><source>Data from: Natural epigenetic polymorphisms lead to intraspecific variation in Arabidopsis gene imprinting</source><x>, </x><ext-link ext-link-type="uri" xlink:href="http://www.ncbi.nlm.nih.gov/geo/query/acc.cgi?token=glkjwaugdhatvut&amp;acc=GSE52814">http://www.ncbi.nlm.nih.gov/geo/query/acc.cgi?token=glkjwaugdhatvut&amp;acc=GSE52814</ext-link><x>, </x><comment>Publicly available at NCBI Gene Expression Omnibus.</comment></related-object></p></sec></sec><ref-list><title>References</title><ref id="bib1"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Ahmed</surname><given-names>I</given-names></name><name><surname>Sarazin</surname><given-names>A</given-names></name><name><surname>Bowler</surname><given-names>C</given-names></name><name><surname>Colot</surname><given-names>V</given-names></name><name><surname>Quesneville</surname><given-names>H</given-names></name></person-group><year>2011</year><article-title>Genome-wide evidence for local DNA methylation spreading from small RNA-targeted sequences in Arabidopsis</article-title><source>Nucleic Acids Research</source><volume>39</volume><fpage>6919</fpage><lpage>6931</lpage><pub-id pub-id-type="doi">10.1093/nar/gkr324</pub-id></element-citation></ref><ref id="bib2"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Alleman</surname><given-names>M</given-names></name><name><surname>Doctor</surname><given-names>J</given-names></name></person-group><year>2000</year><article-title>Genomic imprinting in plants: observations and evolutionary implications</article-title><source>Plant Molecular Biology</source><volume>43</volume><fpage>147</fpage><lpage>161</lpage><pub-id pub-id-type="doi">10.1023/A:1006419025155</pub-id></element-citation></ref><ref id="bib3"><element-citation 
publication-type="journal"><person-group person-group-type="author"><name><surname>Alonso-Blanco</surname><given-names>C</given-names></name><name><surname>Blankestijn-De Vries</surname><given-names>H</given-names></name><name><surname>Hanhart</surname><given-names>CJ</given-names></name><name><surname>Koornneef</surname><given-names>M</given-names></name></person-group><year>1999</year><article-title>Natural allelic variation at seed size loci in relation to other life history traits of Arabidopsis thaliana</article-title><source>Proceedings of the National Academy of Sciences of the United States of America</source><volume>96</volume><fpage>4710</fpage><lpage>4717</lpage><pub-id pub-id-type="doi">10.1073/pnas.96.8.4710</pub-id></element-citation></ref><ref id="bib4"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Becker</surname><given-names>C</given-names></name><name><surname>Hagmann</surname><given-names>J</given-names></name><name><surname>Müller</surname><given-names>J</given-names></name><name><surname>Koenig</surname><given-names>D</given-names></name><name><surname>Stegle</surname><given-names>O</given-names></name><name><surname>Borgwardt</surname><given-names>K</given-names></name><name><surname>Weigel</surname><given-names>D</given-names></name></person-group><year>2011</year><article-title>Spontaneous epigenetic variation in the <italic>Arabidopsis thaliana</italic> methylome</article-title><source>Nature</source><volume>480</volume><fpage>245</fpage><lpage>249</lpage><pub-id pub-id-type="doi">10.1038/nature10555</pub-id></element-citation></ref><ref id="bib5"><element-citation publication-type="journal"><person-group 
person-group-type="author"><name><surname>Belmonte</surname><given-names>MF</given-names></name><name><surname>Kirkbride</surname><given-names>RC</given-names></name><name><surname>Stone</surname><given-names>SL</given-names></name><name><surname>Pelletier</surname><given-names>JM</given-names></name><name><surname>Bui</surname><given-names>AQ</given-names></name><name><surname>Yeung</surname><given-names>EC</given-names></name><name><surname>Hashimoto</surname><given-names>M</given-names></name><name><surname>Fei</surname><given-names>J</given-names></name><name><surname>Harada</surname><given-names>CM</given-names></name><name><surname>Munoz</surname><given-names>MD</given-names></name><name><surname>Le</surname><given-names>BH</given-names></name><name><surname>Drews</surname><given-names>GN</given-names></name><name><surname>Brady</surname><given-names>SM</given-names></name><name><surname>Goldberg</surname><given-names>RB</given-names></name><name><surname>Harada</surname><given-names>JJ</given-names></name></person-group><year>2013</year><article-title>Comprehensive developmental profiles of gene activity in regions and subregions of the Arabidopsis seed</article-title><source>Proceedings of the National Academy of Sciences of the United States of America</source><volume>110</volume><fpage>E435</fpage><lpage>E444</lpage><pub-id pub-id-type="doi">10.1073/pnas.1222061110</pub-id></element-citation></ref><ref id="bib6"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Calarco</surname><given-names>JP</given-names></name><name><surname>Borges</surname><given-names>F</given-names></name><name><surname>Donoghue</surname><given-names>MT</given-names></name><name><surname>Van 
Ex</surname><given-names>F</given-names></name><name><surname>Jullien</surname><given-names>PE</given-names></name><name><surname>Lopes</surname><given-names>T</given-names></name><name><surname>Gardner</surname><given-names>R</given-names></name><name><surname>Berger</surname><given-names>F</given-names></name><name><surname>Feijó</surname><given-names>JA</given-names></name><name><surname>Becker</surname><given-names>JD</given-names></name><name><surname>Martienssen</surname><given-names>RA</given-names></name></person-group><year>2012</year><article-title>Reprogramming of DNA methylation in pollen guides epigenetic inheritance via small RNA</article-title><source>Cell</source><volume>151</volume><fpage>194</fpage><lpage>205</lpage><pub-id pub-id-type="doi">10.1016/j.cell.2012.09.001</pub-id></element-citation></ref><ref id="bib7"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Cao</surname><given-names>J</given-names></name><name><surname>Schneeberger</surname><given-names>K</given-names></name><name><surname>Ossowski</surname><given-names>S</given-names></name><name><surname>Günther</surname><given-names>T</given-names></name><name><surname>Bender</surname><given-names>S</given-names></name><name><surname>Fitz</surname><given-names>J</given-names></name><name><surname>Koenig</surname><given-names>D</given-names></name><name><surname>Lanz</surname><given-names>C</given-names></name><name><surname>Stegle</surname><given-names>O</given-names></name><name><surname>Lippert</surname><given-names>C</given-names></name><name><surname>Wang</surname><given-names>X</given-names></name><name><surname>Ott</surname><given-names>F</given-names></name><name><surname>Müller</surname><given-names>J</given-names></name><name><surname>Alonso-Blanco</surname><given-names>C</given-names></name><name><surname>Borgwardt</surname><given-names>K</given-names></name><name><surname>Schmid</surname><given-names>KJ</given-names></name><nam
e><surname>Weigel</surname><given-names>D</given-names></name></person-group><year>2011</year><article-title>Whole-genome sequencing of multiple <italic>Arabidopsis thaliana</italic> populations</article-title><source>Nature Genetics</source><volume>43</volume><fpage>956</fpage><lpage>963</lpage><pub-id pub-id-type="doi">10.1038/ng.911</pub-id></element-citation></ref><ref id="bib8"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>DeVeale</surname><given-names>B</given-names></name><name><surname>van der Kooy</surname><given-names>D</given-names></name><name><surname>Babak</surname><given-names>T</given-names></name></person-group><year>2012</year><article-title>Critical evaluation of imprinted gene expression by RNA-Seq: a new perspective</article-title><source>PLOS Genetics</source><volume>8</volume><fpage>e1002600</fpage><pub-id pub-id-type="doi">10.1371/journal.pgen.1002600</pub-id></element-citation></ref><ref id="bib9"><element-citation publication-type="journal"><person-group 
person-group-type="author"><name><surname>Gan</surname><given-names>X</given-names></name><name><surname>Stegle</surname><given-names>O</given-names></name><name><surname>Behr</surname><given-names>J</given-names></name><name><surname>Steffen</surname><given-names>JG</given-names></name><name><surname>Drewe</surname><given-names>P</given-names></name><name><surname>Hildebrand</surname><given-names>KL</given-names></name><name><surname>Lyngsoe</surname><given-names>R</given-names></name><name><surname>Schultheiss</surname><given-names>SJ</given-names></name><name><surname>Osborne</surname><given-names>EJ</given-names></name><name><surname>Sreedharan</surname><given-names>VT</given-names></name><name><surname>Kahles</surname><given-names>A</given-names></name><name><surname>Bohnert</surname><given-names>R</given-names></name><name><surname>Jean</surname><given-names>G</given-names></name><name><surname>Derwent</surname><given-names>P</given-names></name><name><surname>Kersey</surname><given-names>P</given-names></name><name><surname>Belfield</surname><given-names>EJ</given-names></name><name><surname>Harberd</surname><given-names>NP</given-names></name><name><surname>Kemen</surname><given-names>E</given-names></name><name><surname>Toomajian</surname><given-names>C</given-names></name><name><surname>Kover</surname><given-names>PX</given-names></name><name><surname>Clark</surname><given-names>RM</given-names></name><name><surname>Rätsch</surname><given-names>G</given-names></name><name><surname>Mott</surname><given-names>R</given-names></name></person-group><year>2011</year><article-title>Multiple reference genomes and transcriptomes for <italic>Arabidopsis thaliana</italic></article-title><source>Nature</source><volume>477</volume><fpage>419</fpage><lpage>423</lpage><pub-id pub-id-type="doi">10.1038/nature10414</pub-id></element-citation></ref><ref id="bib10"><element-citation publication-type="journal"><person-group 
person-group-type="author"><name><surname>Gehring</surname><given-names>M</given-names></name></person-group><year>2013</year><article-title>Genomic imprinting: insights from plants</article-title><source>Annual Review of Genetics</source><volume>47</volume><fpage>187</fpage><lpage>208</lpage><pub-id pub-id-type="doi">10.1146/annurev-genet-110711-155527</pub-id></element-citation></ref><ref id="bib11"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Gehring</surname><given-names>M</given-names></name><name><surname>Bubb</surname><given-names>KL</given-names></name><name><surname>Henikoff</surname><given-names>S</given-names></name></person-group><year>2009</year><article-title>Extensive demethylation of repetitive elements during seed development underlies gene imprinting</article-title><source>Science</source><volume>324</volume><fpage>1447</fpage><lpage>1451</lpage><pub-id pub-id-type="doi">10.1126/science.1171609</pub-id></element-citation></ref><ref id="bib12"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Gehring</surname><given-names>M</given-names></name><name><surname>Huh</surname><given-names>JH</given-names></name><name><surname>Hsieh</surname><given-names>TF</given-names></name><name><surname>Penterman</surname><given-names>J</given-names></name><name><surname>Choi</surname><given-names>Y</given-names></name><name><surname>Harada</surname><given-names>JJ</given-names></name><name><surname>Goldberg</surname><given-names>RB</given-names></name><name><surname>Fischer</surname><given-names>RL</given-names></name></person-group><year>2006</year><article-title>DEMETER DNA glycosylase establishes MEDEA polycomb gene self-imprinting by allele-specific demethylation</article-title><source>Cell</source><volume>124</volume><fpage>495</fpage><lpage>506</lpage><pub-id pub-id-type="doi">10.1016/j.cell.2005.12.034</pub-id></element-citation></ref><ref 
id="bib13"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Gehring</surname><given-names>M</given-names></name><name><surname>Missirian</surname><given-names>V</given-names></name><name><surname>Henikoff</surname><given-names>S</given-names></name></person-group><year>2011</year><article-title>Genomic analysis of parent-of-origin allelic expression in <italic>Arabidopsis thaliana</italic> seeds</article-title><source>PLOS ONE</source><volume>6</volume><fpage>e23687</fpage><pub-id pub-id-type="doi">10.1371/journal.pone.0023687</pub-id></element-citation></ref><ref id="bib14"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Grimson</surname><given-names>A</given-names></name><name><surname>Srivastava</surname><given-names>M</given-names></name><name><surname>Fahey</surname><given-names>B</given-names></name><name><surname>Woodcroft</surname><given-names>BJ</given-names></name><name><surname>Chiang</surname><given-names>HR</given-names></name><name><surname>King</surname><given-names>N</given-names></name><name><surname>Degnan</surname><given-names>BM</given-names></name><name><surname>Rokhsar</surname><given-names>DS</given-names></name><name><surname>Bartel</surname><given-names>DP</given-names></name></person-group><year>2008</year><article-title>Early origins and evolution of microRNAs and Piwi-interacting RNAs in animals</article-title><source>Nature</source><volume>455</volume><fpage>1193</fpage><lpage>1197</lpage><pub-id pub-id-type="doi">10.1038/nature07415</pub-id></element-citation></ref><ref id="bib15"><element-citation publication-type="journal"><person-group 
person-group-type="author"><name><surname>Gruntman</surname><given-names>E</given-names></name><name><surname>Qi</surname><given-names>Y</given-names></name><name><surname>Slotkin</surname><given-names>RK</given-names></name><name><surname>Roeder</surname><given-names>T</given-names></name><name><surname>Martienssen</surname><given-names>RA</given-names></name><name><surname>Sachidanandam</surname><given-names>R</given-names></name></person-group><year>2008</year><article-title>Kismeth: analyzer of plant methylation states through bisulfite sequencing</article-title><source>BMC Bioinformatics</source><volume>9</volume><fpage>371</fpage><pub-id pub-id-type="doi">10.1186/1471-2105-9-371</pub-id></element-citation></ref><ref id="bib16"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Haig</surname><given-names>D</given-names></name></person-group><year>2013</year><article-title>Kin conflict in seed development: an interdependent but fractious collective</article-title><source>Annual Review of Cell and Developmental Biology</source><volume>29</volume><fpage>189</fpage><lpage>211</lpage><pub-id pub-id-type="doi">10.1146/annurev-cellbio-101512-122324</pub-id></element-citation></ref><ref id="bib17"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Hollister</surname><given-names>JD</given-names></name><name><surname>Gaut</surname><given-names>BS</given-names></name></person-group><year>2009</year><article-title>Epigenetic silencing of transposable elements: a trade-off between reduced transposition and deleterious effects on neighboring gene expression</article-title><source>Genome Research</source><volume>19</volume><fpage>1419</fpage><lpage>1428</lpage><pub-id pub-id-type="doi">10.1101/gr.091678.109</pub-id></element-citation></ref><ref id="bib18"><element-citation publication-type="journal"><person-group 
person-group-type="author"><name><surname>Hollister</surname><given-names>JD</given-names></name><name><surname>Smith</surname><given-names>LM</given-names></name><name><surname>Guo</surname><given-names>YL</given-names></name><name><surname>Ott</surname><given-names>F</given-names></name><name><surname>Weigel</surname><given-names>D</given-names></name><name><surname>Gaut</surname><given-names>BS</given-names></name></person-group><year>2011</year><article-title>Transposable elements and small RNAs contribute to gene expression divergence between <italic>Arabidopsis thaliana</italic> and Arabidopsis lyrata</article-title><source>Proceedings of the National Academy of Sciences of the United States of America</source><volume>108</volume><fpage>2322</fpage><lpage>2327</lpage><pub-id pub-id-type="doi">10.1073/pnas.1018222108</pub-id></element-citation></ref><ref id="bib19"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Hsieh</surname><given-names>TF</given-names></name><name><surname>Ibarra</surname><given-names>CA</given-names></name><name><surname>Silva</surname><given-names>P</given-names></name><name><surname>Zemach</surname><given-names>A</given-names></name><name><surname>Eshed-Williams</surname><given-names>L</given-names></name><name><surname>Fischer</surname><given-names>RL</given-names></name><name><surname>Zilberman</surname><given-names>D</given-names></name></person-group><year>2009</year><article-title>Genome-wide demethylation of Arabidopsis endosperm</article-title><source>Science</source><volume>324</volume><fpage>1451</fpage><lpage>1454</lpage><pub-id pub-id-type="doi">10.1126/science.1172417</pub-id></element-citation></ref><ref id="bib20"><element-citation publication-type="journal"><person-group 
person-group-type="author"><name><surname>Hsieh</surname><given-names>TF</given-names></name><name><surname>Shin</surname><given-names>J</given-names></name><name><surname>Uzawa</surname><given-names>R</given-names></name><name><surname>Silva</surname><given-names>P</given-names></name><name><surname>Cohen</surname><given-names>S</given-names></name><name><surname>Bauer</surname><given-names>MJ</given-names></name><name><surname>Hashimoto</surname><given-names>M</given-names></name><name><surname>Kirkbride</surname><given-names>RC</given-names></name><name><surname>Harada</surname><given-names>JJ</given-names></name><name><surname>Zilberman</surname><given-names>D</given-names></name><name><surname>Fischer</surname><given-names>RL</given-names></name></person-group><year>2011</year><article-title>Regulation of imprinted gene expression in Arabidopsis endosperm</article-title><source>Proceedings of the National Academy of Sciences of the United States of America</source><volume>108</volume><fpage>1755</fpage><lpage>1762</lpage><pub-id pub-id-type="doi">10.1073/pnas.1019273108</pub-id></element-citation></ref><ref id="bib21"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Huang</surname><given-names>DW</given-names></name><name><surname>Sherman</surname><given-names>BT</given-names></name><name><surname>Lempicki</surname><given-names>RA</given-names></name></person-group><year>2009a</year><article-title>Bioinformatics enrichment tools: paths toward the comprehensive functional analysis of large gene lists</article-title><source>Nucleic Acids Research</source><volume>37</volume><fpage>1</fpage><lpage>13</lpage><pub-id pub-id-type="doi">10.1093/nar/gkn923</pub-id></element-citation></ref><ref id="bib22"><element-citation publication-type="journal"><person-group 
person-group-type="author"><name><surname>Huang</surname><given-names>DW</given-names></name><name><surname>Sherman</surname><given-names>BT</given-names></name><name><surname>Lempicki</surname><given-names>RA</given-names></name></person-group><year>2009b</year><article-title>Systematic and integrative analysis of large gene lists using DAVID bioinformatics resources</article-title><source>Nature Protocols</source><volume>4</volume><fpage>44</fpage><lpage>57</lpage><pub-id pub-id-type="doi">10.1038/nprot.2008.211</pub-id></element-citation></ref><ref id="bib23"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Ibarra</surname><given-names>CA</given-names></name><name><surname>Feng</surname><given-names>X</given-names></name><name><surname>Schoft</surname><given-names>VK</given-names></name><name><surname>Hsieh</surname><given-names>TF</given-names></name><name><surname>Uzawa</surname><given-names>R</given-names></name><name><surname>Rodrigues</surname><given-names>JA</given-names></name><name><surname>Zemach</surname><given-names>A</given-names></name><name><surname>Chumak</surname><given-names>N</given-names></name><name><surname>Machlicova</surname><given-names>A</given-names></name><name><surname>Nishimura</surname><given-names>T</given-names></name><name><surname>Rojas</surname><given-names>D</given-names></name><name><surname>Fischer</surname><given-names>RL</given-names></name><name><surname>Tamaru</surname><given-names>H</given-names></name><name><surname>Zilberman</surname><given-names>D</given-names></name></person-group><year>2012</year><article-title>Active DNA demethylation in plant companion cells reinforces transposon methylation in gametes</article-title><source>Science</source><volume>337</volume><fpage>1360</fpage><lpage>1364</lpage><pub-id pub-id-type="doi">10.1126/science.1224839</pub-id></element-citation></ref><ref id="bib24"><element-citation publication-type="journal"><person-group 
person-group-type="author"><name><surname>Ingouff</surname><given-names>M</given-names></name><name><surname>Fitz Gerald</surname><given-names>JN</given-names></name><name><surname>Guérin</surname><given-names>C</given-names></name><name><surname>Robert</surname><given-names>H</given-names></name><name><surname>Sørensen</surname><given-names>MB</given-names></name><name><surname>Van Damme</surname><given-names>D</given-names></name><name><surname>Geelen</surname><given-names>D</given-names></name><name><surname>Blanchoin</surname><given-names>L</given-names></name><name><surname>Berger</surname><given-names>F</given-names></name></person-group><year>2005</year><article-title>Plant formin AtFH5 is an evolutionarily conserved actin nucleator involved in cytokinesis</article-title><source>Nature Cell Biology</source><volume>7</volume><fpage>374</fpage><lpage>380</lpage><pub-id pub-id-type="doi">10.1038/ncb1238</pub-id></element-citation></ref><ref id="bib25"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Jiang</surname><given-names>H</given-names></name><name><surname>Köhler</surname><given-names>C</given-names></name></person-group><year>2012</year><article-title>Evolution, function, and regulation of genomic imprinting in plant seed development</article-title><source>Journal of Experimental Botany</source><volume>63</volume><fpage>4713</fpage><lpage>4722</lpage><pub-id pub-id-type="doi">10.1093/jxb/ers145</pub-id></element-citation></ref><ref id="bib26"><element-citation publication-type="journal"><person-group 
person-group-type="author"><name><surname>Jullien</surname><given-names>PE</given-names></name><name><surname>Susaki</surname><given-names>D</given-names></name><name><surname>Yelagandula</surname><given-names>R</given-names></name><name><surname>Higashiyama</surname><given-names>T</given-names></name><name><surname>Berger</surname><given-names>F</given-names></name></person-group><year>2012</year><article-title>DNA methylation dynamics during sexual reproduction in <italic>Arabidopsis thaliana</italic></article-title><source>Current Biology</source><volume>22</volume><fpage>1825</fpage><lpage>1830</lpage><pub-id pub-id-type="doi">10.1016/j.cub.2012.07.061</pub-id></element-citation></ref><ref id="bib27"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Kermicle</surname><given-names>JL</given-names></name></person-group><year>1970</year><article-title>Dependence of the R-mottled aleurone phenotype in maize on mode of sexual transmission</article-title><source>Genetics</source><volume>66</volume><fpage>69</fpage><lpage>85</lpage></element-citation></ref><ref id="bib28"><element-citation publication-type="book"><person-group person-group-type="author"><name><surname>Kermicle</surname><given-names>J</given-names></name></person-group><year>1978</year><article-title>Imprinting of gene action in maize endosperm</article-title><source>Maize Breeding and Genetics</source><fpage>357</fpage><lpage>371</lpage></element-citation></ref><ref id="bib29"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Kim</surname><given-names>SI</given-names></name><name><surname>Tai</surname><given-names>TH</given-names></name></person-group><year>2010</year><article-title>Genetic analysis of two OsLpa1-like genes in Arabidopsis reveals that only one is required for wild-type seed phytic acid 
levels</article-title><source>Planta</source><volume>232</volume><fpage>1241</fpage><lpage>1250</lpage><pub-id pub-id-type="doi">10.1007/s00425-010-1243-5</pub-id></element-citation></ref><ref id="bib30"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Köhler</surname><given-names>C</given-names></name><name><surname>Wolff</surname><given-names>P</given-names></name><name><surname>Spillane</surname><given-names>C</given-names></name></person-group><year>2012</year><article-title>Epigenetic mechanisms underlying genomic imprinting in plants</article-title><source>Annual Review of Plant Biology</source><volume>63</volume><fpage>331</fpage><lpage>352</lpage><pub-id pub-id-type="doi">10.1146/annurev-arplant-042811-105514</pub-id></element-citation></ref><ref id="bib31"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Kradolfer</surname><given-names>D</given-names></name><name><surname>Wolff</surname><given-names>P</given-names></name><name><surname>Jiang</surname><given-names>H</given-names></name><name><surname>Siretskiy</surname><given-names>A</given-names></name><name><surname>Köhler</surname><given-names>C</given-names></name></person-group><year>2013</year><article-title>An imprinted gene underlies postzygotic reproductive isolation in <italic>Arabidopsis thaliana</italic></article-title><source>Developmental Cell</source><volume>26</volume><fpage>525</fpage><lpage>535</lpage><pub-id pub-id-type="doi">10.1016/j.devcel.2013.08.006</pub-id></element-citation></ref><ref id="bib32"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Krueger</surname><given-names>F</given-names></name><name><surname>Andrews</surname><given-names>SR</given-names></name></person-group><year>2011</year><article-title>Bismark: a flexible aligner and methylation caller for Bisulfite-Seq 
applications</article-title><source>Bioinformatics</source><volume>27</volume><fpage>1571</fpage><lpage>1572</lpage><pub-id pub-id-type="doi">10.1093/bioinformatics/btr167</pub-id></element-citation></ref><ref id="bib33"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Lafos</surname><given-names>M</given-names></name><name><surname>Kroll</surname><given-names>P</given-names></name><name><surname>Hohenstatt</surname><given-names>ML</given-names></name><name><surname>Thorpe</surname><given-names>FL</given-names></name><name><surname>Clarenz</surname><given-names>O</given-names></name><name><surname>Schubert</surname><given-names>D</given-names></name></person-group><year>2011</year><article-title>Dynamic regulation of H3K27 trimethylation during Arabidopsis differentiation</article-title><source>PLOS Genetics</source><volume>7</volume><fpage>e1002040</fpage><pub-id pub-id-type="doi">10.1371/journal.pgen.1002040</pub-id></element-citation></ref><ref id="bib34"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Langmead</surname><given-names>B</given-names></name><name><surname>Trapnell</surname><given-names>C</given-names></name><name><surname>Pop</surname><given-names>M</given-names></name><name><surname>Salzberg</surname><given-names>SL</given-names></name></person-group><year>2009</year><article-title>Ultrafast and memory-efficient alignment of short DNA sequences to the human genome</article-title><source>Genome Biology</source><volume>10</volume><fpage>R25</fpage><pub-id pub-id-type="doi">10.1186/gb-2009-10-3-r25</pub-id></element-citation></ref><ref id="bib35"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Law</surname><given-names>JA</given-names></name><name><surname>Jacobsen</surname><given-names>SE</given-names></name></person-group><year>2010</year><article-title>Establishing, maintaining and modifying 
DNA methylation patterns in plants and animals</article-title><source>Nature Reviews Genetics</source><volume>11</volume><fpage>204</fpage><lpage>220</lpage><pub-id pub-id-type="doi">10.1038/nrg2719</pub-id></element-citation></ref><ref id="bib36"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Lister</surname><given-names>R</given-names></name><name><surname>O'Malley</surname><given-names>RC</given-names></name><name><surname>Tonti-Filippini</surname><given-names>J</given-names></name><name><surname>Gregory</surname><given-names>BD</given-names></name><name><surname>Berry</surname><given-names>CC</given-names></name><name><surname>Millar</surname><given-names>AH</given-names></name><name><surname>Ecker</surname><given-names>JR</given-names></name></person-group><year>2008</year><article-title>Highly integrated single-base resolution maps of the epigenome in Arabidopsis</article-title><source>Cell</source><volume>133</volume><fpage>523</fpage><lpage>536</lpage><pub-id pub-id-type="doi">10.1016/j.cell.2008.03.029</pub-id></element-citation></ref><ref id="bib37"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Luo</surname><given-names>M</given-names></name><name><surname>Taylor</surname><given-names>JM</given-names></name><name><surname>Spriggs</surname><given-names>A</given-names></name><name><surname>Zhang</surname><given-names>H</given-names></name><name><surname>Wu</surname><given-names>X</given-names></name><name><surname>Russell</surname><given-names>S</given-names></name><name><surname>Singh</surname><given-names>M</given-names></name><name><surname>Koltunow</surname><given-names>A</given-names></name></person-group><year>2011</year><article-title>A genome-wide survey of imprinted genes in rice seeds reveals imprinting primarily occurs in the endosperm</article-title><source>PLOS Genetics</source><volume>7</volume><fpage>e1002125</fpage><pub-id 
pub-id-type="doi">10.1371/journal.pgen.1002125</pub-id></element-citation></ref><ref id="bib38"><element-citation publication-type="book"><person-group person-group-type="author"><name><surname>McClintock</surname><given-names>B</given-names></name></person-group><year>1965</year><article-title>Components of action of the regulators Spm and Ac</article-title><source>Carnegie Institution of Washington Year Book</source><fpage>527</fpage><lpage>535</lpage><volume>64</volume></element-citation></ref><ref id="bib39"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Mosher</surname><given-names>RA</given-names></name><name><surname>Melnyk</surname><given-names>CW</given-names></name><name><surname>Kelly</surname><given-names>KA</given-names></name><name><surname>Dunn</surname><given-names>RM</given-names></name><name><surname>Studholme</surname><given-names>DJ</given-names></name><name><surname>Baulcombe</surname><given-names>DC</given-names></name></person-group><year>2009</year><article-title>Uniparental expression of PolIV-dependent siRNAs in developing endosperm of Arabidopsis</article-title><source>Nature</source><volume>460</volume><fpage>283</fpage><lpage>286</lpage><pub-id pub-id-type="doi">10.1038/nature08084</pub-id></element-citation></ref><ref id="bib40"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Nordborg</surname><given-names>M</given-names></name><name><surname>Hu</surname><given-names>TT</given-names></name><name><surname>Ishino</surname><given-names>Y</given-names></name><name><surname>Jhaveri</surname><given-names>J</given-names></name><name><surname>Toomajian</surname><given-names>C</given-names></name></person-group><year>2005</year><article-title>The pattern of polymorphism in <italic>Arabidopsis thaliana</italic></article-title><source>PLOS Biology</source><volume>3</volume><fpage>e196</fpage><pub-id 
pub-id-type="doi">10.1371/journal.pbio.0030196</pub-id></element-citation></ref><ref id="bib42"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Rodrigues</surname><given-names>JA</given-names></name><name><surname>Ruan</surname><given-names>R</given-names></name><name><surname>Nishimura</surname><given-names>T</given-names></name><name><surname>Sharma</surname><given-names>MK</given-names></name><name><surname>Sharma</surname><given-names>R</given-names></name><name><surname>Ronald</surname><given-names>PC</given-names></name><name><surname>Fischer</surname><given-names>RL</given-names></name><name><surname>Zilberman</surname><given-names>D</given-names></name></person-group><year>2013</year><article-title>Imprinted expression of genes and small RNA is associated with localized hypomethylation of the maternal genome in rice endosperm</article-title><source>Proceedings of the National Academy of Sciences of the United States of America</source><volume>110</volume><fpage>7934</fpage><lpage>7939</lpage><pub-id pub-id-type="doi">10.1073/pnas.1306164110</pub-id></element-citation></ref><ref id="bib43"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Schmitz</surname><given-names>RJ</given-names></name><name><surname>Schultz</surname><given-names>MD</given-names></name><name><surname>Lewsey</surname><given-names>MG</given-names></name><name><surname>O'Malley</surname><given-names>RC</given-names></name><name><surname>Urich</surname><given-names>MA</given-names></name><name><surname>Libiger</surname><given-names>O</given-names></name><name><surname>Schork</surname><given-names>NJ</given-names></name><name><surname>Ecker</surname><given-names>JR</given-names></name></person-group><year>2011</year><article-title>Transgenerational epigenetic instability is a source of novel methylation 
variants</article-title><source>Science</source><volume>334</volume><fpage>369</fpage><lpage>373</lpage><pub-id pub-id-type="doi">10.1126/science.1212959</pub-id></element-citation></ref><ref id="bib44"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Schmitz</surname><given-names>RJ</given-names></name><name><surname>Schultz</surname><given-names>MD</given-names></name><name><surname>Urich</surname><given-names>MA</given-names></name><name><surname>Nery</surname><given-names>JR</given-names></name><name><surname>Pelizzola</surname><given-names>M</given-names></name><name><surname>Libiger</surname><given-names>O</given-names></name><name><surname>Alix</surname><given-names>A</given-names></name><name><surname>McCosh</surname><given-names>RB</given-names></name><name><surname>Chen</surname><given-names>H</given-names></name><name><surname>Schork</surname><given-names>NJ</given-names></name><name><surname>Ecker</surname><given-names>JR</given-names></name></person-group><year>2013</year><article-title>Patterns of population epigenomic diversity</article-title><source>Nature</source><volume>495</volume><fpage>193</fpage><lpage>198</lpage><pub-id pub-id-type="doi">10.1038/nature11968</pub-id></element-citation></ref><ref id="bib45"><element-citation publication-type="journal"><person-group 
person-group-type="author"><name><surname>Schoft</surname><given-names>VK</given-names></name><name><surname>Chumak</surname><given-names>N</given-names></name><name><surname>Choi</surname><given-names>Y</given-names></name><name><surname>Hannon</surname><given-names>M</given-names></name><name><surname>Garcia-Aguilar</surname><given-names>M</given-names></name><name><surname>Machlicova</surname><given-names>A</given-names></name><name><surname>Slusarz</surname><given-names>L</given-names></name><name><surname>Mosiolek</surname><given-names>M</given-names></name><name><surname>Park</surname><given-names>JS</given-names></name><name><surname>Park</surname><given-names>GT</given-names></name><name><surname>Fischer</surname><given-names>RL</given-names></name><name><surname>Tamaru</surname><given-names>H</given-names></name></person-group><year>2011</year><article-title>Function of the DEMETER DNA glycosylase in the <italic>Arabidopsis thaliana</italic> male gametophyte</article-title><source>Proceedings of the National Academy of Sciences of the United States of America</source><volume>108</volume><fpage>8042</fpage><lpage>8047</lpage><pub-id pub-id-type="doi">10.1073/pnas.1105117108</pub-id></element-citation></ref><ref id="bib46"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Schoft</surname><given-names>VK</given-names></name><name><surname>Chumak</surname><given-names>N</given-names></name><name><surname>Mosiolek</surname><given-names>M</given-names></name><name><surname>Slusarz</surname><given-names>L</given-names></name><name><surname>Komnenovic</surname><given-names>V</given-names></name><name><surname>Brownfield</surname><given-names>L</given-names></name><name><surname>Twell</surname><given-names>D</given-names></name><name><surname>Kakutani</surname><given-names>T</given-names></name><name><surname>Tamaru</surname><given-names>H</given-names></name></person-group><year>2009</year><article-title>Induction 
of RNA-directed DNA methylation upon decondensation of constitutive heterochromatin</article-title><source>EMBO Reports</source><volume>10</volume><fpage>1015</fpage><lpage>1021</lpage><pub-id pub-id-type="doi">10.1038/embor.2009.152</pub-id></element-citation></ref><ref id="bib47"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Schultz</surname><given-names>MD</given-names></name><name><surname>Schmitz</surname><given-names>RJ</given-names></name><name><surname>Ecker</surname><given-names>JR</given-names></name></person-group><year>2012</year><article-title>‘Leveling’ the playing field for analyses of single-base resolution DNA methylomes</article-title><source>Trends in Genetics</source><volume>28</volume><fpage>583</fpage><lpage>585</lpage><pub-id pub-id-type="doi">10.1016/j.tig.2012.10.012</pub-id></element-citation></ref><ref id="bib48"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Shukla</surname><given-names>S</given-names></name><name><surname>Kavak</surname><given-names>E</given-names></name><name><surname>Gregory</surname><given-names>M</given-names></name><name><surname>Imashimizu</surname><given-names>M</given-names></name><name><surname>Shutinoski</surname><given-names>B</given-names></name><name><surname>Kashlev</surname><given-names>M</given-names></name><name><surname>Oberdoerffer</surname><given-names>P</given-names></name><name><surname>Sandberg</surname><given-names>R</given-names></name><name><surname>Oberdoerffer</surname><given-names>S</given-names></name></person-group><year>2011</year><article-title>CTCF-promoted RNA polymerase II pausing links DNA methylation to splicing</article-title><source>Nature</source><volume>479</volume><fpage>74</fpage><lpage>79</lpage><pub-id pub-id-type="doi">10.1038/nature10442</pub-id></element-citation></ref><ref id="bib49"><element-citation publication-type="journal"><person-group 
person-group-type="author"><name><surname>Slotkin</surname><given-names>RK</given-names></name><name><surname>Martienssen</surname><given-names>R</given-names></name></person-group><year>2007</year><article-title>Transposable elements and the epigenetic regulation of the genome</article-title><source>Nature Reviews Genetics</source><volume>8</volume><fpage>272</fpage><lpage>285</lpage><pub-id pub-id-type="doi">10.1038/nrg2072</pub-id></element-citation></ref><ref id="bib50"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Tessadori</surname><given-names>F</given-names></name><name><surname>Schulkes</surname><given-names>RK</given-names></name><name><surname>van Driel</surname><given-names>R</given-names></name><name><surname>Fransz</surname><given-names>P</given-names></name></person-group><year>2007</year><article-title>Light-regulated large-scale reorganization of chromatin during the floral transition in Arabidopsis</article-title><source>The Plant Journal</source><volume>50</volume><fpage>848</fpage><lpage>857</lpage><pub-id pub-id-type="doi">10.1111/j.1365-313X.2007.03093.x</pub-id></element-citation></ref><ref id="bib51"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Tessadori</surname><given-names>F</given-names></name><name><surname>van Zanten</surname><given-names>M</given-names></name><name><surname>Pavlova</surname><given-names>P</given-names></name><name><surname>Clifton</surname><given-names>R</given-names></name><name><surname>Pontvianne</surname><given-names>F</given-names></name><name><surname>Snoek</surname><given-names>LB</given-names></name><name><surname>Millenaar</surname><given-names>FF</given-names></name><name><surname>Schulkes</surname><given-names>RK</given-names></name><name><surname>van 
Driel</surname><given-names>R</given-names></name><name><surname>Voesenek</surname><given-names>LA</given-names></name><name><surname>Spillane</surname><given-names>C</given-names></name><name><surname>Pikaard</surname><given-names>CS</given-names></name><name><surname>Fransz</surname><given-names>P</given-names></name><name><surname>Peeters</surname><given-names>AJ</given-names></name></person-group><year>2009</year><article-title>Phytochrome B and histone deacetylase 6 control light-induced chromatin compaction in <italic>Arabidopsis thaliana</italic></article-title><source>PLOS Genetics</source><volume>5</volume><fpage>e1000638</fpage><pub-id pub-id-type="doi">10.1371/journal.pgen.1000638</pub-id></element-citation></ref><ref id="bib52"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Toufighi</surname><given-names>K</given-names></name><name><surname>Brady</surname><given-names>SM</given-names></name><name><surname>Austin</surname><given-names>R</given-names></name><name><surname>Ly</surname><given-names>E</given-names></name><name><surname>Provart</surname><given-names>NJ</given-names></name></person-group><year>2005</year><article-title>The Botany Array Resource: e-Northerns, Expression Angling, and promoter analyses</article-title><source>The Plant Journal</source><volume>43</volume><fpage>153</fpage><lpage>163</lpage><pub-id pub-id-type="doi">10.1111/j.1365-313X.2005.02437.x</pub-id></element-citation></ref><ref id="bib53"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Trapnell</surname><given-names>C</given-names></name><name><surname>Pachter</surname><given-names>L</given-names></name><name><surname>Salzberg</surname><given-names>SL</given-names></name></person-group><year>2009</year><article-title>TopHat: discovering splice junctions with 
RNA-Seq</article-title><source>Bioinformatics</source><volume>25</volume><fpage>1105</fpage><lpage>1111</lpage><pub-id pub-id-type="doi">10.1093/bioinformatics/btp120</pub-id></element-citation></ref><ref id="bib54"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Tycko</surname><given-names>B</given-names></name><name><surname>Morison</surname><given-names>IM</given-names></name></person-group><year>2002</year><article-title>Physiological functions of imprinted genes</article-title><source>Journal of Cellular Physiology</source><volume>192</volume><fpage>245</fpage><lpage>258</lpage><pub-id pub-id-type="doi">10.1002/jcp.10129</pub-id></element-citation></ref><ref id="bib55"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Vu</surname><given-names>TM</given-names></name><name><surname>Nakamura</surname><given-names>M</given-names></name><name><surname>Calarco</surname><given-names>JP</given-names></name><name><surname>Susaki</surname><given-names>D</given-names></name><name><surname>Lim</surname><given-names>PQ</given-names></name><name><surname>Kinoshita</surname><given-names>T</given-names></name><name><surname>Higashiyama</surname><given-names>T</given-names></name><name><surname>Martienssen</surname><given-names>RA</given-names></name><name><surname>Berger</surname><given-names>F</given-names></name></person-group><year>2013</year><article-title>RNA-directed DNA methylation regulates parental genomic imprinting at several loci in Arabidopsis</article-title><source>Development</source><volume>140</volume><fpage>2953</fpage><lpage>2960</lpage><pub-id pub-id-type="doi">10.1242/dev.092981</pub-id></element-citation></ref><ref id="bib56"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Walker</surname><given-names>EL</given-names></name></person-group><year>1998</year><article-title>Paramutation of the r1 locus 
of maize is associated with increased cytosine methylation</article-title><source>Genetics</source><volume>148</volume><fpage>1973</fpage><lpage>1981</lpage></element-citation></ref><ref id="bib57"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Wang</surname><given-names>X</given-names></name><name><surname>Weigel</surname><given-names>D</given-names></name><name><surname>Smith</surname><given-names>LM</given-names></name></person-group><year>2013a</year><article-title>Transposon variants and their effects on gene expression in Arabidopsis</article-title><source>PLOS Genetics</source><volume>9</volume><fpage>e1003255</fpage><pub-id pub-id-type="doi">10.1371/journal.pgen.1003255</pub-id></element-citation></ref><ref id="bib58"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Wang</surname><given-names>X</given-names></name><name><surname>Miller</surname><given-names>DC</given-names></name><name><surname>Harman</surname><given-names>R</given-names></name><name><surname>Antczak</surname><given-names>DF</given-names></name><name><surname>Clark</surname><given-names>AG</given-names></name></person-group><year>2013b</year><article-title>Paternally expressed genes predominate in the placenta</article-title><source>Proceedings of the National Academy of Sciences of the United States of America</source><volume>110</volume><fpage>10705</fpage><lpage>10710</lpage><pub-id pub-id-type="doi">10.1073/pnas.1308998110</pub-id></element-citation></ref><ref id="bib59"><element-citation publication-type="journal"><person-group 
person-group-type="author"><name><surname>Waters</surname><given-names>AJ</given-names></name><name><surname>Bilinski</surname><given-names>P</given-names></name><name><surname>Eichten</surname><given-names>SR</given-names></name><name><surname>Vaughn</surname><given-names>MW</given-names></name><name><surname>Ross-Ibarra</surname><given-names>J</given-names></name><name><surname>Gehring</surname><given-names>M</given-names></name><name><surname>Springer</surname><given-names>NM</given-names></name></person-group><year>2013</year><article-title>Comprehensive analysis of imprinted genes in maize reveals allelic variation for imprinting and limited conservation with other species</article-title><source>Proceedings of the National Academy of Sciences of the United States of America</source><volume>110</volume><fpage>19639</fpage><lpage>19644</lpage><pub-id pub-id-type="doi">10.1073/pnas.1309182110</pub-id></element-citation></ref><ref id="bib60"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Waters</surname><given-names>AJ</given-names></name><name><surname>Makarevitch</surname><given-names>I</given-names></name><name><surname>Eichten</surname><given-names>SR</given-names></name><name><surname>Swanson-Wagner</surname><given-names>RA</given-names></name><name><surname>Yeh</surname><given-names>CT</given-names></name><name><surname>Xu</surname><given-names>W</given-names></name><name><surname>Schnable</surname><given-names>PS</given-names></name><name><surname>Vaughn</surname><given-names>MW</given-names></name><name><surname>Gehring</surname><given-names>M</given-names></name><name><surname>Springer</surname><given-names>NM</given-names></name></person-group><year>2012</year><article-title>Parent-of-origin effects on gene expression and DNA methylation in the Maize endosperm</article-title><source>The Plant Cell</source><volume>23</volume><fpage>4221</fpage><lpage>4233</lpage><pub-id 
pub-id-type="doi">10.1105/tpc.111.092668</pub-id></element-citation></ref><ref id="bib61"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Wolff</surname><given-names>P</given-names></name><name><surname>Weinhofer</surname><given-names>I</given-names></name><name><surname>Seguin</surname><given-names>J</given-names></name><name><surname>Roszak</surname><given-names>P</given-names></name><name><surname>Beisel</surname><given-names>C</given-names></name><name><surname>Donoghue</surname><given-names>MT</given-names></name><name><surname>Spillane</surname><given-names>C</given-names></name><name><surname>Nordborg</surname><given-names>M</given-names></name><name><surname>Rehmsmeier</surname><given-names>M</given-names></name><name><surname>Köhler</surname><given-names>C</given-names></name></person-group><year>2011</year><article-title>High-resolution analysis of parent-of-origin allelic expression in the Arabidopsis endosperm</article-title><source>PLOS Genetics</source><volume>7</volume><fpage>e1002126</fpage><pub-id pub-id-type="doi">10.1371/journal.pgen.1002126</pub-id></element-citation></ref><ref id="bib62"><element-citation publication-type="journal"><person-group 
person-group-type="author"><name><surname>Xin</surname><given-names>M</given-names></name><name><surname>Yang</surname><given-names>R</given-names></name><name><surname>Li</surname><given-names>G</given-names></name><name><surname>Chen</surname><given-names>H</given-names></name><name><surname>Laurie</surname><given-names>J</given-names></name><name><surname>Ma</surname><given-names>C</given-names></name><name><surname>Wang</surname><given-names>D</given-names></name><name><surname>Yao</surname><given-names>Y</given-names></name><name><surname>Larkins</surname><given-names>BA</given-names></name><name><surname>Sun</surname><given-names>Q</given-names></name><name><surname>Yadegari</surname><given-names>R</given-names></name><name><surname>Wang</surname><given-names>X</given-names></name><name><surname>Ni</surname><given-names>Z</given-names></name></person-group><year>2013</year><article-title>Dynamic expression of imprinted genes associates with maternally controlled nutrient allocation during maize endosperm development</article-title><source>The Plant Cell</source><volume>25</volume><fpage>3212</fpage><lpage>3227</lpage><pub-id pub-id-type="doi">10.1105/tpc.113.115592</pub-id></element-citation></ref><ref id="bib63"><element-citation publication-type="journal"><person-group 
person-group-type="author"><name><surname>Zhang</surname><given-names>M</given-names></name><name><surname>Xie</surname><given-names>S</given-names></name><name><surname>Dong</surname><given-names>X</given-names></name><name><surname>Zhao</surname><given-names>X</given-names></name><name><surname>Zeng</surname><given-names>B</given-names></name><name><surname>Chen</surname><given-names>J</given-names></name><name><surname>Li</surname><given-names>H</given-names></name><name><surname>Yang</surname><given-names>W</given-names></name><name><surname>Zhao</surname><given-names>H</given-names></name><name><surname>Wang</surname><given-names>G</given-names></name><name><surname>Chen</surname><given-names>Z</given-names></name><name><surname>Sun</surname><given-names>S</given-names></name><name><surname>Hauck</surname><given-names>A</given-names></name><name><surname>Jin</surname><given-names>W</given-names></name><name><surname>Lai</surname><given-names>J</given-names></name></person-group><year>2014</year><article-title>Genome-wide high resolution parental-specific DNA and histone methylation maps uncover patterns of imprinting regulation in maize</article-title><source>Genome Research</source><volume>24</volume><fpage>167</fpage><lpage>176</lpage><pub-id pub-id-type="doi">10.1101/gr.155879.113</pub-id></element-citation></ref><ref id="bib64"><element-citation publication-type="journal"><person-group 
person-group-type="author"><name><surname>Zhang</surname><given-names>M</given-names></name><name><surname>Zhao</surname><given-names>H</given-names></name><name><surname>Xie</surname><given-names>S</given-names></name><name><surname>Chen</surname><given-names>J</given-names></name><name><surname>Xu</surname><given-names>Y</given-names></name><name><surname>Wang</surname><given-names>K</given-names></name><name><surname>Zhao</surname><given-names>H</given-names></name><name><surname>Guan</surname><given-names>H</given-names></name><name><surname>Hu</surname><given-names>X</given-names></name><name><surname>Jiao</surname><given-names>Y</given-names></name><name><surname>Song</surname><given-names>W</given-names></name><name><surname>Lai</surname><given-names>J</given-names></name></person-group><year>2011</year><article-title>Extensive, clustered parental imprinting of protein-coding and noncoding RNAs in developing maize endosperm</article-title><source>Proceedings of the National Academy of Sciences of the United States of America</source><volume>108</volume><fpage>20042</fpage><lpage>20047</lpage><pub-id pub-id-type="doi">10.1073/pnas.1112186108</pub-id></element-citation></ref><ref id="bib65"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Zilberman</surname><given-names>D</given-names></name><name><surname>Gehring</surname><given-names>M</given-names></name><name><surname>Tran</surname><given-names>RK</given-names></name><name><surname>Ballinger</surname><given-names>T</given-names></name><name><surname>Henikoff</surname><given-names>S</given-names></name></person-group><year>2007</year><article-title>Genome-wide analysis of <italic>Arabidopsis thaliana</italic> DNA methylation uncovers an interdependence between methylation and transcription</article-title><source>Nature Genetics</source><volume>39</volume><fpage>61</fpage><lpage>69</lpage><pub-id 
pub-id-type="doi">10.1038/ng1929</pub-id></element-citation></ref></ref-list></back><sub-article article-type="article-commentary" id="SA1"><front-stub><article-id pub-id-type="doi">10.7554/eLife.03198.038</article-id><title-group><article-title>Decision letter</article-title></title-group><contrib-group content-type="section"><contrib contrib-type="editor"><name><surname>Weigel</surname><given-names>Detlef</given-names></name><role>Reviewing editor</role><aff><institution>Max Planck Institute for Developmental Biology</institution>, <country>Germany</country></aff></contrib></contrib-group></front-stub><body><boxed-text><p>eLife posts the editorial decision letter and author response on a selection of the published articles (subject to the approval of the authors). An edited version of the letter sent to the authors after peer review is shown, indicating the substantive concerns or comments; minor concerns are not usually shown. Reviewers have the opportunity to discuss the decision before the letter is sent (see <ext-link ext-link-type="uri" xlink:href="http://elifesciences.org/review-process">review process</ext-link>). Similarly, the author response typically shows only responses to the major concerns raised by the reviewers.</p></boxed-text><p>Thank you for resubmitting your work entitled “Natural epigenetic polymorphisms lead to intraspecific variation in Arabidopsis gene imprinting” for further consideration at <italic>eLife</italic>. Your revised article has been reviewed by Detlef Weigel (Senior editor) and two other peer reviewers. The manuscript has been improved but there are some remaining issues that need to be addressed before acceptance, as outlined below:</p><p>You use an impressive dataset of gene expression, DNA methylation and small RNAs from seeds of reciprocal hybrid plants between two Arabidopsis ecotypes to determine how many genes are imprinted in Arabidopsis. 
Although there have been several reports published in the past two years regarding epigenetic differences within and among Arabidopsis inbred lines, these data go one step farther by showing how these epigenetic differences can be associated with allele-specific imprinting.</p><p>While the reviewers would have liked to see a connection between imprinting polymorphisms and phenotypic effects, there was agreement that this is a difficult task. Nevertheless, there were two principal suggestions how the manuscript could be improved:</p><p>Despite their impressive dataset, you identify only six examples for allele-specific imprinting, only three of which are investigated in detail. You either need to investigate the other three, or if you tried to investigate them, explain what you found. If the global analysis had a 50% false discovery rate, then this would be important to know.</p><p>As importantly, the Discussion of the importance of epigenetic variation being linked or unlinked to genetic variation tends to obscure the important new points in the current work. The Discussion should focus on methylation variation being causal for imprinting differences, regardless of the proximate cause for methylation variation. Of course, it is ultimately important as well to partition methylation variation into ’pure’ methylation variation and methylation variation that is the result of nearby sequence changes, but this need not be the take home message of the current work.</p><p><italic>Reviewer #2</italic> major concerns:</p><p>1) From the start, this paper reads like a thesis and not a research paper. So much information is thrown at the reader that I didn't know what is important. For example, the Introduction is 4 pages long and attempts to review this entire field. Entire paragraphs should be removed so the reader doesn't get bogged down. In the Discussion, the writing is very repetitive between the first and last paragraphs on the page. 
Because of the way it is written (starting with very large datasets and narrowing down to 2-3 confirmed genes) the manuscript seems as if it has a very high data: conclusions ratio.</p><p>2) Throughout the manuscript the authors use CHH context methylation as a signature of RNA-directed DNA methylation. In the past year we have seen several high-profile publications demonstrating that CHH methylation can be maintained by CMT2. Therefore, CHH methylation is not just a signature of RdDM. The authors' analysis of CHH methylation is out of date and their calculation of the rate of RdDM based on CHH methylation is fundamentally flawed. In the Discussion, the fact that CHH is retained is provided as evidence of functional RdDM. This is simply incorrect logic.</p><p>3) The major experimental issue with this manuscript is that some of the genomes that are being analyzed by deep sequencing datasets have not been de novo assembled. Therefore, there is no guarantee that the gene-neighboring TE is even in the same location in the different genome. The bench work in the later figures proves for some examples that the TEs are in the correct locations, but these are just 2-3 out of hundreds analyzed. For example, the authors find 6 examples of allele-specific imprinted genes. However only 3 were confirmed by bench work and resequencing. Did the other 3 simply not have TEs next to those genes?</p><p>4) In the small RNA analysis, all sized small RNAs are lumped together, while only 24nt siRNAs direct DNA methylation. Why lump them all together? Instead, the analysis should focus on just the 24mers.</p><p>5) Do mutations in the 2-3 confirmed genes, such as HDG3, have seed phenotypes? For this manuscript to be on the Nature/Science/Cell level, the authors would need to show that these genes matter for phenotype and have an imprinted function, and it isn't just transcriptional noise or a random one-off. 
When studying transposable elements, you can always find one, two or a few out of tens of thousands have some odd expression or regulation pattern. However, this doesn't mean that these are larger modes of regulation, but rather just one or two positions that act strangely. Can the authors provide any evidence that this is a general mechanism and not just something weird that 2-3 out of thousands of genes or transposable elements do?</p><p>6) Lastly, as a major comment, I feel that the data visualization does not provide the reader with any way to observe the conclusions that the data is showing. For example, from <xref ref-type="fig" rid="fig2">Figure 2</xref> the authors argue that 12 genes have allele-specific imprinting... However, when I look closely at <xref ref-type="fig" rid="fig2">Figure 2A</xref>, I don't see any pattern or even understand what each row is. Sure, this is colorful, but I couldn't see any patterns or observe anything in the data for much of <xref ref-type="fig" rid="fig2">Figure 2</xref>, <xref ref-type="fig" rid="fig4">Figure 4A</xref>, all of <xref ref-type="fig" rid="fig5">Figure 5</xref>, and a significant portion of <xref ref-type="fig" rid="fig7">Figure 7</xref>. I personally think that the authors should step back, determine what they are trying to show, and then find alternate ways to display their large datasets in a way that the reader can see the same thing.</p><p><italic>Reviewer #3</italic> major concerns:</p><p>The authors point out that their ultimate goal is to connect imprinting polymorphisms to seed phenotypes. That is a difficult task, but that connection is not made in this manuscript. The Abstract includes the prediction that natural epialleles are likely to exert their strongest effect on plant development during the reproductive phase. 
This claim is intriguing, but drawing this conclusion from the data presented is difficult as the imprinting variation noted has not been connected to developmental phenotypes.</p><p>Short of making that connection, the results could be extended by investigating in more detail other allele-specific imprinted loci involving transposable elements (currently 3 of 6 are studied in more detail). In addition, the strength of the prediction about variable imprinting behavior could be explored by looking at more examples of intraspecific crosses with hypomethylated loci corresponding to PEGs in other interstrain crosses.</p><p>The question of whether the differences in DNA methylation are caused by genetic polymorphisms or not is addressed briefly in the text and <xref ref-type="fig" rid="fig6s3">Figure 6–figure supplement 3</xref>. This important point needs more consideration in the Discussion.</p><p>[Editors’ note: a previous version of this study was rejected after peer review, but the authors submitted for reconsideration. The previous decision letter after peer review is shown below.]</p><p>Thank you for choosing to send your work, “Natural epigenetic polymorphisms lead to intraspecific variation in Arabidopsis gene imprinting”, for consideration at <italic>eLife</italic>. Your submission has been reviewed by Detlef Weigel in consultation with two outside peer reviewers. Although the work is of interest, we regret to inform you that the findings at this stage are too preliminary for further consideration at <italic>eLife.</italic></p><p>The major concern was that it is difficult to draw definitive conclusions because of the design of the crosses, with an accession that stands out for its low overall methylation level playing a central role, together with the limitations imposed by the relatively small amount of BS-seq data. 
A further concern was that you did not take advantage of the opportunity to study a connection to a biological phenotype, large seeds when Cvi is the maternal parent.</p><p><italic>Reviewer 1:</italic></p><p>Substantive concerns:</p><p>The authors directly compared expression pattern and DNA methylation in six combinations of inter-accession crosses. They found intraspecific variation in imprinting associated with variation in DNA methylation. The most interesting observation is, however, that the Cvi accession is unique for its big seed phenotype, which is seen when Cvi is the female parent. Cvi is also unique in the low CpG methylation level in gene bodies. The Cvi-specific seed phenotype might be due to Cvi-specific variation in epigenetic state of imprinted gene(s). This very interesting possibility should be proven by identifying the gene(s) responsible for the seed phenotype. If substantiated through the action of specific gene(s), this would greatly elevate the work.</p><p><italic>Reviewer 2:</italic></p><p>Substantive concerns:</p><p>Pignatta and colleagues analyzed gene imprinting in crosses of three different accessions of <italic>A. thaliana</italic> (Col-0, Ler and Cvi) and its link to changes in TE and small RNA composition as well as DNA methylation. These specific accessions were chosen because of their differences in seed size and their degree of genetic divergence.</p><p>The authors identified 420 maternally and 159 paternally expressed genes. DNA methylation analysis revealed differentially methylated regions (DMRs) that were in most parts either specific for comparisons between accessions or for comparisons between endosperm and embryo. The authors identified three imprinted genes that were associated with DMRs (endosperm-embryo as well as across-accession comparisons). 
These genes were P/MEGs depending on the epigenetic configuration of the parents and are thus examples of epiallele-specific imprinted genes.</p><p>The authors address the interesting question if and how variations in the epigenetic configuration of the parents influence seed and embryo development through variations in imprinting. The authors have chosen an adequate model to address this question and have employed a broad spectrum of analyses. Unfortunately, the study suffers from weaknesses with regard to the technical and statistical procedures; furthermore the conclusions drawn by the authors are not entirely supported by the experimental evidence. In my view, with only three examples of epialleles influencing imprinting in the endosperm/embryo, the validity of extrapolating the results is not provided. The authors state that:</p><p>“Given the epigenetic diversity present within the species, we extrapolate that allele-specific imprinting will be widespread.” Cvi is the most highly differentially methylated <italic>A. thaliana</italic> accession analyzed to date (<xref ref-type="bibr" rid="bib44">Schmitz et al., 2013</xref>). If only three epialleles with effect on imprinting could be found in a comparison with this outlier strain, it is questionable that the effect is actually widespread.</p><p>On the technical side, I mainly criticize the low coverage of the BS-seq experiments, which to my opinion do not provide enough information for the performed analyses; and the RNA-seq experimental setup with essentially no replication.</p><p>The design of the mRNA-seq experiment is questionable. While two replicates were used for the Col-Cvi reciprocal crosses, there is only one for the respective Ler-Cvi crosses. For Col-Ler, the authors combined newly generated data with a previously published dataset (<xref ref-type="bibr" rid="bib13">Gehring et al., 2011</xref>). 
Not only does this mean that these crosses were done at completely different time points, the experiment also lacks the necessary replicates. In addition, the authors combined the reads of different replicates before doing the analysis. I recommend that at least three biological replicates should be used to gain enough statistical power for the confident detection of allele-specific gene expression. On a related note, I also wonder why the authors did not use long reads to increase their chances of allele-specific mapping of the reads?</p><p>The coverage obtained by BS-sequencing is very low! The Col-0 endosperm sample has 1,7 million reads, which results in a theoretical coverage of 0.5 x genome-wide. There are less than 1 million cytosines sufficiently covered in these samples and I doubt that this allows a representative and unbiased representation of the genome-wide DNA methylation.</p></body></sub-article><sub-article article-type="reply" id="SA2"><front-stub><article-id pub-id-type="doi">10.7554/eLife.03198.039</article-id><title-group><article-title>Author response</article-title></title-group></front-stub><body><p>We thank the reviewers for their continued consideration of the manuscript and their comments. In the revision we have further validated additional genes that were identified as allele-specific imprinted genes from the global RNA-seq analysis, including the three genes referenced above that were not investigated earlier. We performed RT-PCR on independently isolated endosperm samples (ColxLer, LerxCol, ColxCvi, CvixCol) and sequenced the cloned PCR products by Sanger sequencing (AT4G13460, AT1G26620, AT5G60760), or performed CAPS digestion (AT4G00750), to distinguish the maternal and paternal allelic contributions to gene expression. In agreement with the RNA-seq data, AT4G00750 was a MEG except when Ler was the male in the cross (<xref ref-type="fig" rid="fig1s2">Figure 1–figure supplement 2</xref>). 
The data for AT5G60760 were also in complete agreement with the RNA-seq data (PEG except when Ler is male in the cross). For AT1G26620 (PEG except when Cvi is the male) the Col-Cvi reciprocal crosses and Col x Ler data agreed with the RNA-seq data, but for Ler x Col there was more maternal allele expression than in the RNA-seq data. For AT4G13460 (PEG except when Ler is the male) Col-Ler reciprocal crosses and the Cvi x Col cross agreed with the RNA-seq data; in the Col x Cvi cross there was greater maternal allele expression. These data are in <xref ref-type="supplementary-material" rid="SD5-data">Figure 1–source data 5</xref> and, combined with our previous validation efforts, further support our global mRNA-seq analysis.</p><p>Additionally, we cloned and sequenced the 5’ regions in Ler and Cvi for the three additional allele-specific imprinted genes (AT4G13460, AT1G26620, AT5G60760) where the overlapping embryo-endosperm and strain DMRs fell within a TE. As expected given our mapping and analysis strategy, the methylation differences we observed are not due to absence or major sequence alteration of the TE. The sequencing confirmed the presence of the relevant TE in Ler and Cvi at the same genomic location as in Col. These results are stated in the text and further detailed in the response to reviewer 2 below.</p><p>As suggested, we have modulated the Results and Discussion to emphasize methylation variation as causal for the imprinting differences, rather than focusing on whether or not this variation is purely epigenetic.</p><p>Finally, as detailed in the response to specific reviewer comments below, we have further edited the manuscript for length, included analysis specifically of 24 nt small RNAs, and revised figures for clarity.</p><p>Reviewer #2 major concerns:</p><p><italic>1) From the start, this paper reads like a thesis and not a research paper. So much information is thrown at the reader that I didn't know what is important. 
For example, the Introduction is 4 pages long and attempts to review this entire field. Entire paragraphs should be removed so the reader doesn't get bogged down. In the Discussion, the writing is very repetitive between the first and last paragraphs on the page. Because of the way it is written (starting with very large datasets and narrowing down to 2-3 confirmed genes) the manuscript seems as if it has a very high data: conclusions ratio</italic>.</p><p>The manuscript has been edited for conciseness and clarity, and the Introduction is considerably shorter. With regard to the ratio of data to conclusions, we note that it would have been impossible to identify allele-specific imprinted genes without performing global mRNA-seq experiments from multiple accessions. We have primarily focused the paper on allele-specific imprinting in order to tell a comprehensive story. However, our work has several other novel and important conclusions, some of which we list here. This is the most comprehensive analysis of imprinting in Arabidopsis, and we find that most imprinted genes are consistently parentally biased among strains (<xref ref-type="fig" rid="fig1">Figure 1</xref> and associated supplemental figures); this is an important conclusion in its own right. We present the first data on allele-specific small RNAs from Arabidopsis seeds and find that paternal 24 nt small RNAs are present, despite a widely accepted view in the field (based on small RNA data from whole siliques) to the contrary (<xref ref-type="supplementary-material" rid="SD9-data">Figure 4–source data 1</xref>; <xref ref-type="fig" rid="fig5s3">Figure 5–figure supplement 3</xref>). We find that MEGs are enriched for small RNAs derived from the paternally inherited allele, suggesting that the paternal allele might be specifically silenced by <italic>cis</italic> acting small RNAs (<xref ref-type="fig" rid="fig5s3">Figure 5–figure supplement 3</xref>). 
We also show that the Cvi strain is strikingly hypomethylated in gene bodies (<xref ref-type="fig" rid="fig3">Figure 3</xref> and associated supplemental figures). Although the functional consequence of this, if any, is presently unknown, this observation is another important contribution to the field.</p><p><italic>2) Throughout the manuscript the authors use CHH context methylation as a signature of RNA-directed DNA methylation. In the past year we have seen several high-profile publications demonstrating that CHH methylation can be maintained by CMT2. Therefore, CHH methylation is not just a signature of RdDM. The author's analysis of CHH methylation is out of date and their calculation of the rate of RdDM based on CHH methylation is fundamentally flawed. In the Discussion, the fact that CHH is retained is provided as evidence of functional RdDM. This is simply incorrect logic</italic>.</p><p>We agree with the reviewer that the genome-wide % CHH methylation is not strictly informative of RdDM, but disagree that our analysis is fundamentally flawed. As shown by Zemach et al (<italic>Cell</italic> 153, 2013), CMT2 is primarily responsible for DNA methylation in heterochromatic TEs. The TEs demethylated in endosperm are not of the CMT2-type; they are primarily euchromatic TEs of the Helitron class (<xref ref-type="fig" rid="fig4s4">Figure 4–figure supplement 4</xref>).</p><p><italic>3) The major experimental issue with this manuscript is that some of the genomes that are being analyzed by deep sequencing datasets have not been de novo assembled. Therefore, there is no guarantee that the gene-neighboring TE is even in the same location in the different genome. The bench work in the later figures proves for some examples that the TEs are in the correct locations, but these are just 2-3 out of hundreds analyzed. For example, the authors find 6 examples of allele-specific imprinted genes. However only 3 were confirmed by bench work and resequencing</italic>. 
<italic>Did the other 3 simply not have TEs next to those genes?</italic></p><p>We have resequenced the 5’ regions containing the DMR and TE for the three other genes, AT4G13460, AT5G60760 and AT1G26620, from Ler and Cvi. In all cases the annotated TE is present at the same genomic location as in Col and contains a few SNPs but no major sequence alterations. Specifically, for AT1G26620 we sequenced 3400 bp 5’ of the gene, encompassing the DMR in AT1TE29660. The TE (at -900 to -1800) was present in the same location in Ler and Cvi as in Col, although in Cvi there was a 183 bp insertion at -420 and a 321 bp deletion at -2870 bp. These sequence differences are outside of the TE. For AT4G13460 we sequenced the entire 5’ region (2080 bp). Apart from a few SNPs there were no DNA sequence changes in Cvi. In Ler there were two small deletions (45 bp and 38 bp) 329 and 684 bp 5’ of the relevant TE, but no changes to the TE itself. For AT5G60760 we sequenced 2700 bp 5’ of the gene, encompassing AT5TE87930 and AT5TE87925, two contiguous TEs in the 5’ region. Both TEs are unaltered in Ler and Cvi except for a few SNPs.</p><p><italic>4) In the small RNA analysis, all sized small RNAs are lumped together, while only 24nt siRNAs direct DNA methylation. Why lump them all together? Instead, the analysis should focus on just the 24mers</italic>.</p><p>RdDM is primarily directed by 24 nt small RNAs (the Pol IV-RdDM pathway) but it has also been shown that RDR6-dependent 21 nt small RNAs can direct DNA methylation of TEs (see for example Pontier et al, <italic>Mol Cell</italic>, 2012 and Nuthikattu et al, <italic>Plant Physiol</italic>, 2013). However, the majority of small RNAs overlapping DMRs are of the 24 nt type. In response to the reviewer, we present the analysis on 24mers only in <xref ref-type="fig" rid="fig5">Figure 5</xref>, <xref ref-type="fig" rid="fig5s2">Figure 5–figure supplement 2</xref>, and <xref ref-type="fig" rid="fig5s3">Figure 5–figure supplement 3</xref>. 
This revision does not alter our conclusions.</p><p><italic>5) Do mutations in the 2-3 confirmed genes, such as HDG3, have seed phenotypes? For this manuscript to be on the Nature/Science/Cell level, the authors would need to show that these genes matter for phenotype and have an imprinted function, and it isn't just transcriptional noise or a random one-off. When studying transposable elements, you can always find one, two or a few out of tens of thousands have some odd expression or regulation pattern. However, this doesn't mean that these are larger modes of regulation, but rather just one or two positions that act strangely</italic>. <italic>Can the authors provide any evidence that this is a general mechanism and not just something weird that 2-3 out of thousands of genes or transposable elements do?</italic></p><p>We addressed how widespread allele-specific imprinting might be by looking at variation for all DMRs within the population (<xref ref-type="fig" rid="fig7">Figure 7</xref>). Based on this analysis, we believe that there are more examples of allele-specific imprinting than those that we specifically discovered in our Col/Ler/Cvi datasets, and we demonstrated this in additional strains for AT3G14205 and AT2G32370 (<xref ref-type="fig" rid="fig6">Figure 6</xref>, <xref ref-type="fig" rid="fig6s2">Figure 6–figure supplement 2</xref>). From our analysis we projected that maximally 11% of imprinted genes would be subject to allele specific imprinting. We would have been surprised if allele-specific imprinting was rampant. The ’general mechanism’ here is that natural variation in the methylation status of genes can alter whether or not they are imprinted. Even if a TE losing (or gaining) methylation in a particular strain is an infrequent event, the point is that these changes in methylation have consequences for gene expression. 
The analysis of population variation in DNA methylation shows that 15% of DMRs (the strongly bimodal class; <xref ref-type="fig" rid="fig7">Figure 7A</xref>) exist in highly methylated and lowly methylated states within the species. While not all of these methylation differences will impact imprinting, we have shown that it does for AT2G32370 and AT3G14205 (<xref ref-type="fig" rid="fig6">Figure 6</xref> and <xref ref-type="fig" rid="fig6s2">Figure 6–figure supplement 2</xref>). We do not yet know if <italic>HDG3</italic> (AT2G32370) or other allele-specific imprinted genes have phenotypes when mutated.</p><p><italic>6) Lastly, as a major comment, I feel that the data visualization does not provide the reader with any way to observe the conclusions that the data is showing. For example, from</italic> <xref ref-type="fig" rid="fig2"><italic>Figure 2</italic></xref> <italic>the authors argue that 12 genes have allele-specific imprinting... However, when I look closely at</italic> <xref ref-type="fig" rid="fig2"><italic>Figure 2A</italic></xref><italic>, I don't see any pattern or even understand what each row is. Sure, this is colorful, but I couldn't see any patterns or observe anything in the data for much of</italic> <xref ref-type="fig" rid="fig2"><italic>Figure 2</italic></xref><italic>,</italic> <xref ref-type="fig" rid="fig4"><italic>Figure 4A</italic></xref><italic>, all of</italic> <xref ref-type="fig" rid="fig5"><italic>Figure 5</italic></xref><italic>, and a significant portion of</italic> <xref ref-type="fig" rid="fig7"><italic>Figure 7</italic></xref><italic>. 
I personally think that the authors should step back, determine what they are trying to show, and then find alternate ways to display their large datasets in a way that the reader can see the same thing</italic>.</p><p>We have amended the figures as follows: part A has been removed from <xref ref-type="fig" rid="fig2">Figure 2</xref>, the heat map showing methylation difference at imprinted genes has been replaced with a methylation metagene analysis in <xref ref-type="fig" rid="fig5">Figure 5</xref>, and <xref ref-type="fig" rid="fig7">Figure 7</xref> has been modified to include examples of each class of DMR and part C has been modified for visual consistency with part A.</p><p>Reviewer #3 major concerns:</p><p><italic>The authors point out that their ultimate goal is to connect imprinting polymorphisms to seed phenotypes. That is a difficult task, but that connection is not made in this manuscript. The Abstract includes the prediction that natural epialleles are likely to exert their strongest effect on plant development during the reproductive phase. This claim is intriguing, but drawing this conclusion from the data presented is difficult as the imprinting variation noted has not been connected to developmental phenotypes</italic>.</p><p>We have tried to clarify in the Abstract and text that what we have shown is an expression phenotype. We are careful not to claim a developmental phenotype beyond speculating that this is a possible outcome of the expression phenotype we observed.</p><p><italic>Short of making that connection, the results could be extended by investigating in more detail other allele-specific imprinted loci involving transposable elements (currently 3 of 6 are studied in more detail). 
In addition, the strength of the prediction about variable imprinting behavior could be explored by looking at more examples of intraspecific crosses with hypomethylated loci corresponding to PEGs in other interstrain crosses</italic>.</p><p>As detailed above, in the revised version we have further validated allele-specific imprinting for four genes and demonstrated that all of the TEs associated with allele-specific imprinted genes are present at the same genomic location in all three strains.</p><p><italic>The question of whether the differences in DNA methylation are caused by genetic polymorphisms or not is addressed briefly in the text and</italic> <xref ref-type="fig" rid="fig6s3"><italic>Figure 6–figure supplement 3</italic></xref><italic>. This important point needs more consideration in the Discussion</italic>.</p><p>As suggested in the summary review statement above, we have focused on methylation variation being causal for differences in imprinting rather than focusing on whether or not this variation is purely epigenetic or whether it has a genetic basis.</p><p>[Editors’ note: the author responses to the previous round of peer review follow.]</p><p>We thank the reviewers for their careful review of the original submission. We have significantly strengthened and extended the manuscript’s conclusions by addressing the reviewers’ comments. 
The following major changes have been made: we have estimated how widespread allele-specific imprinting might be by analyzing methylation variation at the population scale for regions targeted for endosperm demethylation (<xref ref-type="fig" rid="fig7">Figure 7</xref>), predicted and confirmed an additional example of allele-specific imprinting based on this analysis (<xref ref-type="fig" rid="fig6s2">Figure 6–figure supplement 2</xref>), performed additional analyses on the allele-specific imprinted gene <italic>HDG3</italic> (<xref ref-type="fig" rid="fig6">Figure 6</xref>), and performed three endosperm RNA-seq replicates for each set of reciprocal crosses (<xref ref-type="fig" rid="fig1">Figure 1</xref>, <xref ref-type="supplementary-material" rid="SD3-data">Figure 1–source data 3</xref>). The Results section has been reorganized for greater clarity and the Introduction and Abstract revised to better reflect the aims and conclusions of our study.</p><p>Detailed responses to each reviewer’s comments follow.</p><p>Reviewer 1:</p><p><italic>Substantive concerns</italic>:</p><p><italic>The authors directly compared expression pattern and DNA methylation in six combinations of inter-accession crosses. They found intraspecific variation in imprinting associated with variation in DNA methylation. The most interesting observation is, however, that the Cvi accession is unique for its big seed phenotype, which is seen when Cvi is the female parent. Cvi is also unique in the low CpG methylation level in gene bodies. The Cvi-specific seed phenotype might be due to Cvi-specific variation in epigenetic state of imprinted gene(s). This very interesting possibility should be proven by identifying the gene(s) responsible for the seed phenotype. 
If substantiated through the action of specific gene(s), this would greatly elevate the work</italic>.</p><p>We have uncovered interesting candidate genes that have the potential to contribute to seed size, including genes that are differentially expressed when Cvi is the male or female parent and genes, such as <italic>HDG3</italic>, that are differentially imprinted between Cvi and other strains. We have not made an explicit analysis of their connection to seed phenotype for two reasons:</p><p>1) Alonso-Blanco et al (PNAS, 1999) performed QTL mapping of seed size differences between Ler and Cvi and discovered 11 significant loci. The fact that seed size is not a single locus trait means that uncovering the network of genes that contribute to differences, regardless of whether or not they are imprinted, will be a considerable undertaking and thus the subject of a different study.</p><p>2) The primary aim of our study was not to determine what genes are responsible for making Cvi seeds larger than Col or Ler seeds, but to understand whether or not variation existed in the population for gene imprinting, and if it did whether this might be due to epigenetic differences between strains. We believe we have demonstrated that this variation exists.</p><p>Reviewer 2:</p><p><italic>Substantive concerns</italic>:</p><p><italic>Pignatta and colleagues analyzed gene imprinting in crosses of three different accessions of</italic> A. thaliana <italic>(Col-0, Ler and Cvi) and its link to changes in TE and small RNA composition as well as DNA methylation. These specific accessions were chosen because of their differences in seed size and their degree of genetic divergence</italic>.</p><p><italic>The authors identified 420 maternally and 159 paternally expressed genes. DNA methylation analysis revealed differentially methylated regions (DMRs) that were in most parts either specific for comparisons between accessions or for comparisons between endosperm and embryo. 
The authors identified three imprinted genes that were associated with DMRs (endosperm-embryo as well as across-accession comparisons). These genes were P/MEGs depending on the epigenetic configuration of the parents and are thus examples of epiallele-specific imprinted genes</italic>.</p><p><italic>The authors address the interesting question if and how variations in the epigenetic configuration of the parents influence seed and embryo development through variations in imprinting. The authors have chosen an adequate model to address this question and have employed a broad spectrum of analyses. Unfortunately, the study suffers from weaknesses with regard to the technical and statistical procedures; furthermore the conclusions drawn by the authors are not entirely supported by the experimental evidence. In my view, with only three examples of epialleles influencing imprinting in the endosperm/embryo, the validity of extrapolating the results is not provided. The authors state that</italic>:</p><p><italic>“Given the epigenetic diversity present within the species, we extrapolate that allele-specific imprinting will be widespread.” Cvi is the most highly differentially methylated</italic> A. thaliana <italic>accession analyzed to date (</italic><xref ref-type="bibr" rid="bib44"><italic>Schmitz et al., 2013</italic></xref><italic>). If only three epialleles with effect on imprinting could be found in a comparison with this outlier strain, it is questionable that the effect is actually widespread</italic>.</p><p>We disagree that Cvi is an outlier or anomalous strain with regard to imprinting and thus the source of the maximal number of allele-specific imprinted genes. First, our data show that of the 12 allele-specific imprinted genes we identified, 5 are variable in Cvi and 7 are variable in Ler (<xref ref-type="supplementary-material" rid="SD6-data">Figure 2–source data 1</xref>). 
4 of the Cvi genes and 6 of the Ler genes are associated with an embryo-endosperm DMR that is variably methylated among the Col, Ler, and Cvi strains. We further focus on three genes, AT2G32370 (not imprinted in Cvi), AT3G14205 (not imprinted in Cvi), and AT2G34890 (not imprinted in Ler). Thus the phenomenon of allele-specific imprinting is not restricted to Cvi.</p><p>Second, to convince the reviewer of our assertion, in the revision we directly addressed how widespread allelic variation in imprinting might be. To this end we took the set of embryo-endosperm CG DMRs we found in any of our comparisons (the union) and queried these regions against the Ecker whole genome BS-seq data from 140 strains for which vegetative methylation patterns are known (Schmitz et al, Nature, 2013). We determined how variably methylated these regions were among all strains with sufficient BS-seq data (<xref ref-type="fig" rid="fig7">Figure 7</xref>). Many of the DMRs (41%) show little variability in DNA methylation within the population – we define these as very low range DMRs (less than 0.2 mean methylation difference across all strains) and low range (between 0.2 and 0.4 mean methylation difference across all strains). For example, the endosperm DMR at <italic>FWA</italic> falls into this category; it is highly methylated in all strains.</p><p>Imprinted genes associated with invariable DMRs are likely to be targeted for demethylation, and imprinted, in all strains. However, we also find bimodal DMRs, with clustering of mean methylation towards one end of the spectrum, but with one or a few clear outliers. We define these as strong (n=1654) and weak (n=1545). Of the shared endosperm and strain CG DMRs associated with 8 allele-specific imprinted genes, 6 are in the strong or weak bimodal category, including those at AT2G32370 and AT3G14205 (<xref ref-type="supplementary-material" rid="SD6-data">Figure 2–source data 1</xref> and <xref ref-type="fig" rid="fig7">Figure 7B</xref>). 
We further show that of the union set of imprinted genes we identified in this study (n=388), 27 MEGs and 17 PEGs, including 4 PEGs we find as exhibiting allele-specific imprinting among Col, Ler, and Cvi, are associated with DMRs that are strongly bimodal for methylation within the population. This would represent the maximal number of allele-specific imprinted genes, approximately 11% of all imprinted genes. Our genome-wide analysis identified another strain, in addition to Cvi, where the DMR at AT3G14205 was hypomethylated. We showed that reciprocal crosses with this strain also exhibit allele-specific imprinting (<xref ref-type="fig" rid="fig6s2">Figure 6–figure supplement 2</xref>).</p><p><italic>On the technical side, I mainly criticize the low coverage of the BS-seq experiments, which to my opinion do not provide enough information for the performed analyses; and the RNA-seq experimental setup with essentially no replication</italic>.</p><p>To identify embryo-endosperm differentially methylated regions (DMRs), we only compared regions of the genome where we had sufficient coverage. In the revised version we show that the DMRs we identified were consistent with previous studies (<xref ref-type="bibr" rid="bib11">Gehring et al 2009</xref>; <xref ref-type="bibr" rid="bib23">Ibarra et al 2012</xref>, comparison in <xref ref-type="fig" rid="fig4s5">Figure 4–figure supplement 5</xref>). In the revised version, we used our analysis method to identify DMRs from the <xref ref-type="bibr" rid="bib23">Ibarra et al (2012)</xref> Col x Ler and Ler x Col embryo and endosperm BS-seq data (from tissue isolated at 7-8 DAP). 
These DMRs are now included in the analyses of the relationship between DNA demethylation and imprinting at several points (<xref ref-type="supplementary-material" rid="SD6-data">Figure 2–source data 1</xref>, <xref ref-type="fig" rid="fig4s2">Figure 4–figure supplement 2</xref>, and <xref ref-type="fig" rid="fig7">Figure 7B</xref>).</p><p>We agree that our endosperm BS coverage is low. Our intent was not to identify all differentially methylated regions between embryo and endosperm. Rather, we wanted to know whether regions targeted for demethylation in the endosperm were ever variably methylated among strains, which we have shown (to identify strain-DMRs between Col, Ler, and Cvi we used the embryo data, where our coverage was much better). Despite our repeated efforts at optimization and considerable sequencing, the same starting amount of endosperm gDNA did not make a BS-seq library as diverse as embryo gDNA collected and treated at the exact same time; most endosperm BS-seq reads were discarded because they were redundant (mapped to same start position).</p><p><italic>The design of the mRNA-seq experiment is questionable. While two replicates were used for the Col-Cvi reciprocal crosses, there is only one for the respective Ler-Cvi crosses. For Col-Ler, the authors combined newly generated data with a previously published dataset (</italic><xref ref-type="bibr" rid="bib13"><italic>Gehring et al., 2011</italic></xref><italic>). Not only does this mean that these crosses were done at completely different time points, the experiment also lacks the necessary replicates</italic>. <italic>In addition, the authors combined the reads of different replicates before doing the analysis. I recommend that at least three biological replicates should be used to gain enough statistical power for the confident detection of allele-specific gene expression. 
On a related note, I also wonder why the authors did not use long reads to increase their chances of allele-specific mapping of the reads?</italic></p><p>As suggested by the reviewers, we have now included three endosperm biological replicates for each of the crosses used to identify imprinted genes. The additional RNA-seq libraries were sequenced using 80 bp reads. We no longer combine read counts or include our 2011 data. To call a gene imprinted in a particular set of reciprocal crosses (Col-Ler, Col-Cvi, or Ler-Cvi) it had to meet all of our criteria for imprinting in at least two of the three replicate sets. We chose to use two of three rather than three of three because of variability in the sequencing depth of our libraries. In the revised version we have also validated the mRNA-seq data by using the MiSeq platform; we isolated 2 additional endosperm biological replicates for each set of reciprocal crosses and one additional embryo and performed RT-PCR for 25 genes from these sets and sequenced the PCR amplicons. The results agreed quite well with the mRNA-seq data (see <xref ref-type="supplementary-material" rid="SD5-data">Figure 1–source data 5</xref>).</p><p><italic>The coverage obtained by BS-sequencing is very low! The Col-0 endosperm sample has 1,7 million reads, which results in a theoretical coverage of 0.5 x genome-wide. There are less than 1 million cytosines sufficiently covered in these samples and I doubt that this allows a representative and unbiased representation of the genome-wide DNA methylation</italic>.</p><p>We agree that the Col-0 endosperm coverage is very low; therefore it also contributed few reads to the overall analysis compared to the many more reads derived from other libraries. It was never used as a stand-alone dataset to draw broad conclusions on genome-wide methylation or DMRs.</p></body></sub-article></article>