Permalink
Switch branches/tags
Nothing to show
Find file
Fetching contributors…
Cannot retrieve contributors at this time
1 lines (1 sloc) 157 KB
<?xml version="1.0" encoding="UTF-8"?><!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Archiving and Interchange DTD v1.1d1 20130915//EN" "JATS-archivearticle1.dtd"><article article-type="research-article" dtd-version="1.1d1" xmlns:xlink="http://www.w3.org/1999/xlink"><front><journal-meta><journal-id journal-id-type="nlm-ta">elife</journal-id><journal-id journal-id-type="hwp">eLife</journal-id><journal-id journal-id-type="publisher-id">eLife</journal-id><journal-title-group><journal-title>eLife</journal-title></journal-title-group><issn publication-format="electronic">2050-084X</issn><publisher><publisher-name>eLife Sciences Publications, Ltd</publisher-name></publisher></journal-meta><article-meta><article-id pub-id-type="publisher-id">02105</article-id><article-id pub-id-type="doi">10.7554/eLife.02105</article-id><article-categories><subj-group subj-group-type="display-channel"><subject>Short report</subject></subj-group><subj-group subj-group-type="heading"><subject>Genes and chromosomes</subject></subj-group><subj-group subj-group-type="heading"><subject>Genomics and evolutionary biology</subject></subj-group></article-categories><title-group><article-title>Tyrosine phosphorylation of RNA polymerase II CTD is associated with antisense promoter transcription and active enhancers in mammalian cells</article-title></title-group><contrib-group><contrib contrib-type="author" equal-contrib="yes" id="author-9814"><name><surname>Descostes</surname><given-names>Nicolas</given-names></name><xref ref-type="aff" rid="aff1"/><xref ref-type="aff" rid="aff2"/><xref ref-type="aff" rid="aff5"/><xref ref-type="aff" rid="aff6"/><xref ref-type="fn" rid="equal-contrib">†</xref><xref ref-type="other" rid="par-4"/><xref ref-type="fn" rid="con1"/><xref ref-type="fn" rid="conf1"/><xref ref-type="other" rid="dataro1"/><xref ref-type="other" rid="dataro2"/><xref ref-type="other" rid="dataro3"/><xref ref-type="other" rid="dataro4"/><xref ref-type="other" rid="dataro5"/><xref 
ref-type="other" rid="dataro6"/><xref ref-type="other" rid="dataro7"/><xref ref-type="other" rid="dataro8"/><xref ref-type="other" rid="dataro9"/><xref ref-type="other" rid="dataro10"/><xref ref-type="other" rid="dataro11"/><xref ref-type="other" rid="dataro12"/></contrib><contrib contrib-type="author" equal-contrib="yes" id="author-9994"><name><surname>Heidemann</surname><given-names>Martin</given-names></name><xref ref-type="aff" rid="aff3"/><xref ref-type="fn" rid="equal-contrib">†</xref><xref ref-type="other" rid="par-5"/><xref ref-type="fn" rid="con2"/><xref ref-type="fn" rid="conf1"/><xref ref-type="other" rid="dataro1"/><xref ref-type="other" rid="dataro2"/><xref ref-type="other" rid="dataro3"/><xref ref-type="other" rid="dataro4"/><xref ref-type="other" rid="dataro5"/><xref ref-type="other" rid="dataro6"/><xref ref-type="other" rid="dataro7"/><xref ref-type="other" rid="dataro8"/><xref ref-type="other" rid="dataro9"/><xref ref-type="other" rid="dataro10"/><xref ref-type="other" rid="dataro11"/><xref ref-type="other" rid="dataro12"/></contrib><contrib contrib-type="author" id="author-9995"><name><surname>Spinelli</surname><given-names>Lionel</given-names></name><xref ref-type="aff" rid="aff1"/><xref ref-type="aff" rid="aff2"/><xref ref-type="aff" rid="aff5"/><xref ref-type="other" rid="par-1"/><xref ref-type="fn" rid="con3"/><xref ref-type="fn" rid="conf1"/><xref ref-type="other" rid="dataro1"/><xref ref-type="other" rid="dataro2"/><xref ref-type="other" rid="dataro3"/><xref ref-type="other" rid="dataro4"/><xref ref-type="other" rid="dataro5"/><xref ref-type="other" rid="dataro6"/><xref ref-type="other" rid="dataro7"/><xref ref-type="other" rid="dataro8"/><xref ref-type="other" rid="dataro9"/><xref ref-type="other" rid="dataro10"/><xref ref-type="other" rid="dataro11"/><xref ref-type="other" rid="dataro12"/></contrib><contrib contrib-type="author" id="author-10007"><name><surname>Schüller</surname><given-names>Roland</given-names></name><xref ref-type="aff" 
rid="aff3"/><xref ref-type="other" rid="par-5"/><xref ref-type="fn" rid="con4"/><xref ref-type="fn" rid="conf1"/><xref ref-type="other" rid="dataro1"/><xref ref-type="other" rid="dataro2"/><xref ref-type="other" rid="dataro3"/><xref ref-type="other" rid="dataro4"/><xref ref-type="other" rid="dataro5"/><xref ref-type="other" rid="dataro6"/><xref ref-type="other" rid="dataro7"/><xref ref-type="other" rid="dataro8"/><xref ref-type="other" rid="dataro9"/><xref ref-type="other" rid="dataro10"/><xref ref-type="other" rid="dataro11"/><xref ref-type="other" rid="dataro12"/></contrib><contrib contrib-type="author" id="author-9997"><name><surname>Maqbool</surname><given-names>Muhammad Ahmad</given-names></name><xref ref-type="aff" rid="aff1"/><xref ref-type="aff" rid="aff2"/><xref ref-type="aff" rid="aff5"/><xref ref-type="aff" rid="aff6"/><xref ref-type="other" rid="par-1"/><xref ref-type="fn" rid="con5"/><xref ref-type="fn" rid="conf1"/><xref ref-type="other" rid="dataro1"/><xref ref-type="other" rid="dataro2"/><xref ref-type="other" rid="dataro3"/><xref ref-type="other" rid="dataro4"/><xref ref-type="other" rid="dataro5"/><xref ref-type="other" rid="dataro6"/><xref ref-type="other" rid="dataro7"/><xref ref-type="other" rid="dataro8"/><xref ref-type="other" rid="dataro9"/><xref ref-type="other" rid="dataro10"/><xref ref-type="other" rid="dataro11"/><xref ref-type="other" rid="dataro12"/></contrib><contrib contrib-type="author" id="author-9998"><name><surname>Fenouil</surname><given-names>Romain</given-names></name><xref ref-type="aff" rid="aff1"/><xref ref-type="aff" rid="aff2"/><xref ref-type="aff" rid="aff5"/><xref ref-type="other" rid="par-2"/><xref ref-type="fn" rid="con6"/><xref ref-type="fn" rid="conf1"/><xref ref-type="other" rid="dataro1"/><xref ref-type="other" rid="dataro2"/><xref ref-type="other" rid="dataro3"/><xref ref-type="other" rid="dataro4"/><xref ref-type="other" rid="dataro5"/><xref ref-type="other" rid="dataro6"/><xref ref-type="other" 
rid="dataro7"/><xref ref-type="other" rid="dataro8"/><xref ref-type="other" rid="dataro9"/><xref ref-type="other" rid="dataro10"/><xref ref-type="other" rid="dataro11"/><xref ref-type="other" rid="dataro12"/></contrib><contrib contrib-type="author" id="author-9999"><name><surname>Koch</surname><given-names>Frederic</given-names></name><xref ref-type="aff" rid="aff1"/><xref ref-type="aff" rid="aff2"/><xref ref-type="aff" rid="aff5"/><xref ref-type="fn" rid="con7"/><xref ref-type="fn" rid="conf1"/><xref ref-type="other" rid="dataro1"/><xref ref-type="other" rid="dataro2"/><xref ref-type="other" rid="dataro3"/><xref ref-type="other" rid="dataro4"/><xref ref-type="other" rid="dataro5"/><xref ref-type="other" rid="dataro6"/><xref ref-type="other" rid="dataro7"/><xref ref-type="other" rid="dataro8"/><xref ref-type="other" rid="dataro9"/><xref ref-type="other" rid="dataro10"/><xref ref-type="other" rid="dataro11"/><xref ref-type="other" rid="dataro12"/></contrib><contrib contrib-type="author" id="author-10000"><name><surname>Innocenti</surname><given-names>Charlène</given-names></name><xref ref-type="aff" rid="aff1"/><xref ref-type="aff" rid="aff2"/><xref ref-type="aff" rid="aff5"/><xref ref-type="other" rid="par-3"/><xref ref-type="fn" rid="con8"/><xref ref-type="fn" rid="conf1"/><xref ref-type="other" rid="dataro1"/><xref ref-type="other" rid="dataro2"/><xref ref-type="other" rid="dataro3"/><xref ref-type="other" rid="dataro4"/><xref ref-type="other" rid="dataro5"/><xref ref-type="other" rid="dataro6"/><xref ref-type="other" rid="dataro7"/><xref ref-type="other" rid="dataro8"/><xref ref-type="other" rid="dataro9"/><xref ref-type="other" rid="dataro10"/><xref ref-type="other" rid="dataro11"/><xref ref-type="other" rid="dataro12"/></contrib><contrib contrib-type="author" id="author-10001"><name><surname>Gut</surname><given-names>Marta</given-names></name><xref ref-type="aff" rid="aff4"/><xref ref-type="fn" rid="con9"/><xref ref-type="fn" rid="conf1"/><xref 
ref-type="other" rid="dataro1"/><xref ref-type="other" rid="dataro2"/><xref ref-type="other" rid="dataro3"/><xref ref-type="other" rid="dataro4"/><xref ref-type="other" rid="dataro5"/><xref ref-type="other" rid="dataro6"/><xref ref-type="other" rid="dataro7"/><xref ref-type="other" rid="dataro8"/><xref ref-type="other" rid="dataro9"/><xref ref-type="other" rid="dataro10"/><xref ref-type="other" rid="dataro11"/><xref ref-type="other" rid="dataro12"/></contrib><contrib contrib-type="author" id="author-10002"><name><surname>Gut</surname><given-names>Ivo</given-names></name><xref ref-type="aff" rid="aff4"/><xref ref-type="fn" rid="con10"/><xref ref-type="fn" rid="conf1"/><xref ref-type="other" rid="dataro1"/><xref ref-type="other" rid="dataro2"/><xref ref-type="other" rid="dataro3"/><xref ref-type="other" rid="dataro4"/><xref ref-type="other" rid="dataro5"/><xref ref-type="other" rid="dataro6"/><xref ref-type="other" rid="dataro7"/><xref ref-type="other" rid="dataro8"/><xref ref-type="other" rid="dataro9"/><xref ref-type="other" rid="dataro10"/><xref ref-type="other" rid="dataro11"/><xref ref-type="other" rid="dataro12"/></contrib><contrib contrib-type="author" corresp="yes" id="author-10005"><name><surname>Eick</surname><given-names>Dirk</given-names></name><xref ref-type="aff" rid="aff3"/><xref ref-type="corresp" rid="cor1">*</xref><xref ref-type="other" rid="par-5"/><xref ref-type="fn" rid="con11"/><xref ref-type="fn" rid="conf1"/><xref ref-type="other" rid="dataro1"/><xref ref-type="other" rid="dataro2"/><xref ref-type="other" rid="dataro3"/><xref ref-type="other" rid="dataro4"/><xref ref-type="other" rid="dataro5"/><xref ref-type="other" rid="dataro6"/><xref ref-type="other" rid="dataro7"/><xref ref-type="other" rid="dataro8"/><xref ref-type="other" rid="dataro9"/><xref ref-type="other" rid="dataro10"/><xref ref-type="other" rid="dataro11"/><xref ref-type="other" rid="dataro12"/></contrib><contrib contrib-type="author" corresp="yes" 
id="author-12581"><name><surname>Andrau</surname><given-names>Jean-Christophe</given-names></name><xref ref-type="aff" rid="aff1"/><xref ref-type="aff" rid="aff2"/><xref ref-type="aff" rid="aff5"/><xref ref-type="aff" rid="aff6"/><xref ref-type="corresp" rid="cor2">*</xref><xref ref-type="fn" rid="con12"/><xref ref-type="fn" rid="conf1"/><xref ref-type="other" rid="dataro1"/><xref ref-type="other" rid="dataro2"/><xref ref-type="other" rid="dataro3"/><xref ref-type="other" rid="dataro4"/><xref ref-type="other" rid="dataro5"/><xref ref-type="other" rid="dataro6"/><xref ref-type="other" rid="dataro7"/><xref ref-type="other" rid="dataro8"/><xref ref-type="other" rid="dataro9"/><xref ref-type="other" rid="dataro10"/><xref ref-type="other" rid="dataro11"/><xref ref-type="other" rid="dataro12"/></contrib><aff id="aff1"><institution content-type="dept">Centre d'Immunologie de Marseille-Luminy</institution>, <institution>Université Aix-Marseille</institution>, <addr-line><named-content content-type="city">Marseille</named-content></addr-line>, <country>France</country></aff><aff id="aff2"><institution>Centre National de la Recherche Scientifique (CNRS) UMR6102</institution>, <addr-line><named-content content-type="city">Marseille</named-content></addr-line>, <country>France</country></aff><aff id="aff3"><institution content-type="dept">Department of Molecular Epigenetics</institution>, <institution>Helmholtz Center Munich, Center of Integrated Protein Science Munich</institution>, <addr-line><named-content content-type="city">Munich</named-content></addr-line>, <country>Germany</country></aff><aff id="aff4"><institution>Centre Nacional D'Anàlisi Genòmica</institution>, <addr-line><named-content content-type="city">Barcelona</named-content></addr-line>, <country>Spain</country></aff><aff id="aff5"><institution>Inserm U631</institution>, <addr-line><named-content content-type="city">Marseille</named-content></addr-line>, <country>France</country></aff><aff 
id="aff6"><institution>Institut de Génétique Moléculaire de Montpellier (IGMM), CNRS-UMR5535</institution>, <addr-line><named-content content-type="city">Montpellier</named-content></addr-line>, <country>France</country></aff></contrib-group><contrib-group content-type="section"><contrib contrib-type="editor"><name><surname>Reinberg</surname><given-names>Danny</given-names></name><role>Reviewing editor</role><aff><institution>Howard Hughes Medical Institute, New York University School of Medicine</institution>, <country>United States</country></aff></contrib></contrib-group><author-notes><corresp id="cor1"><label>*</label>For correspondence: <email>eick@helmholtz-muenchen.de</email> (DE);</corresp><corresp id="cor2"><label>*</label>For correspondence: <email>jean-christophe.andrau@igmm.cnrs.fr</email> (J-CA)</corresp><fn fn-type="con" id="equal-contrib"><label>†</label><p>These authors contributed equally to this work</p></fn></author-notes><pub-date date-type="pub" publication-format="electronic"><day>09</day><month>05</month><year>2014</year></pub-date><pub-date pub-type="collection"><year>2014</year></pub-date><volume>3</volume><elocation-id>e02105</elocation-id><history><date date-type="received"><day>17</day><month>12</month><year>2013</year></date><date date-type="accepted"><day>08</day><month>05</month><year>2014</year></date></history><permissions><copyright-statement>© 2014, Descostes et al</copyright-statement><copyright-year>2014</copyright-year><copyright-holder>Descostes et al</copyright-holder><license xlink:href="http://creativecommons.org/licenses/by/3.0/"><license-p>This article is distributed under the terms of the <ext-link ext-link-type="uri" xlink:href="http://creativecommons.org/licenses/by/3.0/">Creative Commons Attribution License</ext-link>, which permits unrestricted use and redistribution provided that the original author and source are credited.</license-p></license></permissions><self-uri content-type="pdf" 
xlink:href="elife02105.pdf"/><related-article ext-link-type="doi" id="ra1" related-article-type="article-reference" xlink:href="10.7554/eLife.02112"/><abstract><object-id pub-id-type="doi">10.7554/eLife.02105.001</object-id><p>In mammals, the carboxy-terminal domain (CTD) of RNA polymerase (Pol) II consists of 52 conserved heptapeptide repeats containing the consensus sequence Tyr1-Ser2-Pro3-Thr4-Ser5-Pro6-Ser7. Post-translational modifications of the CTD coordinate the transcription cycle and various steps of mRNA maturation. Here we describe Tyr1 phosphorylation (Tyr1P) as a hallmark of promoter (5′ associated) Pol II in mammalian cells, in contrast to what was described in yeast. Tyr1P is predominantly found in antisense orientation at promoters but is also specifically enriched at active enhancers. Mutation of Tyr1 to phenylalanine (Y1F) prevents the formation of the hyper-phosphorylated Pol IIO form, induces degradation of Pol II to the truncated Pol IIB form, and results in a lethal phenotype. Our results suggest that Tyr1P has evolved specialized and essential functions in higher eukaryotes associated with antisense promoter and enhancer transcription, and Pol II stability.</p><p><bold>DOI:</bold> <ext-link ext-link-type="doi" xlink:href="10.7554/eLife.02105.001">http://dx.doi.org/10.7554/eLife.02105.001</ext-link></p></abstract><abstract abstract-type="executive-summary"><object-id pub-id-type="doi">10.7554/eLife.02105.002</object-id><title>eLife digest</title><p>When a gene is expressed, the DNA is first transcribed to produce an intermediate molecule called a messenger RNA (mRNA), which is then translated to produce a protein. RNA Polymerase II is an enzyme that makes mRNA molecules in organisms as diverse as plants, animals, and yeast.</p><p>RNA Polymerase II is a complex made of a number of proteins. The largest protein in this complex includes a ‘carboxy-terminal domain’ that has multiple repeats of seven amino acids one after the other. 
The first amino acid in each repeat, a tyrosine, is referred to as tyrosine-1. Adding various chemical tags to the amino acids in these repeats co-ordinates the steps involved in the transcription of genes. In yeast, for example, adding a phosphate group to tyrosine-1 seems to help the polymerase to proceed to make long mRNA molecules. However, it is not known what these chemical tags do in humans or other animals.</p><p>Now Descostes, Heidemann et al. (and independently Hsin et al.) have shown that the same phosphate groups on tyrosine-1 perform functions in vertebrates (animals with backbones) that are different to those performed in yeast. These functions include protecting the carboxy-terminal domain from being broken down inside cells, and transcribing the DNA that is upstream of genes.</p><p>Descostes, Heidemann et al. found that in human cells, RNA Polymerase II with phosphate groups on tyrosine-1 tends to bind to the beginning of genes. However, rather than moving along each gene and transcribing it, the polymerase then moves in the opposite (or ‘antisense’) direction to transcribe the DNA that is upstream of the gene. In most cases, however, the transcription of these ‘upstream antisense RNAs’ does not make a functional RNA molecule and transcription is paused. Furthermore, Descostes, Heidemann et al. found that when RNA Polymerase II that is not tagged with these phosphate groups is degraded in human cells, these cells rapidly die.</p><p>Descostes, Heidemann et al. also found that RNA Polymerase II with phosphate tags on tyrosine-1 also binds to, and transcribes, sections of DNA called ‘enhancers’, which are outside of the genes but that help to activate nearby genes. 
Importantly, these transcribed enhancers are those that work to define the type of cell and tissue—for example a white blood cell—that any given cell will become.</p><p>Future studies should help to answer remaining questions such as: how do these chemical tags affect the transcription of genes that are specific to certain tissue types? And do these tags on RNA Polymerase II help to direct cells to become specific cell types?</p><p><bold>DOI:</bold> <ext-link ext-link-type="doi" xlink:href="10.7554/eLife.02105.002">http://dx.doi.org/10.7554/eLife.02105.002</ext-link></p></abstract><kwd-group kwd-group-type="author-keywords"><title>Author keywords</title><kwd>RNA polymerase II</kwd><kwd>carboxyl terminal domain</kwd><kwd>antisense transcription</kwd><kwd>enhancers</kwd><kwd>initiation</kwd><kwd>transcription</kwd></kwd-group><kwd-group kwd-group-type="research-organism"><title>Research organism</title><kwd>human</kwd></kwd-group><funding-group><award-group id="par-1"><funding-source><institution-wrap><institution-id institution-id-type="FundRef">http://dx.doi.org/10.13039/501100001665</institution-id><institution>Agence Nationale de la Recherche</institution></institution-wrap></funding-source><principal-award-recipient><name><surname>Spinelli</surname><given-names>Lionel</given-names></name><name><surname>Maqbool</surname><given-names>Muhammad Ahmad</given-names></name></principal-award-recipient></award-group><award-group id="par-2"><funding-source><institution-wrap><institution>Centre National de la Recherche Scientifique</institution></institution-wrap></funding-source><principal-award-recipient><name><surname>Fenouil</surname><given-names>Romain</given-names></name></principal-award-recipient></award-group><award-group 
id="par-3"><funding-source><institution-wrap><institution>FRM</institution></institution-wrap></funding-source><principal-award-recipient><name><surname>Innocenti</surname><given-names>Charlène</given-names></name></principal-award-recipient></award-group><award-group id="par-4"><funding-source><institution-wrap><institution>Ministère de la Recherche/Ligue Nationale contre le Cancer</institution></institution-wrap></funding-source><principal-award-recipient><name><surname>Descostes</surname><given-names>Nicolas</given-names></name></principal-award-recipient></award-group><award-group id="par-5"><funding-source><institution-wrap><institution-id institution-id-type="FundRef">http://dx.doi.org/10.13039/501100001659</institution-id><institution>Deutsche Forschungsgemeinschaft</institution></institution-wrap></funding-source><award-id>SFB1064 and SFB684</award-id><principal-award-recipient><name><surname>Heidemann</surname><given-names>Martin</given-names></name><name><surname>Schüller</surname><given-names>Roland</given-names></name><name><surname>Eick</surname><given-names>Dirk</given-names></name></principal-award-recipient></award-group><funding-statement>The funders had no role in study design, data collection and interpretation, or the decision to submit the work for publication.</funding-statement></funding-group><custom-meta-group><custom-meta><meta-name>elife-xml-version</meta-name><meta-value>2</meta-value></custom-meta><custom-meta specific-use="meta-only"><meta-name>Author impact statement</meta-name><meta-value>Genome-wide analysis reveals novel functions for a post-translational modification to the carboxy-terminal domain (CTD) of RNA Polymerase II in mammals.</meta-value></custom-meta></custom-meta-group></article-meta></front><body><sec id="s1" sec-type="intro"><title>Introduction</title><p>The activity of RNA Polymerase (Pol) II is responsible for transcription of mRNAs and many noncoding RNAs. 
Essential for Pol II function is the carboxy-terminal domain (CTD) of its largest subunit Rpb1 that consists of a highly conserved YSPTSPS heptad repetition (<xref ref-type="bibr" rid="bib2">Buratowski, 2009</xref>; <xref ref-type="bibr" rid="bib13">Heidemann et al., 2012</xref>). Post-translational modifications (PTMs) of the CTD coordinate both transcription cycle transitions and loading of RNA processing complexes. In recent years, novel PTMs were described in addition to the well-known Ser5P and Ser2P associated with early transcription and elongation, respectively. These include Ser7P, involved in snRNA gene transcription (<xref ref-type="bibr" rid="bib4">Chapman et al., 2007</xref>; <xref ref-type="bibr" rid="bib9">Egloff et al., 2007</xref>), Thr4P associated with transcription elongation in mammals (<xref ref-type="bibr" rid="bib14">Hintermair et al., 2012</xref>) and with histone gene transcription in chicken (<xref ref-type="bibr" rid="bib15">Hsin et al., 2011</xref>), and Tyr1P that in yeast is found at gene body locations, consistent with a role in transcription elongation (<xref ref-type="bibr" rid="bib21">Mayer et al., 2012</xref>). This latter modification remains, however, so far uncharacterized in mammalian cells, and we aimed at deciphering its function in human cells using biochemical and genome-wide approaches.</p></sec><sec id="s2" sec-type="results|discussion"><title>Results and discussion</title><p>To analyze expression and pattern of Tyr1P modified Pol II, we took advantage of our previously developed Tyr1P specific antibodies (3D12) (<xref ref-type="bibr" rid="bib21">Mayer et al., 2012</xref>). We investigated various mouse and human cells and could detect Tyr1P in western blots for all examined lines, in most cases associated with the hyper-phosphorylated IIO form of Pol II (<xref ref-type="fig" rid="fig1s1">Figure 1—figure supplement 1</xref>). 
To address the function of Tyr1P, we next generated Raji cell lines expressing Pol II resistant to α-amanitin (<xref ref-type="bibr" rid="bib3">Chapman et al., 2004</xref>) and carrying either wild-type (WT) or a mutant Rpb1 gene with substitution of tyrosine to phenylalanine (Y1F) in CTD repeats 4 to 51 (<xref ref-type="fig" rid="fig1s2">Figure 1—figure supplement 2</xref>). After expression of the mutant, we observed that Y1F yielded a truncated Rpb1 (Pol IIB, <xref ref-type="fig" rid="fig1">Figure 1A</xref>) and was unable to form the hyper-phosphorylated IIO Pol II. After disruption of the activity of endogenous Pol II by α-amanitin (<xref ref-type="fig" rid="fig1">Figure 1B</xref>) and soon after disappearance of WT Rpb1, cells became rapidly inviable. This phenotype reveals an essential function of the Y1 residue that appears more drastic than T4A or S7A mutations, but comparable with that of S5A (<xref ref-type="bibr" rid="bib4">Chapman et al., 2007</xref>; <xref ref-type="bibr" rid="bib14">Hintermair et al., 2012</xref>). We conclude that Tyr1P very likely contributes to stabilization of CTD and may occur early within the transcription cycle.<fig-group><fig id="fig1" position="float"><object-id pub-id-type="doi">10.7554/eLife.02105.003</object-id><label>Figure 1.</label><caption><title>Y1F mutations of the CTD heptads yield a truncated Pol IIB Rpb1.</title><p>(<bold>A</bold>) Rpb1-Y1F mutant was expressed after removal of tetracycline and in the presence of endogenous Rpb1. Probing with Rpb1 Ab reveals both endogenous and recombinant Rpb1 whereas HA reveals only recombinant Y1F mutant. 
(<bold>B</bold>) Protein expression of the Y1F mutant after shut-down of endogenous Rpb1 following treatment with α-amanitin.</p><p><bold>DOI:</bold> <ext-link ext-link-type="doi" xlink:href="10.7554/eLife.02105.003">http://dx.doi.org/10.7554/eLife.02105.003</ext-link></p></caption><graphic xlink:href="elife02105f001"/></fig><fig id="fig1s1" position="float" specific-use="child-fig"><object-id pub-id-type="doi">10.7554/eLife.02105.004</object-id><label>Figure 1—figure supplement 1.</label><caption><title>Tyr1P is expressed in various human and mouse cell lines.</title><p>(<bold>A</bold>) Western blot analyses of antibody recognition in mouse and human cell lines of Rpb1, CTD (8WG16), and CTD isoforms including Tyr1P (3D12). MEF, mouse embryo fibroblasts; Raji, Burkitt-Lymphoma; U2OS, osteosarcoma cell line; HEK293, human embryonic kidney cells; H9, human embryonic stem cells; HFB, human skin fibroblasts; Neural Pre, human neural precursor cells. (<bold>B</bold>) Western blot, as in (<bold>A</bold>), showing the specificity of 3D12 in HeLa whole cell extracts over a wider range of proteins.</p><p><bold>DOI:</bold> <ext-link ext-link-type="doi" xlink:href="10.7554/eLife.02105.004">http://dx.doi.org/10.7554/eLife.02105.004</ext-link></p></caption><graphic xlink:href="elife02105fs001"/></fig><fig id="fig1s2" position="float" specific-use="child-fig"><object-id pub-id-type="doi">10.7554/eLife.02105.005</object-id><label>Figure 1—figure supplement 2.</label><caption><title>Sequence of the CTD heptads for the Tyr1 to Phe mutant (Y1F).</title><p>Amino-acid composition of the C-terminal domain of the Y1F mutant (as described in the ‘Materials and methods–Construction of the CTD Y1F mutant’) used for phenotypic and western blot analyses (<xref ref-type="fig" rid="fig1">Figure 1</xref>).</p><p><bold>DOI:</bold> <ext-link ext-link-type="doi" xlink:href="10.7554/eLife.02105.005">http://dx.doi.org/10.7554/eLife.02105.005</ext-link></p></caption><graphic 
xlink:href="elife02105fs002"/></fig></fig-group></p><p>To gain further insight into the involvement of Tyr1P in the transcription cycle, we performed co-immunoprecipitation experiments in human cells using antibodies directed against various CTD modifications reflecting 5′ transcriptionally engaged (Ser5P, Ser7P) or elongating forms (Ser2P, Thr4P) of Pol II (<xref ref-type="bibr" rid="bib4">Chapman et al., 2007</xref>; <xref ref-type="bibr" rid="bib14">Hintermair et al., 2012</xref>; <xref ref-type="bibr" rid="bib21">Mayer et al., 2012</xref>). Our experiments indicated clearly that Tyr1P co-immunoprecipitated with Ser5P and Ser7P but not Ser2P or Thr4P (<xref ref-type="fig" rid="fig2">Figure 2A</xref>). Consistently, signals for Tyr1P were observed in Ser5P and Ser7P but not in Ser2P co-immunoprecipitations. Thus, overall, these data point to an association of Tyr1P with early transcribing isoforms of human Pol II.<fig-group><fig id="fig2" position="float"><object-id pub-id-type="doi">10.7554/eLife.02105.006</object-id><label>Figure 2.</label><caption><title>CTD Tyrosine 1 is phosphorylated mainly at TSS and is dominant in antisense transcription.</title><p>(<bold>A</bold>) Co-immunoprecipitation with specific CTD isoforms in Raji B-cells reveals Tyr1P (3D12) association with Ser5P and Ser7P but not with Ser2P and Thr4P. (<bold>B</bold>) ChIP-seq example illustrating Tyr1P (3D12) association around the promoter of the RPL22L1 gene. (<bold>C</bold>) Composite average profiling of ChIP-seq data at coding genes locations for Pol II (1433 genes), Tyr1P (3D12, 2462 genes), Ser5P (1464 genes), and Ser7P (2186 genes) in Raji B-cells and based on selections described in <xref ref-type="fig" rid="fig2s1">Figure 2—figure supplement 1B</xref>. Less stringent selections with more genes gave equivalent profiling (<xref ref-type="fig" rid="fig2s4">Figure 2—figure supplement 4A</xref>). 
(<bold>D</bold>) Profiling of Pol II, Tyr1P (3D12), Ser5P, Ser7P, nucleosomes midpoint and short strand specific RNAs (ssRNAs) around TSS locations with the same selections as described in (<bold>C</bold>). (<bold>E</bold>) Boxplots on 3201 genes without outliers showing mean levels of Pol II (2986 genes), Tyr1P (2964 genes), Ser5P (2909 genes), and Ser7P (2948 genes) ChIP-seq signal on regions representing each transcription orientation. The p-values (parametric two-sided paired <italic>t</italic> test) of the difference of AS vs S signal are Pol II = 0.5, Tyr1P = 3.4 × 10<sup>−15</sup>, Ser5P = 0.6, Ser7P = 3.5 × 10<sup>−2</sup>.</p><p><bold>DOI:</bold> <ext-link ext-link-type="doi" xlink:href="10.7554/eLife.02105.006">http://dx.doi.org/10.7554/eLife.02105.006</ext-link></p></caption><graphic xlink:href="elife02105f002"/></fig><fig id="fig2s1" position="float" specific-use="child-fig"><object-id pub-id-type="doi">10.7554/eLife.02105.007</object-id><label>Figure 2—figure supplement 1.</label><caption><title>Reproducibility of ChIP-seq experiments and selection of relevant signals used for analyses.</title><p>(<bold>A</bold>) Correlation plots of biological replicates (for all but H3K36me3, which is a technical replicate) of ChIP-seq experiments used in this study at gene locations (‘Materials and methods–Correlation of biological replicates and cross-correlation’). Spearman correlation coefficient is indicated on the top left of the plots. (<bold>B</bold>) Distribution and threshold of background-subtracted signal used for profiling of significantly bound genes (Total, i.e., whole genic regions) in <xref ref-type="fig" rid="fig2">Figure 2</xref>, <xref ref-type="fig" rid="fig2s5">Figure 2—figure supplement 5A</xref>, and <xref ref-type="fig" rid="fig2s7">Figure 2—figure supplement 7C</xref>. The mean values used for distribution were computed on [TSS-1000 bp:TES+2000 bp] (TSS: transcription start site; TES: transcription end site). 
Note that the thresholds were set to the mean of the second Gaussian of the distribution (‘Materials and methods–Gene selection and average binding profiles’). Numbers of genes selected for Pol II, Ser2P, Ser5P, Ser7P, Tyr1P 3D12, and Tyr1P 8G5 are 1521, 1536, 1543, 2382, 2652, and 2608, respectively. (<bold>C</bold>) Distribution and threshold of Pol II significantly bound promoters (TSS) as in (<bold>B</bold>). The selection is used in <xref ref-type="fig" rid="fig3">Figure 3</xref>, <xref ref-type="fig" rid="fig3s1">Figure 3—figure supplement 1</xref>, and <xref ref-type="fig" rid="fig3s2">Figure 3—figure supplement 2</xref>. 2044 genes were selected based on their mean values on TSS −/+ 500 bp.</p><p><bold>DOI:</bold> <ext-link ext-link-type="doi" xlink:href="10.7554/eLife.02105.007">http://dx.doi.org/10.7554/eLife.02105.007</ext-link></p></caption><graphic xlink:href="elife02105fs003"/></fig><fig id="fig2s2" position="float" specific-use="child-fig"><object-id pub-id-type="doi">10.7554/eLife.02105.008</object-id><label>Figure 2—figure supplement 2.</label><caption><title>Pol II and CTD PTMs correlate positively with expression.</title><p>Based on microarray expression data, three groups of genes with low (L, 3414 genes), medium (M, 1238 genes), and high (H, 1007 genes) expression were used to profile Pol II isoforms and short ssRNA at promoters. (<bold>A</bold>) Heatmaps of signal densities for the three defined groups. (<bold>B</bold>) Average profiles of Pol II phospho-isoforms and ssRNA at the three defined groups. (<bold>C</bold>) Boxplots of the mean values retrieved at TSS −/+ 500 bp in the three classes for Pol II (3095, 1169, 957 genes), Tyr1P (3159, 1150, 958 genes), Ser5P (3072, 1157, 956 genes), and Ser7P (3184, 1130, 942 genes). (<bold>D</bold>) Boxplot of regions representing each transcription orientation as in <xref ref-type="fig" rid="fig2">Figure 2E</xref> for each class divided by Pol II binding values. 
The p-values (parametric two sided paired <italic>t</italic> test) are, respectively: 2.3 × 10<sup>−13</sup>; 5 × 10<sup>−4</sup>; 6 × 10<sup>−3</sup> (low), 2.4 × 10<sup>−13</sup>; 6 × 10<sup>−3</sup>; 2 × 10<sup>−4</sup> (medium), 7 × 10<sup>−6</sup>; 0.02; 0.8 (high). Represented numbers of genes are 3175, 3126, 3074, 3051, 3123, 3134 (low); 1154, 1079, 1154, 1125, 1139, 1084 (medium); 955, 930, 941, 941, 935, 913 (high).</p><p><bold>DOI:</bold> <ext-link ext-link-type="doi" xlink:href="10.7554/eLife.02105.008">http://dx.doi.org/10.7554/eLife.02105.008</ext-link></p></caption><graphic xlink:href="elife02105fs004"/></fig><fig id="fig2s3" position="float" specific-use="child-fig"><object-id pub-id-type="doi">10.7554/eLife.02105.009</object-id><label>Figure 2—figure supplement 3.</label><caption><title>Examples of Tyr1P binding patterns at genic locations.</title><p>EIF1B and SNHG8 are mainly bound by Tyr1P (3D12) at TSS as for RPL22L1 gene of <xref ref-type="fig" rid="fig2">Figure 2B</xref>.</p><p><bold>DOI:</bold> <ext-link ext-link-type="doi" xlink:href="10.7554/eLife.02105.009">http://dx.doi.org/10.7554/eLife.02105.009</ext-link></p></caption><graphic xlink:href="elife02105fs005"/></fig><fig id="fig2s4" position="float" specific-use="child-fig"><object-id pub-id-type="doi">10.7554/eLife.02105.010</object-id><label>Figure 2—figure supplement 4.</label><caption><title>Average profiling of Pol II and phospho-isoforms at genic and promoter locations using wide relaxed threshold selections.</title><p>(<bold>A</bold>) Composite and TSS focused average profiling of ChIP-seq data as in <xref ref-type="fig" rid="fig2">Figure 2C,D</xref>, for a selection threshold of 0 as described in <xref ref-type="fig" rid="fig2s1">Figure 2—figure supplement 1B</xref>, at coding genes locations for Pol II (2714 genes), Tyr1P (3D12, 2987 genes), Ser5P (2697 genes), and Ser7P (3002 genes) in Raji B-cells. 
(<bold>B</bold>) Boxplots on 4749 genes as in <xref ref-type="fig" rid="fig2">Figure 2E</xref> for the less stringent selection showing mean levels of Pol II, Tyr1P, Ser5P, and Ser7P ChIP-seq signal on regions representing each transcription orientation. The p-values (parametric two sided paired <italic>t</italic> test) of the difference of AS vs S signal are Pol II = 0.2, Tyr1p=3.5 × 10<sup>−16</sup>, Ser5p=0.2, Ser7p=0.03. Boxplots do not show outliers for Pol II (3933 genes), Tyr1P (3897 genes), Ser5P (3920 genes), and Ser7P (3878 genes).</p><p><bold>DOI:</bold> <ext-link ext-link-type="doi" xlink:href="10.7554/eLife.02105.010">http://dx.doi.org/10.7554/eLife.02105.010</ext-link></p></caption><graphic xlink:href="elife02105fs006"/></fig><fig id="fig2s5" position="float" specific-use="child-fig"><object-id pub-id-type="doi">10.7554/eLife.02105.011</object-id><label>Figure 2—figure supplement 5.</label><caption><title>Ser2P average profile at genic locations and examples of Tyr1P signal at promoter locations.</title><p>(<bold>A</bold>) Ser2P average profile on 1415 genes selected on mean values distribution shown in <xref ref-type="fig" rid="fig2s1">Figure 2—figure supplement 1B</xref> and represented as for <xref ref-type="fig" rid="fig2">Figure 2C</xref>. (<bold>B</bold>) Examples of Tyr1P (and other isoforms, short ssRNAs) at promoters of 5 coding genes. 
These genes show a dominance of Tyr1P (3D12) signal upstream (AS direction) relatively to downstream TSSs and as compared to Pol II and isoforms.</p><p><bold>DOI:</bold> <ext-link ext-link-type="doi" xlink:href="10.7554/eLife.02105.011">http://dx.doi.org/10.7554/eLife.02105.011</ext-link></p></caption><graphic xlink:href="elife02105fs007"/></fig><fig id="fig2s6" position="float" specific-use="child-fig"><object-id pub-id-type="doi">10.7554/eLife.02105.012</object-id><label>Figure 2—figure supplement 6.</label><caption><title>Tyr1P presents a specific pattern of phosphorylation along genes compared to Pol II.</title><p>(<bold>A</bold>) Genome-wide profiling of Pol II (N20) and CTD isoforms (as in <xref ref-type="fig" rid="fig2">Figure 2</xref>) for different classes of binding levels indicate a distribution of Tyr1P more prominent at promoters vs gene bodies as compared to Pol II and Ser7P, but comparable to that of Ser5P. The indicated signal rank of the values is over an area encompassing TSS, GB, and 3′ ends of genes as indicated in the ‘Materials and methods–Gene selection and average binding profiles’. Note that more Tyr1P signal is found at 3′ ends as compared to Ser5P. (<bold>B</bold>) Spearman correlation plots of significantly enriched areas for Pol II and phospho-isoforms (genes size &gt;2 kb) indicate that Tyr1P relates more to Pol II and early transcription marks at promoters than it does at gene bodies or 3′ends. 
Mean values for Spearman correlation were computed at [TSS-500 bp;TSS+500 bp], [TSS+1000 bp; 3′end-500 bp], and [3′end-500 bp; 3′end+1000 bp] (‘Materials and methods–Correlation of biological replicates and cross-correlation’).</p><p><bold>DOI:</bold> <ext-link ext-link-type="doi" xlink:href="10.7554/eLife.02105.012">http://dx.doi.org/10.7554/eLife.02105.012</ext-link></p></caption><graphic xlink:href="elife02105fs008"/></fig><fig id="fig2s7" position="float" specific-use="child-fig"><object-id pub-id-type="doi">10.7554/eLife.02105.013</object-id><label>Figure 2—figure supplement 7.</label><caption><title>Tyr1P specific antibodies with distinct peptide recognition patterns show similar genome-wide profiling at TSS.</title><p>(<bold>A</bold>) CTD peptide recognition patterns of 3D12 and 8G5 Tyr1P Abs used in this study. Note that 8G5 shows a wider range of peptide recognition compared to 3D12. (<bold>B</bold>) Specificity and reactivity of mAbs were tested in ELISA experiments towards the peptides CTD-1 to -19. (<bold>C</bold>) Genome-wide profiling of ChIP-seq experiments performed with 8G5 at TSSs (left panel) or at gene body locations on 2365 genes. As for 3D12 Ab, the AS peak is over-represented when compared to Pol II.</p><p><bold>DOI:</bold> <ext-link ext-link-type="doi" xlink:href="10.7554/eLife.02105.013">http://dx.doi.org/10.7554/eLife.02105.013</ext-link></p></caption><graphic xlink:href="elife02105fs009"/></fig></fig-group></p><p>To assess its relation to transcription genome-wide, we next performed Tyr1P ChIP-seq, using 3D12 mAb, and compared it to Pol II and the other phospho-isoforms. We isolated significantly associated regions based on the signal distribution of the background-subtracted data (<xref ref-type="fig" rid="fig2s1">Figure 2—figure supplement 1B</xref>) and found that Pol II and all isoforms, including Tyr1P, correlated with transcription levels of genes (<xref ref-type="fig" rid="fig2s2">Figure 2—figure supplement 2</xref>). 
At many gene locations, a predominant signal of Tyr1P at promoters was observed (<xref ref-type="fig" rid="fig2">Figure 2B</xref>, <xref ref-type="fig" rid="fig2s3">Figure 2—figure supplement 3</xref>). We further confirmed this by genome-wide profiling of Pol II isoforms at coding-gene locations (<xref ref-type="fig" rid="fig2">Figure 2C</xref>, <xref ref-type="fig" rid="fig2s4">Figure 2—figure supplement 4</xref>, <xref ref-type="fig" rid="fig2s5">Figure 2—figure supplement 5A</xref> for Ser2P profile). Our profiling analysis shows that Tyr1P signal is predominantly found at promoters similarly to Ser5P, weak or essentially absent at gene bodies and weak at 3′ends in contrast to Ser2P elongating mark and Ser7P (associated with both promoters and gene bodies). These observations are further supported by quantification of signals at various genic sections (<xref ref-type="fig" rid="fig2s6">Figure 2—figure supplement 6</xref>) and reinforce our conclusion that human Tyr1P is mainly associated with promoters in an early, post-initiation step of transcription. Although we did not further investigate this possibility, in the accompanying manuscript, Hsin et al. show that chicken Tyr1 is found phosphorylated in the nucleoplasm, raising the possibility that Tyr1P is also associated with recruitment of the enzyme and transcription initiation.</p><p>Genomic profiling at the vicinity of the transcription start site (TSS) indicates two main peaks of Pol II upstream and downstream of the TSS (<xref ref-type="fig" rid="fig2">Figure 2D</xref>, left panel and <xref ref-type="fig" rid="fig2s4">Figure 2—figure supplement 4</xref>). 
These peaks most likely reflect sense and antisense paused transcription as evidenced by our short strand specific (ssRNA) sequencing analysis, as previously described (<xref ref-type="bibr" rid="bib5">Core et al., 2008</xref>; <xref ref-type="bibr" rid="bib24">Preker et al., 2008</xref>; <xref ref-type="bibr" rid="bib26">Seila et al., 2008</xref>; <xref ref-type="bibr" rid="bib10">Fenouil et al., 2012</xref>) for mammalian promoters. This transcription results in short promoter-associated transcripts production and might relate to pervasive transcription of promoters in sequence context lacking strong elements imposing directionality. By comparing the signals of these two peaks with that of the Ser5P and Ser7P isoforms, Tyr1P showed a clearly distinct pattern with a more pronounced upstream peak (<xref ref-type="fig" rid="fig2">Figure 2D</xref>, <xref ref-type="fig" rid="fig2s4">Figure 2—figure supplement 4</xref> and examples in <xref ref-type="fig" rid="fig2s5">Figure 2—figure supplement 5B</xref>). We confirmed this result with an independent Tyr1P antibody (8G5) harboring wider range of CTD peptide recognition (<xref ref-type="fig" rid="fig2s7">Figure 2—figure supplement 7</xref>), and by using statistical analysis showing that antisense/sense (AS/S) difference was significant for Tyr1P as compared to other isoforms (<xref ref-type="fig" rid="fig2">Figure 2E</xref>, <xref ref-type="fig" rid="fig2s4">Figure 2—figure supplement 4B</xref>). Together, our analyses indicate that Tyr1P is predominantly associated with upstream polymerases, mostly reflecting AS transcription at mammalian promoters.</p><p>We previously showed that mammalian promoters associated with Pol II can be grouped in three main classes in mouse T-lymphocytes (<xref ref-type="bibr" rid="bib10">Fenouil et al., 2012</xref>), based on ranking of the main Pol II signal from the most upstream to the most downstream of the TSS. 
We reproduced this result and the main features of the three groups in human Raji B-cells by ranking the signal of Tyr1P (<xref ref-type="fig" rid="fig3">Figure 3A</xref>, <xref ref-type="fig" rid="fig3s1">Figure 3—figure supplement 1A,B</xref>). The first class (the majority of genes), with Pol II signals most upstream of TSSs, harbors strongly paused Pol II at promoters with high GC content and CpG islands (CGIs) and is associated with the highest level of bidirectional and AS transcription. The second class, with a sharper Pol II peak centered close to the TSS and lower GC content, contains mostly mono-directional sense paused transcription whereas the third class contains more downstream Pol II with less pause. We then focused our attention on class I that contains most AS short RNAs. In this class, Tyr1P is essentially observed in AS while Ser5P, Ser7P, or total Pol II generally show a second peak around the TSS reflecting sense and therefore bidirectional transcription (<xref ref-type="fig" rid="fig3">Figure 3C</xref>, <xref ref-type="fig" rid="fig3s1">Figure 3—figure supplement 1C</xref>). This indicates that AS Tyr1P relates to one specific class of promoters and suggests that in AS orientation, Tyr1P associates mainly with the leading edge of Pol II. Pleading for this hypothesis, the location of the AS Tyr1P in class I is found more downstream on average as compared to Pol II or Ser5P, and locates just after the −2 nucleosome midpoint (<xref ref-type="fig" rid="fig3">Figure 3B,C</xref>). A more detailed investigation of the individual positions of phospho-isoforms further shows that for the majority of promoters significantly associated with AS short RNAs in class I, Tyr1P is either located at the immediate proximity or after the main Pol II peak (<xref ref-type="fig" rid="fig3s2">Figure 3—figure supplement 2</xref>) suggesting that it might play a role in early elongation. 
Although Ser7P displayed similar characteristics, its influence on transcription of coding genes is likely to be minor, as Ser7 mutations do not show significant phenotype (<xref ref-type="bibr" rid="bib4">Chapman et al., 2007</xref>) or transcriptome impairment (JCA and DE, unpublished observations). We overall conclude that Tyr1P is a CTD PTM that associates with the 5′ end of genes and shows a stronger linkage to paused Pol II at promoters with bidirectional and AS transcription.<fig-group><fig id="fig3" position="float"><object-id pub-id-type="doi">10.7554/eLife.02105.014</object-id><label>Figure 3.</label><caption><title>Tyr1 is preferentially phosphorylated in antisense orientation on a particular subset of genes.</title><p>(<bold>A</bold>) Heatmaps of Tyr1P (3D12), Pol II, Ser5P, Ser7P, nucleosome midpoints (positioning) and short strand specific RNAs (red for AS and blue for S signal) at promoters with a significant level of Pol II. The genes were ordered by position of the main Tyr1P accumulation area from the most 5′ to the most 3′ within −1000 bp and +1000 bp around TSS. Three main classes are defined by Tyr1P occupancy: class I most 5′ (red bar, 1066 genes), class II TSS-proximal (green bar, 579 genes), and class III most 3′ (blue bar, 209 genes). (<bold>B</bold>) Average profiling of short ssRNAs and nucleosomes positions in class I. Positions of the nucleosome midpoints are indicated by a dashed line (nucleosome −3, −2, −1, and +1 from left to right). (<bold>C</bold>) Profiles of Pol II and CTD isoforms in class I. Red, blue, orange, and green dashed lines indicate the average position of the maximum values of Pol II, Tyr1P (3D12), Ser5P, and Ser7P signals, respectively. The distance between Pol II leading edge and isoforms is indicated below each graph. 
The borders of nucleosomes −3, −2, and +1 (from left to right) are shown as pink rectangles whereas the red, blue, orange, and green circles represent Pol II, Tyr1P, Ser5P, and Ser7P, respectively with indication of directionality based on the short ssRNA signals.</p><p><bold>DOI:</bold> <ext-link ext-link-type="doi" xlink:href="10.7554/eLife.02105.014">http://dx.doi.org/10.7554/eLife.02105.014</ext-link></p></caption><graphic xlink:href="elife02105f003"/></fig><fig id="fig3s1" position="float" specific-use="child-fig"><object-id pub-id-type="doi">10.7554/eLife.02105.015</object-id><label>Figure 3—figure supplement 1.</label><caption><title>Three classes of Pol II-bound promoters ordered by Tyr1P location in human Raji cells.</title><p>(<bold>A</bold>) Heatmaps of a selection of Pol II-bound promoters for ssRNAs, nucleosome and AT, GC contents ordered by Tyr1P (3D12) maximum signal from the most upstream to the most downstream of the annotated TSSs (as previously described in mouse lymphocytes, <xref ref-type="bibr" rid="bib10">Fenouil et al., 2012</xref>). Note that Pol II main accumulation areas occur at proximity of the main nucleosome position for each promoter class. As described before (<xref ref-type="bibr" rid="bib10">Fenouil et al., 2012</xref>), GC content and CpG islands correlate with nucleosome depletion. (<bold>B</bold>) Profiles of ssRNAs (sense and antisense) and nucleosome in the three groups. 
(<bold>C</bold>) Profiles of Pol II and CTD isoforms in the three classes of promoters as indicated.</p><p><bold>DOI:</bold> <ext-link ext-link-type="doi" xlink:href="10.7554/eLife.02105.015">http://dx.doi.org/10.7554/eLife.02105.015</ext-link></p></caption><graphic xlink:href="elife02105fs010"/></fig><fig id="fig3s2" position="float" specific-use="child-fig"><object-id pub-id-type="doi">10.7554/eLife.02105.016</object-id><label>Figure 3—figure supplement 2.</label><caption><title>CTD isoforms and nucleosome distribution around Pol II upstream of TSSs in class I promoters.</title><p>(<bold>A</bold>) 3D plots of Tyr1P, Ser5P, Ser7P and nucleosomes midpoints (MP) maximum signal locations as compared to Pol II ChIP-seq maxima for genes of group 1 of <xref ref-type="fig" rid="fig3">Figure 3A</xref>. Only genes with a significant signal of antisense ssRNA and higher than sense ssRNA were taken into account (see ‘Materials and methods–CTD isoforms and nucleosomes midpoint maximal peaks spatial organization analysis’ for details). The positive values of the distance to Pol II axis (in bp) indicate that maximum signals are located after Pol II in opposite direction of TSSs whereas negative values are in the inverse orientation. The number of maximal peaks before, after or colocalized with Pol II for Tyr1P, Ser5P, and Ser7P are 90/265/174, 99/152/278, 125/234/170, respectively. Note that most of the Tyr1P max values are located after Pol II whereas Ser5P is mainly found around Pol II main signal. (<bold>B</bold>) 2D Boxplots of the maximum values shown in (<bold>A</bold>) (upper panel) and for an independent analysis using Tyr1P max signal as reference (lower panel). In both cases Tyr1P locates at or after the leading edge of Pol II. (<bold>C</bold>) Distance to Pol II distribution of Tyr1P, Ser5P, and Ser7P for class I promoters selected as described in (<bold>A</bold>). Data is represented in bins of 10 (‘Materials and methods–Processing of sequenced tags’). 
The difference of distribution with the whole set of genes (black line) was assessed by a nonparametric Kolmogorov-Smirnov test. p-values are indicated at the top-right of each panel.</p><p><bold>DOI:</bold> <ext-link ext-link-type="doi" xlink:href="10.7554/eLife.02105.016">http://dx.doi.org/10.7554/eLife.02105.016</ext-link></p></caption><graphic xlink:href="elife02105fs011"/></fig></fig-group></p><p>Many groups including ours have shown that highly active and tissue-specific enhancers are transcribed by Pol II in various tissues (<xref ref-type="bibr" rid="bib8">De Santa et al., 2010</xref>; <xref ref-type="bibr" rid="bib17">Kim et al., 2010</xref>; <xref ref-type="bibr" rid="bib18">Koch et al., 2011</xref>; <xref ref-type="bibr" rid="bib22">Natoli and Andrau, 2012</xref>). These enhancers can also be hallmarked by the occurrence of H3K4me1<sup>high</sup>/H3K4me3<sup>low</sup> epigenetic marks combination (<xref ref-type="bibr" rid="bib18">Koch et al., 2011</xref>; <xref ref-type="bibr" rid="bib23">Pekowska et al., 2011</xref>). To investigate if Tyr1P can be detected at enhancers, we first isolated intergenic regions (IGRs) with stringent criteria in B-cells using Pol II, H3K4me1, and me3 signals. These were further discriminated from noncoding promoters using the relative ratio of H3K4me1/me3 (<xref ref-type="bibr" rid="bib23">Pekowska et al., 2011</xref>; <xref ref-type="bibr" rid="bib20">Li et al., 2012</xref>), and from both unannotated coding and some long intergenic noncoding genes using the absence of H3K36me3 that marks gene bodies (<xref ref-type="bibr" rid="bib12">Guttman et al., 2009</xref>). Using these criteria, we isolated 390 B-cells enhancers (<xref ref-type="fig" rid="fig4s1">Figure 4—figure supplement 1A–D</xref>). Our selection was further validated using tissue-specificity analyses (<xref ref-type="fig" rid="fig4s1">Figure 4—figure supplement 1E</xref>) indicating IGRs associated with genes specific to B-cells. 
We next performed profiling of the various Pol II isoforms at these enhancers. As before (<xref ref-type="bibr" rid="bib18">Koch et al., 2011</xref>), we observed that these IGRs were associated with Ser5P (<xref ref-type="fig" rid="fig4">Figure 4A</xref>) but not with Ser2P Pol II (not shown) as well as with short transcripts (reflecting paused transcription) and a discrete nucleosome depleted region. Consistent with early elongating Pol II at enhancers, we found signal for both Ser7P and Tyr1P at these IGRs. Importantly, Tyr1P appeared more bound to enhancers as compared to promoters and total Pol II (<xref ref-type="fig" rid="fig4">Figure 4B,C</xref>, <xref ref-type="fig" rid="fig4s2">Figure 4—figure supplement 2</xref>), suggesting that Tyr1 is more phosphorylated than Ser5 or Ser7 at enhancers and represents a hallmark of these essential areas of the genome. Additionally, Tyr1P also displayed the best correlation with Pol II at isolated enhancers (<xref ref-type="fig" rid="fig4">Figure 4D</xref>). Finally, using an independent selection for active enhancers based on H3K27ac brought very similar results (<xref ref-type="fig" rid="fig4s3">Figure 4—figure supplement 3</xref>). Together, our investigations showed that Tyr1P is a strong signature of Pol II-transcribed active enhancers associated with tissue-specific gene expression.<fig-group><fig id="fig4" position="float"><object-id pub-id-type="doi">10.7554/eLife.02105.017</object-id><label>Figure 4.</label><caption><title>Tyr1P is a hallmark of enhancers relative to Pol II and promoters signal.</title><p>(<bold>A</bold>) Average profiling of Pol II, Tyr1P (3D12), Ser5P, Ser7P, nucleosomes occupancy, and short ssRNAs. 390 active putative enhancers (red) and 4618 control promoters (blue) were detected in human Raji B-cells (‘Materials and methods–Selection of enhancers and promoters using Pol II’). Profiles are centered on Pol II ChIP-seq maximal signal and are not oriented. 
(<bold>B</bold>) Boxplots of mean ChIP-seq signal on selected enhancer and control promoter regions for Ser5P (371/4378 values), Ser7P (368/4257 values), and Tyr1P (372/4266 values). Signals were normalized by the mean ChIP-seq signal of Pol II on the same regions. All marks show a significant difference (nonparametric Mann-Whitney-Wilcoxon test, p-values &lt;10<sup>−10</sup>). (<bold>C</bold>) Example of Tyr1P at promoter and putative enhancer. (<bold>D</bold>) Spearman cross-correlation between Pol II, Ser5P, Ser7P, Ser2P, and Tyr1P (3D12) at intergenic putative enhancers. Tyr1P and Pol II best correlate with each other.</p><p><bold>DOI:</bold> <ext-link ext-link-type="doi" xlink:href="10.7554/eLife.02105.017">http://dx.doi.org/10.7554/eLife.02105.017</ext-link></p></caption><graphic xlink:href="elife02105f004"/></fig><fig id="fig4s1" position="float" specific-use="child-fig"><object-id pub-id-type="doi">10.7554/eLife.02105.018</object-id><label>Figure 4—figure supplement 1.</label><caption><title>Pol II-bound enhancer selection procedure and features.</title><p>(<bold>A</bold>) Workflow of the enhancers (390) and control promoters (4618) selection based on ChIP-seq of H3K36me3, H3K4me3, H3K4me1, and Pol II. Details of procedure and number of regions isolated at each step (E1-4 and P1-3) are indicated in ‘Materials and methods–Selection of enhancers and promoters using Pol II’. (<bold>B</bold>) Plot of H3K4me3/me1 mean values ratios of selected intergenic regions at step E2 (in red), promoter regions at step P1 (in blue), and Hg19 RefSeq annotated promoters (in black). To stringently select isolated promoters and intergenic regions shown in (<bold>A</bold>) and attribute their putative enhancer and control promoter status, a threshold was defined (in dashed green line). 
(<bold>C</bold>) Nonoriented profiling of epigenetic marks associated with putative enhancers (in red) and control promoters (in blue) selected at steps P3 and E4 of procedure described in (<bold>A</bold>) and centered on the main Pol II peak as in <xref ref-type="fig" rid="fig4">Figure 4A</xref>. (<bold>D</bold>) Boxplots of H3K4me3 (363/4325 genes plotted) and H3K4me1 (375/4259 genes plotted) signals at putative enhancers (in red) and control promoters (in blue). Nonparametric Mann-Whitney-Wilcoxon test gave p-values &lt;10<sup>−152</sup>. (<bold>E</bold>) Tissue specificity analysis of the genes associated with putative enhancers (closest genes on each side of the isolated genomic loci) compared to genes of HGU133 array (whole genes, see ‘Materials and methods–Tissue specificity analysis’). The isolated tissues are ranked by p-values (indicated on the left) from top to bottom. This analysis indicates that both WT (CD19) and Raji human B-cells are among the most significant tissues thus validating the putative enhancer regions identified in our analysis and as described in mouse lymphocytes (<xref ref-type="bibr" rid="bib20">Li et al., 2012</xref>).</p><p><bold>DOI:</bold> <ext-link ext-link-type="doi" xlink:href="10.7554/eLife.02105.018">http://dx.doi.org/10.7554/eLife.02105.018</ext-link></p></caption><graphic xlink:href="elife02105fs012"/></fig><fig id="fig4s2" position="float" specific-use="child-fig"><object-id pub-id-type="doi">10.7554/eLife.02105.019</object-id><label>Figure 4—figure supplement 2.</label><caption><title>Examples of Tyr1P enhancer association upstream or downstream of CXCR4, DUSP2, and IER5 genes.</title><p>As in <xref ref-type="fig" rid="fig4">Figure 4</xref>, light orange and blue rectangles highlight enhancer and promoter locations with higher H3K4me3 at promoters and higher H3K4me1 at enhancers. Relative amount of Tyr1P is higher at enhancers as compared to Pol II and to promoters. 
H3K4me3 level at CXCR4 IGR was observed but is not visible due to the scale used and because of high level of signal at promoter.</p><p><bold>DOI:</bold> <ext-link ext-link-type="doi" xlink:href="10.7554/eLife.02105.019">http://dx.doi.org/10.7554/eLife.02105.019</ext-link></p></caption><graphic xlink:href="elife02105fs013"/></fig><fig id="fig4s3" position="float" specific-use="child-fig"><object-id pub-id-type="doi">10.7554/eLife.02105.020</object-id><label>Figure 4—figure supplement 3.</label><caption><title>Selection of enhancers using H3K27ac also shows a dominance of Tyr1P on active and tissue specific enhancers.</title><p>(<bold>A</bold>) Workflow of a complementary selection of enhancers (927/2598 active), and control promoters (5946/6057 active) based on ChIP-seq of H3K36me3, H3K4me3, and H3K4me1. H3K27ac was used to extract specifically active enhancers from the whole set. Details of procedure and number of regions isolated at each step (E1'-6' and P1'-6') are indicated in ‘Materials and methods–Selection of active enhancers and promoters using H3K27ac’. (<bold>B</bold>) Average profiles of Pol II and isoforms for active enhancers/promoters and the whole set of enhancers/promoters. (<bold>C</bold>) Active (H3K27ac selection) enhancers show increased enrichment over Pol II and tissue-specific gene expression. As in <xref ref-type="fig" rid="fig4">Figure 4</xref>, Spearman correlation, boxplots of comparison of levels of Pol II isoforms, and tissue specificity analyses indicate Tyr1P to be over-enriched at active enhancers as compared to Pol II and promoters. Nonparametric two-sided Mann-Whitney-Wilcoxon test for boxplots of Ser5P (780/5068 values), Ser7P (752/4953 values), and Tyr1P (739/5233 values) yields p-values of 5.1 × 10<sup>−56</sup>, 7.05 × 10<sup>−4</sup>, and 2.1 × 10<sup>−30</sup>, respectively. (<bold>D</bold>) Whole enhancer set (H3K4me1/3) analysis as in (<bold>C</bold>). 
Nonparametric two sided Mann-Whitney-Wilcoxon test for boxplots of Ser5P (2220/5141 values), Ser7P (2186/5005 values), and Tyr1P (2112/5306 values) yields p-values of 2.6 × 10<sup>−139</sup>, 6.8 × 10<sup>−4</sup>, and 8.09 × 10<sup>−4</sup>, respectively.</p><p><bold>DOI:</bold> <ext-link ext-link-type="doi" xlink:href="10.7554/eLife.02105.020">http://dx.doi.org/10.7554/eLife.02105.020</ext-link></p></caption><graphic xlink:href="elife02105fs014"/></fig></fig-group></p><p>Here, we described that Tyr1P associates with 5′ Pol II and AS transcription at promoters and is a signature of active, tissue-specific enhancers in human B-cells. These findings contrast with features of Tyr1P in yeast, which is located at gene bodies and proposed to play a role in elongation by impairing termination factor recruitment (<xref ref-type="bibr" rid="bib21">Mayer et al., 2012</xref>). These apparent discrepancies thus provide an interesting paradigm whereby a conserved PTM has evolved to display specialized functions specific to metazoans. However, <italic>S. cerevisiae</italic> genes are very compact, mostly devoid of introns and promoters structure is also extremely divergent in both length and sequence between yeast (around 100–200 nt, AT-rich) and mammals (around 1000 nt, GC-rich). Furthermore, enhancers do not exist per se in yeast. In an accompanying manuscript, <xref ref-type="bibr" rid="bib16">Hsin et al. (2014)</xref> describe similar observations regarding stability of Y1F mutant in chicken cells and involvement of Tyr1P in AS transcription at promoters, thus providing further evidence that our observations are conserved in vertebrates. We therefore speculate that differential CTD PTMs might not only reflect, but also play a role in regulating the directionality of transcription. 
How Tyr1P would behave in organisms with less prominent bidirectional transcription at promoters such as <italic>Drosophila</italic> (<xref ref-type="bibr" rid="bib6">Core et al., 2012</xref>) thus represents an interesting evolutionary question to be addressed in future studies.</p><p>Based on the spatial location of Tyr1P in class I promoters, mostly found at the leading edge of Pol II in opposite orientation of the gene, it is tempting to speculate that this PTM might be involved in a transcriptional state marking the transition between early and productive elongation, providing a checkpoint for transcriptional complexes to proceed in productive elongation. Depending on the level of Tyr1P at promoters, Pol II might become competent for elongation as well as for overcoming the nucleosomal barrier both in sense and antisense orientation. Since fewer Pol II molecules are able to effectively enter elongation in AS orientation, more accumulation of the Tyr1P could be observed upstream of the TSS toward the leading edge of Pol II. This could also explain degradation of the Y1F mutant, which, due to the absence of the Tyr1P checkpoint signal, would accumulate around the edge of the promoters and become degraded. Finally there could also be a link between hyperphosphorylation of Tyr1 in AS orientation and exosome machinery recruitment to degrade nascent RNA prior to release of the Pol II enzyme (<xref ref-type="bibr" rid="bib24">Preker et al., 2008</xref>; <xref ref-type="bibr" rid="bib1">Andersen et al., 2013</xref>). 
We believe our work will thus provide a new frame of investigation to decipher the complexity of mechanisms leading to transcriptional activation, at the heart of gene regulation.</p></sec><sec id="s3" sec-type="materials|methods"><title>Materials and methods</title><sec id="s3-1"><title>Antibodies</title><p>Generation and validation of modification specific mAbs have been described before: Tyr1P mAb (3D12, <xref ref-type="bibr" rid="bib21">Mayer et al., 2012</xref>) and 8G5 (see <xref ref-type="fig" rid="fig2s7">Figure 2—figure supplement 7</xref>), Ser2P (3E10), Ser5P (3E8), and Ser7P (4E12, <xref ref-type="bibr" rid="bib4">Chapman et al., 2007</xref>), Thr4P (6D7, <xref ref-type="bibr" rid="bib14">Hintermair et al., 2012</xref>).</p><p>For further characterization of specificity, the 3D12 and 8G5 Tyr1P antibodies were analyzed in ELISA experiments using CTD-like peptides with different modification patterns (Peptide Specialty Laboratories GmbH, Heidelberg, Germany) coupled to 96-well maleimide plates (Thermo Fisher Scientific Inc., Rockford, IL USA) as antigen (<xref ref-type="fig" rid="fig2s7">Figure 2—figure supplement 7</xref>). Peptides were incubated with the monoclonal antibodies and biotinylated, subclass-specific antibodies, respectively. After incubation with horseradish peroxidase (HRP)-coupled avidin, H<sub>2</sub>O<sub>2</sub> and TMB (3,3',5,5'-tetramethylbenzidine) were added. Absorbance of each well was measured at 650 nm after color change and quantitated with an ELISA reader.</p></sec><sec id="s3-2"><title>Extracts, western blots, and co-immunoprecipitation</title><sec id="s3-2-1"><title>Immunoprecipitation (IP) experiments</title><p>3 × 10<sup>6</sup> Raji cells were lysed in 200 µl IP buffer (50 mM Tris–HCl, pH 8.0, 150 mM NaCl, 1% NP-40 (Roche, Germany), 1x PhosSTOP (Roche), 1x protease inhibitor cocktail (Roche)) for 20 min on ice. 
All samples were sonicated on ice using a BRANSON Sonifier 250 (15 s on, 15 s off, 50% duty) and centrifuged at 14,500 rpm for 15 min at 4°C. The supernatant was incubated with antibody-coupled protein G/A-Sepharose (1:1) beads (2.5 µg of antibodies for 4 hr at 4°C, followed by two washes with 1 ml IP buffer) rotating overnight. Beads were washed several times with 1 ml IP buffer and proteins were boiled off Sepharose beads in Laemmli buffer containing 8 M urea for SDS-PAGE.</p></sec><sec id="s3-2-2"><title>Western blots</title><p>Samples of protein were harvested following treatment using 2x Laemmli buffer. Protein equivalent to 200,000 cells was loaded in 20 µl Laemmli, per lane, and subjected to SDS-PAGE on a 6.5% gel before transfer to nitrocellulose (GE Healthcare, Germany). Membranes were either stained with affinity purified, IR-labelled secondary antibodies against rat (680 nm; Alexa, Invitrogen) and mouse (800 nm; Rockford, Biomol), and revealed using the Odyssey (Licor), or stained with HRP-conjugated secondary antibodies against rat (Sigma), mouse (Promega), or rabbit (Promega), and revealed by enhanced chemiluminescence.</p></sec></sec><sec id="s3-3"><title>Generation and analysis of Y1F mutant</title><sec id="s3-3-1"><title>Construction of the CTD Y1F mutant</title><p>Construction of wild-type and mutant (Y1F) Rpb1 expression vectors was performed as follows: The DNA sequence of RPB1 CTD comprising amino acids of repeats 1–52 (aa 1593–1970) was synthesized and cloned into a vector LSmock (<xref ref-type="bibr" rid="bib3">Chapman et al., 2004</xref>) and recombinant HA-tagged wild-type RPB1 was established. Alternatively, a CTD DNA sequence was synthesized with a replacement of the amino acid tyrosine by phenylalanine in repeats 4 to 51 of CTD. Both vectors were sequenced before use.</p></sec><sec id="s3-3-2"><title>α-Amanitin resistant cell lines and cell culture</title><p>Raji is an Epstein-Barr-virus-positive Burkitt's lymphoma cell line. 
Cells were transfected with the wild-type and mutant (Y1F) Rpb1 expression vectors by electroporation (10 μg of plasmid DNA/10<sup>7</sup> cells; 960 μF, 250 V). Polyclonal cell batches were established after selection with G418 (1 mg/ml) for 10–12 days. Expression of recombinant Rpb1 was induced by removal of doxycycline. 24 hr after induction, cells were cultured in the presence of 2 μg/ml α-amanitin (Sigma). Cells were grown in RPMI 1640 medium supplemented with 10% fetal calf serum, 1% penicillin streptomycin (GIBCO; Invitrogen, Germany), and 2 mM L-glutamine (GIBCO; Invitrogen) at densities between 2 × 10<sup>5</sup> and 10<sup>6</sup> cells/ml.</p></sec></sec><sec id="s3-4"><title>ChIP-seq, MNase-seq, and RNA-seq experiments</title><p>ChIP-seq and MNase-seq experiments were performed essentially as described before using the same standards and QC for experiments (<xref ref-type="bibr" rid="bib10">Fenouil et al., 2012</xref>). Experimental details of individual experiments, including replicates when applicable, are also indicated in <xref ref-type="table" rid="tbl1">Table 1</xref>.<table-wrap id="tbl1" position="float"><object-id pub-id-type="doi">10.7554/eLife.02105.021</object-id><label>Table 1.</label><caption><p>Summary of ChIP conditions and bioinformatics treatment for each experiment (NR = not relevant, NA = not available)</p><p><bold>DOI:</bold> <ext-link ext-link-type="doi" xlink:href="10.7554/eLife.02105.021">http://dx.doi.org/10.7554/eLife.02105.021</ext-link></p></caption><table frame="hsides" rules="groups"><thead><tr><th/><th colspan="6">ChIP antibodies and conditions used (* For ChIP-QPCR)</th><th/><th colspan="2"/><th/><th/><th colspan="2">Peak detection</th></tr><tr><th>Experiment</th><th>Antibody (clone)</th><th>Origin</th><th>Reference Antibody</th><th>Number of cells</th><th>Antibody/Beads</th><th>Washes (RIPA/TE)</th><th>Replicates Number</th><th>Tags Not Aligned/Multiple Alignment (× 10<sup>6</sup>)</th><th>Tags Used (× 10<sup>6</sup>)</th><th>Lanes 
Number</th><th>Extension Size (bp)</th><th>Threshold</th><th>Max Gap</th></tr></thead><tbody><tr><td rowspan="3">Pol II</td><td rowspan="3">Total (N-20)</td><td rowspan="3">Rabbit polyclonal</td><td rowspan="3">Santa Cruz (sc-899x)</td><td rowspan="3">1 × 10<sup>8</sup></td><td rowspan="3">20 µg/200 µl</td><td rowspan="3">8x/1x</td><td>1</td><td>8.93</td><td>19.83</td><td>1</td><td>176</td><td rowspan="3">80</td><td rowspan="3">350</td></tr><tr><td>2</td><td>17.94</td><td>33.02</td><td>2</td><td>166</td></tr><tr><td>3</td><td>16.54</td><td>28.48</td><td>1</td><td>156</td></tr><tr><td rowspan="2">H3K4me1</td><td rowspan="2">H3K4me1</td><td rowspan="2">Rabbit polyclonal</td><td rowspan="2">Abcam (ab8895)</td><td rowspan="2">5 × 10<sup>6</sup></td><td rowspan="2">2 µg/20 µl</td><td rowspan="2">8x/1x</td><td>1</td><td>9.35</td><td>7.83</td><td>1</td><td>176</td><td rowspan="2">60</td><td rowspan="2">700</td></tr><tr><td>2</td><td>7.59</td><td>20.93</td><td>1</td><td>226</td></tr><tr><td rowspan="2">H3K4me3</td><td rowspan="2">H3K4me3</td><td rowspan="2">Rabbit polyclonal</td><td rowspan="2">Abcam (ab8580)</td><td rowspan="2">5 × 10<sup>6</sup></td><td rowspan="2">2 µg/20 µl</td><td rowspan="2">8x/1x</td><td>1</td><td>7.12</td><td>2.61</td><td>1</td><td>186</td><td rowspan="2">50</td><td rowspan="2">400</td></tr><tr><td>2</td><td>NA</td><td>14.14</td><td>1</td><td>123</td></tr><tr><td rowspan="2">H3K36me3</td><td rowspan="2">H3K36me3</td><td rowspan="2">Rabbit polyclonal</td><td rowspan="2">Abcam (ab9050)</td><td rowspan="2">2 × 10<sup>7</sup></td><td rowspan="2">8 µg/80 µl</td><td rowspan="2">8x/1x</td><td>1</td><td>NA</td><td>21.21</td><td>1</td><td>196</td><td rowspan="2">40</td><td rowspan="2">1000</td></tr><tr><td>2</td><td>NA</td><td>5.57</td><td>1</td><td>316</td></tr><tr><td>H3K27ac</td><td>H3K27ac</td><td>Rabbit polyclonal</td><td>Ab4729</td><td>5 × 10<sup>6</sup></td><td>2 µg/20 
µl</td><td>5x/1x</td><td>1</td><td>5.33</td><td>52.50</td><td>1</td><td>197</td><td>100</td><td>750</td></tr><tr><td rowspan="3">Tyr1P</td><td rowspan="2">Tyr1P (3D12)</td><td rowspan="2">Rat monoclonal</td><td rowspan="2"><xref ref-type="bibr" rid="bib21">Mayer et al. (2012)</xref></td><td rowspan="2">1 × 10<sup>8</sup></td><td rowspan="2">10 µg/100 µl</td><td rowspan="2">5x/1x</td><td>1</td><td>12.30</td><td>15.56</td><td>1</td><td>206</td><td rowspan="2">NR</td><td rowspan="2">NR</td></tr><tr><td>2</td><td>9.98</td><td>15.55</td><td>1</td><td>276</td></tr><tr><td>Tyr1P (8G5)</td><td>Rat monoclonal</td><td>This article</td><td>1 × 10<sup>8</sup></td><td>10 µg/100 µl</td><td>5x/1x</td><td>1</td><td>30.26</td><td>28.78</td><td>1</td><td>187</td><td>NR</td><td>NR</td></tr><tr><td rowspan="2">Ser2P</td><td rowspan="2">Ser2P (3E10)</td><td rowspan="2">Rat monoclonal</td><td rowspan="2"><xref ref-type="bibr" rid="bib4">Chapman et al. (2007)</xref></td><td rowspan="2">2 × 10<sup>8</sup></td><td rowspan="2">80 µg/400 µl</td><td rowspan="2">5x/1x</td><td>1</td><td>9.31</td><td>11.28</td><td>1</td><td>192</td><td rowspan="2">NR</td><td rowspan="2">NR</td></tr><tr><td>2</td><td>9.85</td><td>15.94</td><td>1</td><td>286</td></tr><tr><td rowspan="2">Ser5P</td><td rowspan="2">Ser5P (3E8)</td><td rowspan="2">Rat monoclonal</td><td rowspan="2"><xref ref-type="bibr" rid="bib4">Chapman et al. (2007)</xref></td><td rowspan="2">1.2 × 10<sup>8</sup> (2.5 × 10<sup>7</sup>*)</td><td rowspan="2">24 µg/240 µl (5 µg/50 µl*)</td><td rowspan="2">8x/1x</td><td>1</td><td>NA</td><td>13.98</td><td>1</td><td>146</td><td rowspan="2">NR</td><td rowspan="2">NR</td></tr><tr><td>2</td><td>NA</td><td>3.57</td><td>1</td><td>216</td></tr><tr><td rowspan="2">Ser7P</td><td rowspan="2">Ser7P (4E12)</td><td rowspan="2">Rat monoclonal</td><td rowspan="2"><xref ref-type="bibr" rid="bib4">Chapman et al. 
(2007)</xref></td><td rowspan="2">1 × 10<sup>8</sup></td><td rowspan="2">10 µg/100 µl</td><td rowspan="2">5x/1x</td><td>1</td><td>NA</td><td>16.46</td><td>1</td><td>156</td><td rowspan="2">NR</td><td rowspan="2">NR</td></tr><tr><td>2</td><td>NA</td><td>1.92</td><td>1</td><td>226</td></tr><tr><td>Short-RNA-seq</td><td>NR</td><td>NR</td><td>NR</td><td>1 × 10<sup>7</sup></td><td>NR</td><td>NR</td><td>1</td><td>NA</td><td>9.87</td><td>1</td><td>NR</td><td>NR</td><td>NR</td></tr><tr><td>MNase-seq</td><td>NR</td><td>NR</td><td>NR</td><td>2 × 10<sup>7</sup></td><td>NR</td><td>NR</td><td>1</td><td>90.00</td><td>289.60</td><td>1</td><td>152/NR midpoints<xref ref-type="table-fn" rid="tblfn1">**</xref></td><td>NR</td><td>NR</td></tr><tr><td rowspan="4">Input</td><td rowspan="4">NR</td><td rowspan="4">NR</td><td rowspan="4">NR</td><td rowspan="4">NR</td><td rowspan="4">NR</td><td rowspan="4">NR</td><td>1</td><td>20.10</td><td>18.18</td><td>1</td><td>126</td><td rowspan="4">NR</td><td rowspan="4">NR</td></tr><tr><td>2</td><td>NA</td><td>29.74</td><td>1</td><td>146</td></tr><tr><td>3</td><td>15.41</td><td>24.93</td><td>1</td><td>118</td></tr><tr><td>4</td><td>11.20</td><td>28.32</td><td>1</td><td>196</td></tr></tbody></table><table-wrap-foot><fn id="tblfn1"><label>**</label><p>For MNase-seq, the experiment was performed and processed in pair-end. For nucleosome density, tags were not elongated but connected and the indicated sequence average length is withdrawn by our analysis pipeline using the pair-end information. For midpoints analyses, elongation does not apply and data treatment is indicated earlier in ‘Materials and methods–Processing of sequenced tags’.</p></fn></table-wrap-foot></table-wrap></p><sec id="s3-4-1"><title>ChIP-seq</title><p>Briefly, for ChIP-seq experiments, Raji B-cells were directly crosslinked in 25 ml of growth medium. 
Crosslinking was performed with the addition of 1/10th volume of crosslinking solution (11% formaldehyde, 100 mM NaCl, 1 mM EDTA pH 8, 0.5 mM EGTA pH 8, 50 mM Hepes pH 7.8) for a final formaldehyde concentration of 1% for 10 min at room temperature. The reaction was quenched with the addition of 250 mM glycine and incubation at room temperature for 5 min. Cells were washed twice with cold DPBS and counted. All buffers contained EDTA-free protease inhibitor cocktail (Roche, France) and phosphatase inhibitors (Thermo Scientific, France) to final concentration of 1x together with 0.2 mM PMSF and 1 µg/ml pepstatin. 5 × 10<sup>7</sup> cells were then lysed in 2.5 mL LB1 buffer (50 mM Hepes pH 7.5, 140 mM NaCl, 1 mM EDTA pH 8, 10% glycerol, 0.75% NP-40, 0.25% Triton X-100) by incubation at 4°C for 20 min. Nuclei were collected by centrifugation at 1350×<italic>g</italic> and washed in 2.5 ml LB2 (200 mM NaCl, 1 mM EDTA pH 8, 0.5 mM EGTA pH 8, 10 mM Tris pH 8) for 10 min. Nuclei were then centrifuged and resuspended in 1.5 ml of LB3 (1 mM EDTA pH 8, 0.5 mM EGTA pH 8, 10 mM Tris pH 8, 100 mM NaCl, 0.1% Na-Deoxycholate, 0.5% N-lauroylsarcosine) and sonicated using a Misonix 4000 (Misonix Inc, Farmingdale, NY, USA) sonicator for 14 cycles of 30 s ON and 30 s OFF at amplitude of 40. After sonication Triton X-100 was added to 1% final concentration and cellular debris was precipitated by centrifugation at 20000×<italic>g</italic> for 10 min in a refrigerated centrifuge. Aliquots of clear supernatant were transferred to new tubes, snap frozen, and kept at −80°C until use. 50 µl aliquots were taken to serve as input control as well as sonication quality control.</p><p>Inputs were combined with an equal volume of 2x elution buffer (100 mM Tris pH 8, 20 mM EDTA pH 8, 2% SDS) and incubated overnight in a water bath at 65°C for 13–15 hr. 
SDS was then diluted by the addition of an equal volume of TE (10 mM Tris pH 8, 1 mM EDTA pH 8) and RNA was digested by RNase A at a final concentration of 0.2 μg/ml at 37°C for 2 hr. Samples were subsequently Proteinase K treated at 55°C for 2 hr at a final concentration of 0.2 μg/ml. DNA was purified by two subsequent phenol:chloroform:isoamylalcohol (25:24:1, pH 8) extractions and followed by a Qiaquick purification (PCR purification columns, Qiagen, Germany). DNA concentration was measured using a Nanodrop 1000 (Thermo Scientific, France) and 4 ng DNA was analyzed using High Sensitivity DNA chips on a 2100 Bioanalyzer to verify sonication efficiencies.</p><p>All experiments were performed using Dynabeads (Invitrogen, USA) coated with Protein-G. Beads were washed 3x with 1 ml and subsequently resuspended in 250 μl of blocking solution (0.5% BSA in 1x DPBS). After the addition of the antibody, the beads were incubated at 4°C overnight on a rotating wheel. Unbound antibodies were removed through three further washes with 1 ml of blocking solution. Beads were resuspended in 100 μl of blocking solution, chromatin extracts were added, and the mix was incubated overnight at 4°C on a rotating wheel.</p><p>EDTA-free protease inhibitors (Roche) were added to all washing buffers to a final concentration of 1x together with 0.2 mM PMSF and 1 μg/ml pepstatin. Beads were washed 8 times in RIPA buffer (50 mM Hepes pH 7.6, 500 mM LiCl, 1 mM EDTA pH 8, 1% NP-40, 0.7% Na-Deoxycholate) and once in TE+ (10 mM Tris pH 8, 1 mM EDTA pH 8, 50 mM NaCl). Immunoprecipitated chromatin was recovered from the beads with two subsequent elution steps at 65°C for 15 and 10 min in 110 μl and 100 μl of elution buffer (50 mM Tris pH 8, 10 mM EDTA pH 8, 1% SDS), respectively. The two eluates were combined and incubated at 65°C overnight (13–15 hr) for crosslink reversal. 
DNA was purified as described for the input (see <xref ref-type="table" rid="tbl1">Table 1</xref> for a summary of ChIP conditions for each experiment).</p><p>Prior to sequencing, ChIP DNA was quantified using the double-stranded DNA HS kit on a Qubit apparatus (Life Technologies, USA) and 1 ng ChIP DNA was analyzed on a High Sensitivity DNA chip on a 2100 Bioanalyzer (Agilent Technologies, USA). DNA yields were typically between 5 and 100 ng for different antibodies. At least 1 ng of ChIP or input DNA was used for library preparation according to the Illumina ChIP-seq protocol. After end-repair and adapter ligation, fragments were size-selected (cut) on an agarose gel prior to pre-amplification and clustering. The size-selected and pre-amplified fragments were verified on a 2100 Bioanalyzer (Agilent Technologies, USA) before clustering and sequencing on a Genome Analyzer II or HiSeq 2000 (Illumina, USA) according to the manufacturer's instructions.</p></sec><sec id="s3-4-2"><title>MNase-seq</title><p>For sequencing of nucleosomal DNA, 2 × 10<sup>7</sup> cells were resuspended in 50 μl Solution I (150 mM sucrose, 80 mM KCl, 5 mM K<sub>2</sub>HPO<sub>4</sub>, 5 mM MgCl<sub>2</sub>, 0.5 mM CaCl<sub>2</sub>, 35 mM HEPES pH 7.4) and NP-40 was added to a final concentration of 0.2%. Cell membranes were permeabilized for one minute at 37°C. For nucleosomal digestion, 40 U of MNase was added with 0.5 ml of Solution II (150 mM sucrose, 50 mM Tris pH 8, 50 mM NaCl, 2 mM CaCl<sub>2</sub>) and incubated for 30 min at room temperature. The reactions were stopped with the addition of EDTA to a final concentration of 10 mM. The cells were lysed using 1.45 ml of SDS Lysis Buffer (1% SDS, 10 mM EDTA pH 8, 50 mM Tris pH 8), with a 10 min incubation at 4°C. A 200 μl aliquot was taken for purification and the remaining extract was stored at −80°C. 
An equal volume of TE (200 μl) was added to the aliquot, followed by subsequent 2 hr treatments with each 0.2 μg/ml final concentrations of RNase A and Proteinase K at 37°C and 55°C, respectively. DNA was extracted by two subsequent phenol:chloroform:isoamylalcohol (25:24:1) extractions, further purified using QIAquick PCR purification columns (Qiagen, Germany) and eluted in 50 μl of water. The quality of nucleosomal digestion was verified by running 2 ng of DNA on High-Sensitivity 2100 Bioanalyzer chips (Agilent, USA). The typical Bioanalyser profile in our standardized conditions shows a clear peak of mononucleosome at 146 −/+ 5 bp that represents 80% of the nucleosomal DNA (the rest of the digested material spreads essentially in di- and tri-nucleosomal DNA). After library preparation, DNA fragments corresponding to mononucleosomes were cut from an agarose gel and subsequently clustered and sequenced on Genome Analyzer II (Illumina, USA) according to manufacturer's instructions.</p></sec><sec id="s3-4-3"><title>Short strand specific RNA-seq</title><p>Total RNA was extracted from 1 × 10<sup>7</sup> Raji cells using TRIzol (Life Technologies, USA) according to the manufacturer's instructions with some modifications to ensure higher recovery rates of small RNAs. This was achieved by addition of 10 μg of linear acrylamide (Life Technologies, USA) before RNA precipitation. DNA was digested using the rigorous Turbo DNase (Ambion, USA) treatment as per manufacturer's instructions. RNA quantity was measured on a Qubit apparatus (Life Technologies, USA) using RNA assay kit and the quality was verified using RNA pico chips on a 2100 Bioanalyzer (Agilent Technologies, USA).</p><p>Before preparation of sequencing libraries, small RNAs were enriched from 10 µg total RNA by using mirVana RNA Isolation kit (Life Technologies, USA) using manufacturer's protocol for small RNA enrichment. 
The strand-specific RNA-seq library was constructed with the ScriptMiner Small RNA-seq Library Preparation Kit (Epicentre, USA) according to the manufacturer's recommended protocol. Briefly, after both 5′ and 3′ adapter ligation, the resulting cDNA library was PCR amplified with 14 amplification cycles. Purified library DNA was run on a 10% TBE-PAGE gel and library DNA corresponding to transcripts between 15 nt and 50 nt was cut from the gel and transferred into 0.5 ml tubes with punctured bottoms which were in turn placed in 2 ml collection tubes. Gel slices were crushed into 2 ml tubes by a 2 min centrifugation at 14000×<italic>g</italic>. For library DNA elution by soaking, 0.4 ml of 0.3 M NaCl was added to each tube, before a 4 hr rotation at room temperature. After removal of gel particles using 0.22 μm cellulose acetate filters, 10 μg of linear acrylamide (Life Technologies, USA) and 2.5 vol (approximately 1 ml) of ice-cold absolute ethanol were added. After 30 min incubation at −80°C, the eluted cDNA was precipitated by centrifugation at 4°C and maximum speed for 45 min. The pellet was washed with 1 ml of cold 80% ethanol, air dried, and resuspended in 20 μl of water. The size-selected small RNA library DNA was quantified using a Qubit apparatus with dsDNA High Sensitivity kit (Life Technologies, USA) and verified using DNA High Sensitivity 2100 Bioanalyzer chips (Agilent Technologies, USA). The library was clustered and sequenced using 76 cycles on a Genome Analyzer II (Illumina, USA) according to the manufacturer's instructions.</p></sec></sec><sec id="s3-5"><title>Data pre-processing</title><p>Details of the data pre-processing are described in <xref ref-type="bibr" rid="bib10">Fenouil et al. (2012)</xref>.</p><sec id="s3-5-1"><title>Quality control and filtering</title><p>In brief, all samples were sequenced on an Illumina Genome Analyzer (GAIIx for ChIP-seq and RNA-seq, or HiSeq 2000 for MNase-seq and H3K27ac). 
Quality assessment and filtering of ChIP-seq and MNase-seq sequences were performed using either the Integrated Eland software or FASTX-Toolkit (<ext-link ext-link-type="uri" xlink:href="http://hannonlab.cshl.edu/fastx_toolkit/index.html">http://hannonlab.cshl.edu/fastx_toolkit/index.html</ext-link>) to pre-process FastQ files. Quality score and nucleotide composition at each position of the sequenced tags were assessed by box and bar plotting using FASTX-Toolkit standard functions.</p><p>Quality controls (QC) and filtering of RNA samples were performed using FastQC (<ext-link ext-link-type="uri" xlink:href="http://www.bioinformatics.babraham.ac.uk/projects/fastqc/">http://www.bioinformatics.babraham.ac.uk/projects/fastqc/</ext-link>), FASTX-Toolkit, and Cutadapt (<ext-link ext-link-type="uri" xlink:href="http://code.google.com/p/cutadapt/">http://code.google.com/p/cutadapt/</ext-link>). Adapters were removed (Cutadapt) and a QC report was generated (FastQC). Sequences were further trimmed at nucleotide 55 and quality filtered as for DNA samples (FASTX-Toolkit).</p></sec><sec id="s3-5-2"><title>Processing of sequenced tags</title><p>All samples were aligned to the human genome (hg19, GRCh37) using the Bowtie (<xref ref-type="bibr" rid="bib19">Langmead et al., 2009</xref>) aligner (allowing two mismatches, keeping uniquely aligned reads only). The numbers of tags used are shown in <xref ref-type="table" rid="tbl1">Table 1</xref>. For technical replicates, Eland aligned files or BAM files were merged and processed as described in <xref ref-type="bibr" rid="bib10">Fenouil et al. (2012)</xref>. Correlations between biological replicates used in this study are shown in <xref ref-type="fig" rid="fig2s1">Figure 2—figure supplement 1A</xref>. Whenever two replicates did not reach a minimal signal/noise ratio or did not give a reproducible signal, the samples were discarded from the analysis and the experiment was repeated. 
For the processing, briefly, piles of tags with the same coordinates, due to PCR artifacts or unannotated regions of the genome, were removed according to a thresholding method, except for the RNA-seq experiment. Uniquely aligned tags were further elongated after estimating the optimal elongation size <italic>in silico</italic>, making it possible to use the original fragment length for further processing. For ChIP-seq experiments, all samples were input subtracted and signals were scaled. For nucleosome mapping, the MNase-seq experiment in Raji cells was sequenced in paired-end mode on a HiSeq 2000 at a higher depth than the ChIP-seq experiments. Two types of analyses were applied to these data: nucleosome density (<xref ref-type="fig" rid="fig4">Figure 4A</xref>, <xref ref-type="fig" rid="fig3s1">Figure 3—figure supplement 1</xref>) and nucleosome midpoint (<xref ref-type="fig" rid="fig2">Figure 2D</xref>, <xref ref-type="fig" rid="fig3">Figure 3</xref>, <xref ref-type="fig" rid="fig3s1">Figure 3—figure supplement 1</xref>), which allow scoring more specifically for depletion or positioning, respectively. For nucleosome density, paired tags were processed so as to be directly connected and to retrieve original fragments (orphan tags were connected to the corresponding pairs using the estimated elongation size computed as described above). The input subtraction step was omitted. For nucleosome midpoint analyses, the middle of elongated fragments was set as the reference, allowing the maximum signal to be located approximately at the midpoint of the nucleosomes (dyads). For all experiments, the number of tags covering each nucleotide of the genome was computed and averaged in bins of 50 nucleotides and in bins of 10 (<xref ref-type="fig" rid="fig3s2">Figure 3—figure supplement 2C</xref>). The scores of bins were rescaled (after input subtraction when applicable) to reduce over-representation of particular genomic regions and signal/noise ratio. 
Finally, wig files of each corresponding biological replicates were merged.</p></sec></sec><sec id="s3-6"><title>Bioinformatics analysis</title><sec id="s3-6-1"><title>Gene selection and average binding profiles</title><p>Wiggle files scores were retrieved with an in-house R script (<xref ref-type="supplementary-material" rid="SD1-data">Source code 1</xref>) for hg19 Refseq annotations and coordinates defined for selected enhancers and promoters. Overlapping annotations and those being at less than 2000 bp of another were removed. Indeed, keeping genes in vicinity of others could mix different signals leading to misinterpretation. To select Refseq genes with a significant signal, mean values distributions of Pol II isoforms and short ssRNAs at (TSS-1000 bp; TES+2000 bp) (whole gene, <xref ref-type="fig" rid="fig2">Figure 2C,D</xref>, <xref ref-type="fig" rid="fig2s5">Figure 2—figure supplement 5A</xref>, <xref ref-type="fig" rid="fig2s6">Figure 2—figure supplement 6A</xref>) and at TSS −/+500 bp (TSS, <xref ref-type="fig" rid="fig3">Figure 3</xref>, <xref ref-type="fig" rid="fig3s1">Figure 3—figure supplement 1</xref>, <xref ref-type="fig" rid="fig3s2">Figure 3—figure supplement 2</xref>) were plotted using an in-house script (<xref ref-type="fig" rid="fig2s1">Figure 2—figure supplement 1B,C</xref>, <xref ref-type="supplementary-material" rid="SD1-data">Source code 1</xref>). Gene sets of <xref ref-type="fig" rid="fig2">Figure 2</xref> were selected according to each experiment mean distribution except for MNase-seq and RNA-seq whose selections were based on Pol II. For <xref ref-type="fig" rid="fig2s4">Figure 2—figure supplement 4</xref>, a less stringent threshold at 0 was used in order to study phosphorylation patterns of lower bound genes. The set of genes used in <xref ref-type="fig" rid="fig3">Figure 3</xref> were also selected according to levels of Pol II at TSS (<xref ref-type="fig" rid="fig2s1">Figure 2—figure supplement 1C</xref>). 
Based on the distribution, two Gaussian distributions were fitted using the R package mixdist (<ext-link ext-link-type="uri" xlink:href="http://www.math.mcmaster.ca/peter/mix/mix.html">http://www.math.mcmaster.ca/peter/mix/mix.html</ext-link>). The threshold above which a mean value is considered as significant was set to the mean of the second Gaussian distribution. In these analyses, only genes with a length above 2 kb were kept as shorter genes tend to harbor specific profiles not reflecting the majority of coding sequences, for example due to shorter (or lack of) introns. Moreover, histone, rRNA, snomiRNA, snoRNA, snRNA, and tRNA genes as well as outliers of short ssRNAs were removed since they also potentially modify the shapes of average profiles. Finally, a total of 1854 genes was used in <xref ref-type="fig" rid="fig3">Figure 3</xref> (1846 without antisense RNA outliers).</p><p>An in-house R package retrieves the signals of ChIP-seq, RNA-seq, and MNase-seq and centers them at the TSS and transcription end site (TES) for a user-defined selection of genes and intervals. It also retrieves all values inside each annotation, scales them to the same length, and adds half of the values computed around the TSS upstream and around the TES downstream of the annotation to obtain profiles as shown in <xref ref-type="fig" rid="fig2">Figure 2C</xref>. Rescaling and plotting are obtained by interpolating the retrieved values on 1000 points, which makes it possible to build a matrix in which each column is averaged. In <xref ref-type="fig" rid="fig2s6">Figure 2—figure supplement 6A</xref>, the values were further divided into three curves representing average profiles of the top 5%, top 5–20%, and bottom 5% of gene signals.</p></sec><sec id="s3-6-2"><title>Boxplots and statistical tests</title><p>The in-house package mentioned above was used to retrieve values on which means were computed. 
The boxplots of <xref ref-type="fig" rid="fig2">Figure 2E</xref> represent two sets of mean values computed on: the antisense region which was defined as covering 500 bp before TSS and the sense region as covering 500 bp after. The analysis was performed on 3201 genes defined as being the union of the set of genes retrieved for each mark. The outliers defined by the R function ‘boxplot’ by default as being all values above Q3+(1.5 × (Q3−Q1)) (interquartile range) were filtered. The remaining values were scaled between 0 and 1 before plotting. Before performing the parametric two-sided paired sample <italic>t</italic> test (<xref ref-type="supplementary-material" rid="SD1-data">Source code 1</xref>), the normal distribution of data was checked (data not shown). In <xref ref-type="fig" rid="fig2s2">Figure 2—figure supplement 2D</xref>, the same method was used on lowly, medium, and highly expressed genes without scaling between 0 and 1 but instead dividing by the binding values of Pol II.</p><p><xref ref-type="fig" rid="fig2s2">Figure 2—figure supplement 2C</xref> represents mean values computed as mentioned above using only one region −/+500 bp around TSSs without removing outliers and scaling. However, outliers were not represented. The boxplots in <xref ref-type="fig" rid="fig4">Figure 4B</xref>, <xref ref-type="fig" rid="fig4s1">Figure 4—figure supplement 1D</xref>, and <xref ref-type="fig" rid="fig4s3">Figure 4—figure supplement 3C,D</xref> were computed similarly and divided by the corresponding mean values of Pol II. 
No mean values of Pol II equal to zero were detected.</p></sec><sec id="s3-6-3"><title>Tyr1P peak sorting and corresponding clusters</title><p>For Tyr1P sorting (<xref ref-type="fig" rid="fig3">Figure 3</xref>, <xref ref-type="fig" rid="fig3s1">Figure 3—figure supplement 1</xref>), an in-house script (<xref ref-type="supplementary-material" rid="SD1-data">Source code 1</xref>) was used as described previously in <xref ref-type="bibr" rid="bib10">Fenouil et al. (2012)</xref>. Briefly, taking the genes selected as having a significant level of Pol II, genes were ordered according to the relative increasing distance to the TSS of the maximal peak of Tyr1P. Other clusters show the corresponding signal of Pol II, Ser5P, Ser7P, nucleosomes, and short ssRNAs on the same genes. Heatmaps were formatted in terms of color and contrast according to sample read depth using Java TreeView software (<xref ref-type="bibr" rid="bib25">Saldanha, 2004</xref>).</p></sec><sec id="s3-6-4"><title>Definition of AT/GC content and density map</title><p>The AT content defines the presence of A or T in a particular sequence. Similarly, the GC content defines the presence of G or C in a given sequence.</p><p>The heatmaps of <xref ref-type="fig" rid="fig3s1">Figure 3—figure supplement 1A</xref> (AT and GC content) were built as follows: The corresponding FASTA sequences of genes used in <xref ref-type="fig" rid="fig3">Figure 3</xref> were retrieved with the R package ChIPpeakAnno (<xref ref-type="bibr" rid="bib29">Zhu et al., 2010</xref>) in association with the Bioconductor package BSgenome.Hsapiens.UCSC.hg19 (<ext-link ext-link-type="uri" xlink:href="http://www.bioconductor.org/packages/2.12/data/annotation/html/BSgenome.Hsapiens.UCSC.hg19.html">http://www.bioconductor.org/packages/2.12/data/annotation/html/BSgenome.Hsapiens.UCSC.hg19.html</ext-link>). 
The command-line RSAT tools (<xref ref-type="bibr" rid="bib28">Turatsinze et al., 2008</xref>) were used to retrieve the motifs W (A or T) and S (G or C) from those sequences. With an in-house script (<xref ref-type="supplementary-material" rid="SD1-data">Source code 1</xref>), the positions of motifs were converted to GFF-formatted files taking into account the positions of Refseq hg19 annotations. Finally, another in-house script (<xref ref-type="supplementary-material" rid="SD1-data">Source code 1</xref>) converted those GFF files to a binary matrix that was output in a format readable by Java TreeView software. This software was used as described above for color scaling.</p></sec><sec id="s3-6-5"><title>Correlation of biological replicates and cross-correlation</title><p>In <xref ref-type="fig" rid="fig4">Figure 4D</xref>, mean values used for Spearman correlation were retrieved on selected enhancer regions (±2000 bp around Pol II ChIP-seq maximal signal). In <xref ref-type="fig" rid="fig2s1">Figure 2—figure supplement 1</xref>, each point represents the mean value of ChIP-seq signal of a gene on interval [TSS−1000 bp;3′+1000 bp]. For <xref ref-type="fig" rid="fig4s3">Figure 4—figure supplement 3</xref>, cross-correlations were computed ±500 bp around H3K4me3 ChIP-seq maximal signal. Finally, for <xref ref-type="fig" rid="fig2s6">Figure 2—figure supplement 6B</xref>, from left to right, Spearman correlations were computed on mean values at [TSS−500 bp;TSS+500 bp], [TSS+1000 bp;3′−500 bp], and [3′−500 bp;3′+1000 bp], respectively. 
The scripts for generating the correlations of biological replicates and tables of cross-correlation are available in <xref ref-type="supplementary-material" rid="SD1-data">Source code 1</xref>.</p></sec><sec id="s3-6-6"><title>Selection of enhancers and promoters using Pol II</title><p>For the analyses shown in <xref ref-type="fig" rid="fig4">Figure 4</xref> and <xref ref-type="fig" rid="fig4s1">Figure 4—figure supplement 1</xref> (scripts and procedure to detect enhancers and promoters can be found in <xref ref-type="supplementary-material" rid="SD1-data">Source code 1</xref>), wiggle files of ChIP-seq signals of Pol II, H3K4me1, H3K4me3, and H3K36me3 were analyzed to extract enriched regions at control promoters and putative intergenic enhancers. The peak-calling was performed using an in-house script (<xref ref-type="supplementary-material" rid="SD1-data">Source code 1</xref>) fixing a threshold based on the peak height and the gap between two adjacent signals. Enriched regions separated by a distance less than a fixed max gap were merged (chosen values of thresholds and max gap are summarized in <xref ref-type="table" rid="tbl1">Table 1</xref>). Regions showing a combined enrichment of Pol II, H3K4me1, and H3K4me3 signal were further identified as regions of interest to build control promoters and putative intergenic enhancer sets (<xref ref-type="fig" rid="fig4s1">Figure 4—figure supplement 1A–E1P1</xref>). When a region intersected a gene annotation on the interval [TSS−2000; TSS+1000], it was defined as a ‘promoter region’ (6073 regions). 
To refine enhancer selection and to avoid lincRNA promoter regions (<xref ref-type="bibr" rid="bib12">Guttman et al., 2009</xref>; <xref ref-type="bibr" rid="bib22">Natoli and Andrau, 2012</xref>), we removed the regions located at less than 5000 bp from any hg19 Refseq gene and harboring a significant H3K36me3 signal enrichment in the vicinity, that is, less than 2000 bp from their boundaries (747 regions, <xref ref-type="fig" rid="fig4s1">Figure 4—figure supplement 1A–E2</xref>). We further used the H3K4me3/me1 ratio to define final enhancer and promoter selections (<xref ref-type="bibr" rid="bib23">Pekowska et al., 2011</xref>; <xref ref-type="bibr" rid="bib7">de Almeida et al., 2011</xref>; <xref ref-type="bibr" rid="bib20">Li et al., 2012</xref>; <xref ref-type="bibr" rid="bib22">Natoli and Andrau, 2012</xref>). Means and relative ratios of ChIP-seq signal of H3K4me1 and H3K4me3 on intergenic enhancer candidates, on promoter candidates, and on corresponding annotated hg19 Refseq promoters (extended by ±1000 bp) were computed (<xref ref-type="fig" rid="fig4s1">Figure 4—figure supplement 1B</xref>). A threshold (green dashed line, <xref ref-type="fig" rid="fig4s1">Figure 4—figure supplement 1B</xref>) was defined to remove intergenic enhancer candidate regions with an H3K4 methylation ratio signature similar to promoters (ratio above the threshold), leading to a selection of enhancers (422 regions, <xref ref-type="fig" rid="fig4s1">Figure 4—figure supplement 1A–E3</xref>). Similarly, promoter candidates with an H3K4me3 over H3K4me1 ratio below the fixed threshold were removed from the selection (5812 regions remaining, <xref ref-type="fig" rid="fig4s1">Figure 4—figure supplement 1A–P2</xref>).</p><p>In the identified promoter and enhancer sets, the location of maximal signal of Pol II was defined as the center of the region. Finally, mean values of short ssRNA signal were computed on each promoter and enhancer at centers of the regions ± 2000 bp around Pol II peak. 
The enhancers and promoters with outlying values were filtered from selections (390 enhancers and 4618 promoters remaining, <xref ref-type="fig" rid="fig4s1">Figure 4—figure supplement 1A–E4P3</xref>). Note that using Pol II as a docking site for these analyses typically yields a rather strong nucleosome density at the middle of the promoter/enhancer area (<xref ref-type="fig" rid="fig4">Figure 4A</xref>). Different results can be obtained (lower nucleosome densities) when TBP is used as a docking site (<xref ref-type="bibr" rid="bib7">de Almeida et al., 2011</xref>).</p></sec><sec id="s3-6-7"><title>Selection of active enhancers and promoters using H3K27ac</title><p>Similarly to the previous section (see also <xref ref-type="supplementary-material" rid="SD1-data">Source code 1</xref>), enhancers and promoters were selected using detected peaks of H3K4me1, H3K4me3, H3K36me3, and H3K27ac (<xref ref-type="fig" rid="fig4s3">Figure 4—figure supplement 3A</xref>). This selection enables distinguishing active enhancers and promoters (having an overlapping peak of H3K27ac) from the whole selection (based on H3K4me1/3 that includes less active or poised enhancers). Although Pol II was described to be a hallmark of active and tissue-specific enhancers (<xref ref-type="bibr" rid="bib18">Koch et al., 2011</xref>), the procedure described below retrieved a higher number of enhancers (2598; 927 active) and promoters (6057; 5946 active), giving a less stringent description of these genomic modules.</p><p>Regions harboring H3K4me1 and H3K4me3 were first split into intergenic regions without H3K36me3 (E2′, 3404) and promoter regions (P1′, 8201). Using the ratio H3K4me1/H3K4me3, 2789 enhancers (E3′) and 7147 promoters (P2′) were kept. Performing H3K27ac overlap on the above isolated regions yields 1045 active enhancers and 7030 active promoters. 
Regions were centered on H3K4me3 maximal values; discarding regions with short RNA outliers finally gives active enhancers and control promoters (E5′/P5′, 927/5946) and a whole set of enhancers and control promoters (E6′/P6′, 2598/6057).</p></sec><sec id="s3-6-8"><title>Tissue specificity analysis</title><p>To assess the tissue specificity of genes associated with identified enhancers and promoters of <xref ref-type="fig" rid="fig4">Figure 4</xref> (<xref ref-type="fig" rid="fig4s1">Figure 4—figure supplement 1E</xref>) and <xref ref-type="fig" rid="fig4s3">Figure 4—figure supplement 3C,D</xref>, we proceeded as in <xref ref-type="bibr" rid="bib18">Koch et al. (2011)</xref>. Briefly, using the bioGPS website (<ext-link ext-link-type="uri" xlink:href="http://biogps.org/#goto=welcome">http://biogps.org/#goto=welcome</ext-link>), a Gene Atlas averaged dataset of expression values based on HGU133 array for human containing 84 tissues (<xref ref-type="bibr" rid="bib27">Su et al., 2004</xref>) was used. The expression values of genes nearest to selected enhancers and promoters were compared to the whole dataset and the significance of differences was assessed with a nonparametric statistical Mann-Whitney-Wilcoxon test. Bars of expression levels were sorted by p-values and the 10 most differentially expressed tissues are shown. Scripts generating the tissue specificity barplots are available in <xref ref-type="supplementary-material" rid="SD1-data">Source code 1</xref>.</p></sec><sec id="s3-6-9"><title>Gene expression analysis</title><p>Microarray expression data for the human Raji cell line were retrieved from the ArrayExpress database (E-GEOD-46873). Corresponding symbols between array chip and human hg19 Refseq annotations were downloaded from Ensembl Biomart (Release 73, <xref ref-type="bibr" rid="bib11">Flicek et al., 2013</xref>).</p><p>Replicates were merged by taking the mean of expression. 
When several probes indicated expression of a single Refseq gene, the median of expression was attributed to the corresponding Refseq ID. Refseq genes were then ordered by expression removing genes at less than 2 kb from another and particular categories of genes were removed as described in ‘Materials and methods–Gene selection and average binding profiles’. Corresponding ChIP-seq and short ssRNA-seq signals were retrieved on the ordered genes and represented with heatmaps at 1 kb around TSS (<xref ref-type="fig" rid="fig2s2">Figure 2—figure supplement 2</xref>). For profiles shown in <xref ref-type="fig" rid="fig2s2">Figure 2—figure supplement 2B</xref>, outliers were discarded. As mentioned above, colors were scaled using Java Treeview software. Profiles (<xref ref-type="fig" rid="fig2s2">Figure 2—figure supplement 2B</xref>) and boxplots (<xref ref-type="fig" rid="fig2s2">Figure 2—figure supplement 2CD</xref>) were built as described in ‘Materials and methods–Gene selection and average binding profiles and Boxplots and statistical tests’. Input files and scripts used can be found in <xref ref-type="supplementary-material" rid="SD1-data">Source code 1</xref>.</p></sec><sec id="s3-6-10"><title>CTD isoforms and nucleosomes midpoint maximal peaks spatial organization analysis</title><p>Binary matrices of 2000 interpolated ChIP-seq values shown in <xref ref-type="fig" rid="fig3">Figure 3A</xref> and <xref ref-type="fig" rid="fig3s1">Figure 3—figure supplement 1A</xref> in Java Treeview format were used as input. They were reduced to values at ± 500 bp around TSS and the list of genes limited to group 1. Maximal value indexes of Tyr1P signal were first retrieved. To avoid ambiguities in interpretation in our relative Pol II and isoforms positions in class I (<xref ref-type="fig" rid="fig3s2">Figure 3—figure supplement 2</xref>), we analyzed those genes that belonged to class I and that clearly featured AS transcription. 
For this, mean values of short ssRNA experiments were computed at −50/+100 bp around Tyr1P detected maximal peaks. Genes having a significant level of antisense RNAs were kept using the mean distribution and thresholding as described in ‘Materials and methods–Gene selection and average binding profiles’. Only annotations with a level of antisense RNAs higher than sense RNAs were kept, as determined by a one-sided nonparametric Mann-Whitney-Wilcoxon statistical test (p-value &lt;0.05). A total of 529 genes were selected. Then, maximal peak detection for the other marks was performed at −100/+100 bp around Tyr1P signal. For each maximal peak of each experiment shown in <xref ref-type="fig" rid="fig3s2">Figure 3—figure supplement 2</xref>, the distances to maximal peaks of Tyr1P and Pol II were computed. The R package rgl (<ext-link ext-link-type="uri" xlink:href="http://rgl.neoscientists.org/about.shtml">http://rgl.neoscientists.org/about.shtml</ext-link>) was used for 3D representation of the maximal peaks according to the distance to TSS, to Pol II and their values.</p><p>To assess whether the retrieved distances did not originate from background noise (<xref ref-type="fig" rid="fig3s2">Figure 3—figure supplement 2C</xref>), distances to Pol II of selected genes of (A) on 500 bp before TSS (representing the AS region) were compared to the total set of genes (keeping only genes at more than 2000 bp from any RefSeq annotations). Kernel density estimates were computed using R. A finer resolution of 10 bp was used (compared to 50 bp in <xref ref-type="fig" rid="fig3s2">Figure 3—figure supplement 2A,B</xref>). 
Scripts and procedures to generate figures of the spatial analysis can be found in <xref ref-type="supplementary-material" rid="SD1-data">Source code 1</xref>.</p></sec></sec></sec></body><back><ack id="ack"><title>Acknowledgements</title><p>Members of Jean-Christophe Andrau's lab were supported by grants from ANR (Muhammad Ahmad Maqbool, Lionel Spinelli), CNRS (Romain Fenouil), FRM (Charlène Innocenti), Ministère de la Recherche (Nicolas Descostes) and Ligue Nationale contre le Cancer (Nicolas Descostes). Work in Dirk Eick's lab was supported by Deutsche Forschungsgemeinschaft Grants SFB1064 and SFB684. We thank Salvatore Spicuglia for suggestions on the manuscript. We thank Jim Manley and colleagues for communicating their manuscript prior to submission. We also thank Pierre Ferrier for his advice and support.</p><p>Data accession</p><p>Data reported in this paper can be found in the Gene Expression Omnibus database under the accession number GSE52914.</p></ack><sec sec-type="additional-information"><title>Additional information</title><fn-group content-type="competing-interest"><title>Competing interests</title><fn fn-type="conflict" id="conf1"><p>The authors declare that no competing interests exist.</p></fn></fn-group><fn-group content-type="author-contribution"><title>Author contributions</title><fn fn-type="con" id="con1"><p>ND, Performed bioinformatic analyses, Conception and design, Analysis and interpretation of data, Drafting or revising the article, Contributed unpublished essential data or reagents</p></fn><fn fn-type="con" id="con2"><p>MH, Involved in antibody generation and biochemical characterization, Conception and design, Acquisition of data, Drafting or revising the article, Contributed unpublished essential data or reagents</p></fn><fn fn-type="con" id="con3"><p>LS, Performed bioinformatic analyses, Analysis and interpretation of data, Drafting or revising the article</p></fn><fn fn-type="con" id="con4"><p>RS, Involved in antibody generation and 
biochemical characterization, Acquisition of data, Drafting or revising the article</p></fn><fn fn-type="con" id="con5"><p>MAM, Performed genome-wide experiments, Conception and design, Acquisition of data, Drafting or revising the article, Contributed unpublished essential data or reagents</p></fn><fn fn-type="con" id="con6"><p>RF, Performed bioinformatic analyses, Analysis and interpretation of data, Drafting or revising the article, Contributed unpublished essential data or reagents</p></fn><fn fn-type="con" id="con7"><p>FK, Performed genome-wide experiments, Acquisition of data, Drafting or revising the article, Contributed unpublished essential data or reagents</p></fn><fn fn-type="con" id="con8"><p>CI, Performed genome-wide experiments</p></fn><fn fn-type="con" id="con9"><p>MG, Performed sequencing at the CNAG platform, Acquisition of data</p></fn><fn fn-type="con" id="con10"><p>IG, Performed sequencing at the CNAG platform, Acquisition of data</p></fn><fn fn-type="con" id="con11"><p>DE, Conception and design, Acquisition of data, Analysis and interpretation of data, Drafting or revising the article, Contributed unpublished essential data or reagents</p></fn><fn fn-type="con" id="con12"><p>J-CA, Conception and design, Acquisition of data, Analysis and interpretation of data, Drafting or revising the article, Contributed unpublished essential data or reagents</p></fn></fn-group></sec><sec sec-type="supplementary-material"><title>Additional files</title><supplementary-material id="SD1-data"><object-id pub-id-type="doi">10.7554/eLife.02105.022</object-id><label>Source code 1.</label><caption><p>Folder containing the different scripts used in this study.</p><p><bold>DOI:</bold> <ext-link ext-link-type="doi" xlink:href="10.7554/eLife.02105.022">http://dx.doi.org/10.7554/eLife.02105.022</ext-link></p></caption><media mime-subtype="tar.gz" mimetype="application" xlink:href="elife02105s001.tar.gz"/></supplementary-material><sec sec-type="datasets"><title>Major 
datasets</title><p>The following datasets were generated:</p><p><related-object content-type="generated-dataset" document-id="Dataset ID and/or url" document-id-type="dataset" document-type="data" id="dataro1"><name><surname>Descostes</surname><given-names>N</given-names></name>, <name><surname>Heidemann</surname><given-names>M</given-names></name>, <name><surname>Spinelli</surname><given-names>L</given-names></name>, <name><surname>Schüller</surname><given-names>R</given-names></name>, <name><surname>Maqbool</surname><given-names>MA</given-names></name>, <name><surname>Fenouil</surname><given-names>R</given-names></name>, <name><surname>Koch</surname><given-names>F</given-names></name>, <name><surname>Innocenti</surname><given-names>C</given-names></name>, <name><surname>Gut</surname><given-names>M</given-names></name>, <name><surname>Gut</surname><given-names>I</given-names></name>, <name><surname>Eick</surname><given-names>D</given-names></name>, <name><surname>Andrau</surname><given-names>J</given-names></name>, <year>2014</year><x>, </x><source>Pol II</source><x>, </x><ext-link ext-link-type="uri" xlink:href="http://www.ncbi.nlm.nih.gov/geo/query/acc.cgi?acc=GSE52914">http://www.ncbi.nlm.nih.gov/geo/query/acc.cgi?acc=GSE52914</ext-link><x>, </x><comment>Publicly available at NCBI Gene Expression Omnibus.</comment></related-object></p><p><related-object content-type="generated-dataset" document-id="Dataset ID and/or url" document-id-type="dataset" document-type="data" id="dataro2"><name><surname>Descostes</surname><given-names>N</given-names></name>, <name><surname>Heidemann</surname><given-names>M</given-names></name>, <name><surname>Spinelli</surname><given-names>L</given-names></name>, <name><surname>Schüller</surname><given-names>R</given-names></name>, <name><surname>Maqbool</surname><given-names>MA</given-names></name>, <name><surname>Fenouil</surname><given-names>R</given-names></name>, <name><surname>Koch</surname><given-names>F</given-names></name>, 
<name><surname>Innocenti</surname><given-names>C</given-names></name>, <name><surname>Gut</surname><given-names>M</given-names></name>, <name><surname>Gut</surname><given-names>I</given-names></name>, <name><surname>Eick</surname><given-names>D</given-names></name>, <name><surname>Andrau</surname><given-names>J</given-names></name>, <year>2014</year><x>, </x><source>H3K4me1</source><x>, </x><ext-link ext-link-type="uri" xlink:href="http://www.ncbi.nlm.nih.gov/geo/query/acc.cgi?acc=GSE52914">http://www.ncbi.nlm.nih.gov/geo/query/acc.cgi?acc=GSE52914</ext-link><x>, </x><comment>Publicly available at NCBI Gene Expression Omnibus.</comment></related-object></p><p><related-object content-type="generated-dataset" document-id="Dataset ID and/or url" document-id-type="dataset" document-type="data" id="dataro3"><name><surname>Descostes</surname><given-names>N</given-names></name>, <name><surname>Heidemann</surname><given-names>M</given-names></name>, <name><surname>Spinelli</surname><given-names>L</given-names></name>, <name><surname>Schüller</surname><given-names>R</given-names></name>, <name><surname>Maqbool</surname><given-names>MA</given-names></name>, <name><surname>Fenouil</surname><given-names>R</given-names></name>, <name><surname>Koch</surname><given-names>F</given-names></name>, <name><surname>Innocenti</surname><given-names>C</given-names></name>, <name><surname>Gut</surname><given-names>M</given-names></name>, <name><surname>Gut</surname><given-names>I</given-names></name>, <name><surname>Eick</surname><given-names>D</given-names></name>, <name><surname>Andrau</surname><given-names>J</given-names></name>, <year>2014</year><x>, </x><source>H3K4me3</source><x>, </x><ext-link ext-link-type="uri" xlink:href="http://www.ncbi.nlm.nih.gov/geo/query/acc.cgi?acc=GSE52914">http://www.ncbi.nlm.nih.gov/geo/query/acc.cgi?acc=GSE52914</ext-link><x>, </x><comment>Publicly available at NCBI Gene Expression Omnibus.</comment></related-object></p><p><related-object 
content-type="generated-dataset" document-id="Dataset ID and/or url" document-id-type="dataset" document-type="data" id="dataro4"><name><surname>Descostes</surname><given-names>N</given-names></name>, <name><surname>Heidemann</surname><given-names>M</given-names></name>, <name><surname>Spinelli</surname><given-names>L</given-names></name>, <name><surname>Schüller</surname><given-names>R</given-names></name>, <name><surname>Maqbool</surname><given-names>MA</given-names></name>, <name><surname>Fenouil</surname><given-names>R</given-names></name>, <name><surname>Koch</surname><given-names>F</given-names></name>, <name><surname>Innocenti</surname><given-names>C</given-names></name>, <name><surname>Gut</surname><given-names>M</given-names></name>, <name><surname>Gut</surname><given-names>I</given-names></name>, <name><surname>Eick</surname><given-names>D</given-names></name>, <name><surname>Andrau</surname><given-names>J</given-names></name>, <year>2014</year><x>, </x><source>H3K36me3</source><x>, </x><ext-link ext-link-type="uri" xlink:href="http://www.ncbi.nlm.nih.gov/geo/query/acc.cgi?acc=GSE52914">http://www.ncbi.nlm.nih.gov/geo/query/acc.cgi?acc=GSE52914</ext-link><x>, </x><comment>Publicly available at NCBI Gene Expression Omnibus.</comment></related-object></p><p><related-object content-type="generated-dataset" document-id="Dataset ID and/or url" document-id-type="dataset" document-type="data" id="dataro5"><name><surname>Descostes</surname><given-names>N</given-names></name>, <name><surname>Heidemann</surname><given-names>M</given-names></name>, <name><surname>Spinelli</surname><given-names>L</given-names></name>, <name><surname>Schüller</surname><given-names>R</given-names></name>, <name><surname>Maqbool</surname><given-names>MA</given-names></name>, <name><surname>Fenouil</surname><given-names>R</given-names></name>, <name><surname>Koch</surname><given-names>F</given-names></name>, <name><surname>Innocenti</surname><given-names>C</given-names></name>, 
<name><surname>Gut</surname><given-names>M</given-names></name>, <name><surname>Gut</surname><given-names>I</given-names></name>, <name><surname>Eick</surname><given-names>D</given-names></name>, <name><surname>Andrau</surname><given-names>J</given-names></name>, <year>2014</year><x>, </x><source>H3K27ac</source><x>, </x><ext-link ext-link-type="uri" xlink:href="http://www.ncbi.nlm.nih.gov/geo/query/acc.cgi?acc=GSE52914">http://www.ncbi.nlm.nih.gov/geo/query/acc.cgi?acc=GSE52914</ext-link><x>, </x><comment>Publicly available at NCBI Gene Expression Omnibus.</comment></related-object></p><p><related-object content-type="generated-dataset" document-id="Dataset ID and/or url" document-id-type="dataset" document-type="data" id="dataro6"><name><surname>Descostes</surname><given-names>N</given-names></name>, <name><surname>Heidemann</surname><given-names>M</given-names></name>, <name><surname>Spinelli</surname><given-names>L</given-names></name>, <name><surname>Schüller</surname><given-names>R</given-names></name>, <name><surname>Maqbool</surname><given-names>MA</given-names></name>, <name><surname>Fenouil</surname><given-names>R</given-names></name>, <name><surname>Koch</surname><given-names>F</given-names></name>, <name><surname>Innocenti</surname><given-names>C</given-names></name>, <name><surname>Gut</surname><given-names>M</given-names></name>, <name><surname>Gut</surname><given-names>I</given-names></name>, <name><surname>Eick</surname><given-names>D</given-names></name>, <name><surname>Andrau</surname><given-names>J</given-names></name>, <year>2014</year><x>, </x><source>Tyr1P</source><x>, </x><ext-link ext-link-type="uri" xlink:href="http://www.ncbi.nlm.nih.gov/geo/query/acc.cgi?acc=GSE52914">http://www.ncbi.nlm.nih.gov/geo/query/acc.cgi?acc=GSE52914</ext-link><x>, </x><comment>Publicly available at NCBI Gene Expression Omnibus.</comment></related-object></p><p><related-object content-type="generated-dataset" document-id="Dataset ID and/or url" 
document-id-type="dataset" document-type="data" id="dataro7"><name><surname>Descostes</surname><given-names>N</given-names></name>, <name><surname>Heidemann</surname><given-names>M</given-names></name>, <name><surname>Spinelli</surname><given-names>L</given-names></name>, <name><surname>Schüller</surname><given-names>R</given-names></name>, <name><surname>Maqbool</surname><given-names>MA</given-names></name>, <name><surname>Fenouil</surname><given-names>R</given-names></name>, <name><surname>Koch</surname><given-names>F</given-names></name>, <name><surname>Innocenti</surname><given-names>C</given-names></name>, <name><surname>Gut</surname><given-names>M</given-names></name>, <name><surname>Gut</surname><given-names>I</given-names></name>, <name><surname>Eick</surname><given-names>D</given-names></name>, <name><surname>Andrau</surname><given-names>J</given-names></name>, <year>2014</year><x>, </x><source>Ser2P</source><x>, </x><ext-link ext-link-type="uri" xlink:href="http://www.ncbi.nlm.nih.gov/geo/query/acc.cgi?acc=GSE52914">http://www.ncbi.nlm.nih.gov/geo/query/acc.cgi?acc=GSE52914</ext-link><x>, </x><comment>Publicly available at NCBI Gene Expression Omnibus.</comment></related-object></p><p><related-object content-type="generated-dataset" document-id="Dataset ID and/or url" document-id-type="dataset" document-type="data" id="dataro8"><name><surname>Descostes</surname><given-names>N</given-names></name>, <name><surname>Heidemann</surname><given-names>M</given-names></name>, <name><surname>Spinelli</surname><given-names>L</given-names></name>, <name><surname>Schüller</surname><given-names>R</given-names></name>, <name><surname>Maqbool</surname><given-names>MA</given-names></name>, <name><surname>Fenouil</surname><given-names>R</given-names></name>, <name><surname>Koch</surname><given-names>F</given-names></name>, <name><surname>Innocenti</surname><given-names>C</given-names></name>, <name><surname>Gut</surname><given-names>M</given-names></name>, 
<name><surname>Gut</surname><given-names>I</given-names></name>, <name><surname>Eick</surname><given-names>D</given-names></name>, <name><surname>Andrau</surname><given-names>J</given-names></name>, <year>2014</year><x>, </x><source>Ser5P</source><x>, </x><ext-link ext-link-type="uri" xlink:href="http://www.ncbi.nlm.nih.gov/geo/query/acc.cgi?acc=GSE52914">http://www.ncbi.nlm.nih.gov/geo/query/acc.cgi?acc=GSE52914</ext-link><x>, </x><comment>Publicly available at NCBI Gene Expression Omnibus.</comment></related-object></p><p><related-object content-type="generated-dataset" document-id="Dataset ID and/or url" document-id-type="dataset" document-type="data" id="dataro9"><name><surname>Descostes</surname><given-names>N</given-names></name>, <name><surname>Heidemann</surname><given-names>M</given-names></name>, <name><surname>Spinelli</surname><given-names>L</given-names></name>, <name><surname>Schüller</surname><given-names>R</given-names></name>, <name><surname>Maqbool</surname><given-names>MA</given-names></name>, <name><surname>Fenouil</surname><given-names>R</given-names></name>, <name><surname>Koch</surname><given-names>F</given-names></name>, <name><surname>Innocenti</surname><given-names>C</given-names></name>, <name><surname>Gut</surname><given-names>M</given-names></name>, <name><surname>Gut</surname><given-names>I</given-names></name>, <name><surname>Eick</surname><given-names>D</given-names></name>, <name><surname>Andrau</surname><given-names>J</given-names></name>, <year>2014</year><x>, </x><source>Ser7P</source><x>, </x><ext-link ext-link-type="uri" xlink:href="http://www.ncbi.nlm.nih.gov/geo/query/acc.cgi?acc=GSE52914">http://www.ncbi.nlm.nih.gov/geo/query/acc.cgi?acc=GSE52914</ext-link><x>, </x><comment>Publicly available at NCBI Gene Expression Omnibus.</comment></related-object></p><p><related-object content-type="generated-dataset" document-id="Dataset ID and/or url" document-id-type="dataset" document-type="data" 
id="dataro10"><name><surname>Descostes</surname><given-names>N</given-names></name>, <name><surname>Heidemann</surname><given-names>M</given-names></name>, <name><surname>Spinelli</surname><given-names>L</given-names></name>, <name><surname>Schüller</surname><given-names>R</given-names></name>, <name><surname>Maqbool</surname><given-names>MA</given-names></name>, <name><surname>Fenouil</surname><given-names>R</given-names></name>, <name><surname>Koch</surname><given-names>F</given-names></name>, <name><surname>Innocenti</surname><given-names>C</given-names></name>, <name><surname>Gut</surname><given-names>M</given-names></name>, <name><surname>Gut</surname><given-names>I</given-names></name>, <name><surname>Eick</surname><given-names>D</given-names></name>, <name><surname>Andrau</surname><given-names>J</given-names></name>, <year>2014</year><x>, </x><source>short RNAs</source><x>, </x><ext-link ext-link-type="uri" xlink:href="http://www.ncbi.nlm.nih.gov/geo/query/acc.cgi?acc=GSE52914">http://www.ncbi.nlm.nih.gov/geo/query/acc.cgi?acc=GSE52914</ext-link><x>, </x><comment>Publicly available at NCBI Gene Expression Omnibus.</comment></related-object></p><p><related-object content-type="generated-dataset" document-id="Dataset ID and/or url" document-id-type="dataset" document-type="data" id="dataro11"><name><surname>Descostes</surname><given-names>N</given-names></name>, <name><surname>Heidemann</surname><given-names>M</given-names></name>, <name><surname>Spinelli</surname><given-names>L</given-names></name>, <name><surname>Schüller</surname><given-names>R</given-names></name>, <name><surname>Maqbool</surname><given-names>MA</given-names></name>, <name><surname>Fenouil</surname><given-names>R</given-names></name>, <name><surname>Koch</surname><given-names>F</given-names></name>, <name><surname>Innocenti</surname><given-names>C</given-names></name>, <name><surname>Gut</surname><given-names>M</given-names></name>, 
<name><surname>Gut</surname><given-names>I</given-names></name>, <name><surname>Eick</surname><given-names>D</given-names></name>, <name><surname>Andrau</surname><given-names>J</given-names></name>, <year>2014</year><x>, </x><source>MNase</source><x>, </x><ext-link ext-link-type="uri" xlink:href="http://www.ncbi.nlm.nih.gov/geo/query/acc.cgi?acc=GSE52914">http://www.ncbi.nlm.nih.gov/geo/query/acc.cgi?acc=GSE52914</ext-link><x>, </x><comment>Publicly available at NCBI Gene Expression Omnibus.</comment></related-object></p><p><related-object content-type="generated-dataset" document-id="Dataset ID and/or url" document-id-type="dataset" document-type="data" id="dataro12"><name><surname>Descostes</surname><given-names>N</given-names></name>, <name><surname>Heidemann</surname><given-names>M</given-names></name>, <name><surname>Spinelli</surname><given-names>L</given-names></name>, <name><surname>Schüller</surname><given-names>R</given-names></name>, <name><surname>Maqbool</surname><given-names>MA</given-names></name>, <name><surname>Fenouil</surname><given-names>R</given-names></name>, <name><surname>Koch</surname><given-names>F</given-names></name>, <name><surname>Innocenti</surname><given-names>C</given-names></name>, <name><surname>Gut</surname><given-names>M</given-names></name>, <name><surname>Gut</surname><given-names>I</given-names></name>, <name><surname>Eick</surname><given-names>D</given-names></name>, <name><surname>Andrau</surname><given-names>J</given-names></name>, <year>2014</year><x>, </x><source>input</source><x>, </x><ext-link ext-link-type="uri" xlink:href="http://www.ncbi.nlm.nih.gov/geo/query/acc.cgi?acc=GSE52914">http://www.ncbi.nlm.nih.gov/geo/query/acc.cgi?acc=GSE52914</ext-link><x>, </x><comment>Publicly available at NCBI Gene Expression Omnibus.</comment></related-object></p></sec></sec><ref-list><title>References</title><ref id="bib1"><element-citation publication-type="journal"><person-group 
person-group-type="author"><name><surname>Andersen</surname><given-names>PR</given-names></name><name><surname>Domanski</surname><given-names>M</given-names></name><name><surname>Kristiansen</surname><given-names>MS</given-names></name><name><surname>Storvall</surname><given-names>H</given-names></name><name><surname>Ntini</surname><given-names>E</given-names></name><name><surname>Verheggen</surname><given-names>C</given-names></name><name><surname>Schein</surname><given-names>A</given-names></name><name><surname>Bunkenborg</surname><given-names>J</given-names></name><name><surname>Poser</surname><given-names>I</given-names></name><name><surname>Hallais</surname><given-names>M</given-names></name><name><surname>Sandberg</surname><given-names>R</given-names></name><name><surname>Hyman</surname><given-names>A</given-names></name><name><surname>LaCava</surname><given-names>J</given-names></name><name><surname>Rout</surname><given-names>MP</given-names></name><name><surname>Andersen</surname><given-names>JS</given-names></name><name><surname>Bertrand</surname><given-names>E</given-names></name><name><surname>Jensen</surname><given-names>TH</given-names></name></person-group><year>2013</year><article-title>The human cap-binding complex is functionally connected to the nuclear RNA exosome</article-title><source>Nature Structural &amp; Molecular Biology</source><volume>20</volume><fpage>1367</fpage><lpage>1376</lpage><pub-id pub-id-type="doi">10.1038/nsmb.2703</pub-id></element-citation></ref><ref id="bib2"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Buratowski</surname><given-names>S</given-names></name></person-group><year>2009</year><article-title>Progression through the RNA polymerase II CTD cycle</article-title><source>Molecular Cell</source><volume>36</volume><fpage>541</fpage><lpage>546</lpage><pub-id pub-id-type="doi">10.1016/j.molcel.2009.10.019</pub-id></element-citation></ref><ref 
id="bib4"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Chapman</surname><given-names>RD</given-names></name><name><surname>Heidemann</surname><given-names>M</given-names></name><name><surname>Albert</surname><given-names>TK</given-names></name><name><surname>Mailhammer</surname><given-names>R</given-names></name><name><surname>Flatley</surname><given-names>A</given-names></name><name><surname>Meisterernst</surname><given-names>M</given-names></name><name><surname>Kremmer</surname><given-names>E</given-names></name><name><surname>Eick</surname><given-names>D</given-names></name></person-group><year>2007</year><article-title>Transcribing RNA polymerase II is phosphorylated at CTD residue serine-7</article-title><source>Science</source><volume>318</volume><fpage>1780</fpage><lpage>1782</lpage><pub-id pub-id-type="doi">10.1126/science.1145977</pub-id></element-citation></ref><ref id="bib3"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Chapman</surname><given-names>RD</given-names></name><name><surname>Palancade</surname><given-names>B</given-names></name><name><surname>Lang</surname><given-names>A</given-names></name><name><surname>Bensaude</surname><given-names>O</given-names></name><name><surname>Eick</surname><given-names>D</given-names></name></person-group><year>2004</year><article-title>The last CTD repeat of the mammalian RNA polymerase II large subunit is important for its stability</article-title><source>Nucleic Acids Research</source><volume>32</volume><fpage>35</fpage><lpage>44</lpage><pub-id pub-id-type="doi">10.1093/nar/gkh172</pub-id></element-citation></ref><ref id="bib6"><element-citation publication-type="journal"><person-group 
person-group-type="author"><name><surname>Core</surname><given-names>LJ</given-names></name><name><surname>Waterfall</surname><given-names>JJ</given-names></name><name><surname>Gilchrist</surname><given-names>DA</given-names></name><name><surname>Fargo</surname><given-names>DC</given-names></name><name><surname>Kwak</surname><given-names>H</given-names></name><name><surname>Adelman</surname><given-names>K</given-names></name><name><surname>Lis</surname><given-names>JT</given-names></name></person-group><year>2012</year><article-title>Defining the status of RNA polymerase at promoters</article-title><source>Cell Reports</source><volume>2</volume><fpage>1025</fpage><lpage>1035</lpage><pub-id pub-id-type="doi">10.1016/j.celrep.2012.08.034</pub-id></element-citation></ref><ref id="bib5"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Core</surname><given-names>LJ</given-names></name><name><surname>Waterfall</surname><given-names>JJ</given-names></name><name><surname>Lis</surname><given-names>JT</given-names></name></person-group><year>2008</year><article-title>Nascent RNA sequencing reveals widespread pausing and divergent initiation at human promoters</article-title><source>Science</source><volume>322</volume><fpage>1845</fpage><lpage>1848</lpage><pub-id pub-id-type="doi">10.1126/science.1162228</pub-id></element-citation></ref><ref id="bib7"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>de 
Almeida</surname><given-names>SF</given-names></name><name><surname>Grosso</surname><given-names>AR</given-names></name><name><surname>Koch</surname><given-names>F</given-names></name><name><surname>Fenouil</surname><given-names>R</given-names></name><name><surname>Carvalho</surname><given-names>S</given-names></name><name><surname>Andrade</surname><given-names>J</given-names></name><name><surname>Levezinho</surname><given-names>H</given-names></name><name><surname>Gut</surname><given-names>M</given-names></name><name><surname>Eick</surname><given-names>D</given-names></name><name><surname>Gut</surname><given-names>I</given-names></name><name><surname>Andrau</surname><given-names>JC</given-names></name><name><surname>Ferrier</surname><given-names>P</given-names></name><name><surname>Carmo-Fonseca</surname><given-names>M</given-names></name></person-group><year>2011</year><article-title>Splicing enhances recruitment of methyltransferase HYPB/Setd2 and methylation of histone H3 Lys36</article-title><source>Nature Structural &amp; Molecular Biology</source><volume>18</volume><fpage>977</fpage><lpage>983</lpage><pub-id pub-id-type="doi">10.1038/nsmb.2123</pub-id></element-citation></ref><ref id="bib8"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>De 
Santa</surname><given-names>F</given-names></name><name><surname>Barozzi</surname><given-names>I</given-names></name><name><surname>Mietton</surname><given-names>F</given-names></name><name><surname>Ghisletti</surname><given-names>S</given-names></name><name><surname>Polletti</surname><given-names>S</given-names></name><name><surname>Tusi</surname><given-names>BK</given-names></name><name><surname>Muller</surname><given-names>H</given-names></name><name><surname>Ragoussis</surname><given-names>J</given-names></name><name><surname>Wei</surname><given-names>CL</given-names></name><name><surname>Natoli</surname><given-names>G</given-names></name></person-group><year>2010</year><article-title>A large fraction of extragenic RNA pol II transcription sites overlap enhancers</article-title><source>PLOS Biology</source><volume>8</volume><fpage>e1000384</fpage><pub-id pub-id-type="doi">10.1371/journal.pbio.1000384</pub-id></element-citation></ref><ref id="bib9"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Egloff</surname><given-names>S</given-names></name><name><surname>O'Reilly</surname><given-names>D</given-names></name><name><surname>Chapman</surname><given-names>RD</given-names></name><name><surname>Taylor</surname><given-names>A</given-names></name><name><surname>Tanzhaus</surname><given-names>K</given-names></name><name><surname>Pitts</surname><given-names>L</given-names></name><name><surname>Eick</surname><given-names>D</given-names></name><name><surname>Murphy</surname><given-names>S</given-names></name></person-group><year>2007</year><article-title>Serine-7 of the RNA polymerase II CTD is specifically required for snRNA gene expression</article-title><source>Science</source><volume>318</volume><fpage>1777</fpage><lpage>1779</lpage><pub-id pub-id-type="doi">10.1126/science.1145989</pub-id></element-citation></ref><ref id="bib10"><element-citation publication-type="journal"><person-group 
person-group-type="author"><name><surname>Fenouil</surname><given-names>R</given-names></name><name><surname>Cauchy</surname><given-names>P</given-names></name><name><surname>Koch</surname><given-names>F</given-names></name><name><surname>Descostes</surname><given-names>N</given-names></name><name><surname>Cabeza</surname><given-names>JZ</given-names></name><name><surname>Innocenti</surname><given-names>C</given-names></name><name><surname>Ferrier</surname><given-names>P</given-names></name><name><surname>Spicuglia</surname><given-names>S</given-names></name><name><surname>Gut</surname><given-names>M</given-names></name><name><surname>Gut</surname><given-names>I</given-names></name><name><surname>Andrau</surname><given-names>JC</given-names></name></person-group><year>2012</year><article-title>CpG islands and GC content dictate nucleosome depletion in a transcription-independent manner at mammalian promoters</article-title><source>Genome Research</source><volume>22</volume><fpage>2399</fpage><lpage>2408</lpage><pub-id pub-id-type="doi">10.1101/gr.138776.112</pub-id></element-citation></ref><ref id="bib11"><element-citation publication-type="journal"><person-group 
person-group-type="author"><name><surname>Flicek</surname><given-names>P</given-names></name><name><surname>Ahmed</surname><given-names>I</given-names></name><name><surname>Amode</surname><given-names>MR</given-names></name><name><surname>Barrell</surname><given-names>D</given-names></name><name><surname>Beal</surname><given-names>K</given-names></name><name><surname>Brent</surname><given-names>S</given-names></name><name><surname>Carvalho-Silva</surname><given-names>D</given-names></name><name><surname>Clapham</surname><given-names>P</given-names></name><name><surname>Coates</surname><given-names>G</given-names></name><name><surname>Fairley</surname><given-names>S</given-names></name><name><surname>Fitzgerald</surname><given-names>S</given-names></name><name><surname>Gil</surname><given-names>L</given-names></name><name><surname>García-Girón</surname><given-names>C</given-names></name><name><surname>Gordon</surname><given-names>L</given-names></name><name><surname>Hourlier</surname><given-names>T</given-names></name><name><surname>Hunt</surname><given-names>S</given-names></name><name><surname>Juettemann</surname><given-names>T</given-names></name><name><surname>Kähäri</surname><given-names>AK</given-names></name><name><surname>Keenan</surname><given-names>S</given-names></name><name><surname>Komorowska</surname><given-names>M</given-names></name><name><surname>Kulesha</surname><given-names>E</given-names></name><name><surname>Longden</surname><given-names>I</given-names></name><name><surname>Maurel</surname><given-names>T</given-names></name><name><surname>McLaren</surname><given-names>WM</given-names></name><name><surname>Muffato</surname><given-names>M</given-names></name><name><surname>Nag</surname><given-names>R</given-names></name><name><surname>Overduin</surname><given-names>B</given-names></name><name><surname>Pignatelli</surname><given-names>M</given-names></name><name><surname>Pritchard</surname><given-names>B</given-names></name><name><surname>Pritchard<
/surname><given-names>E</given-names></name><name><surname>Riat</surname><given-names>HS</given-names></name><name><surname>Ritchie</surname><given-names>GR</given-names></name><name><surname>Ruffier</surname><given-names>M</given-names></name><name><surname>Schuster</surname><given-names>M</given-names></name><name><surname>Sheppard</surname><given-names>D</given-names></name><name><surname>Sobral</surname><given-names>D</given-names></name><name><surname>Taylor</surname><given-names>K</given-names></name><name><surname>Thormann</surname><given-names>A</given-names></name><name><surname>Trevanion</surname><given-names>S</given-names></name><name><surname>White</surname><given-names>S</given-names></name><name><surname>Wilder</surname><given-names>SP</given-names></name><name><surname>Aken</surname><given-names>BL</given-names></name><name><surname>Birney</surname><given-names>E</given-names></name><name><surname>Cunningham</surname><given-names>F</given-names></name><name><surname>Dunham</surname><given-names>I</given-names></name><name><surname>Harrow</surname><given-names>J</given-names></name><name><surname>Herrero</surname><given-names>J</given-names></name><name><surname>Hubbard</surname><given-names>TJ</given-names></name><name><surname>Johnson</surname><given-names>N</given-names></name><name><surname>Kinsella</surname><given-names>R</given-names></name><name><surname>Parker</surname><given-names>A</given-names></name><name><surname>Spudich</surname><given-names>G</given-names></name><name><surname>Yates</surname><given-names>A</given-names></name><name><surname>Zadissa</surname><given-names>A</given-names></name><name><surname>Searle</surname><given-names>SM</given-names></name></person-group><year>2013</year><article-title>Ensembl 2013</article-title><source>Nucleic Acids Research</source><volume>41</volume><fpage>D48</fpage><lpage>D55</lpage><pub-id pub-id-type="doi">10.1093/nar/gks1236</pub-id></element-citation></ref><ref id="bib12"><element-citation 
publication-type="journal"><person-group person-group-type="author"><name><surname>Guttman</surname><given-names>M</given-names></name><name><surname>Amit</surname><given-names>I</given-names></name><name><surname>Garber</surname><given-names>M</given-names></name><name><surname>French</surname><given-names>C</given-names></name><name><surname>Lin</surname><given-names>MF</given-names></name><name><surname>Feldser</surname><given-names>D</given-names></name><name><surname>Huarte</surname><given-names>M</given-names></name><name><surname>Zuk</surname><given-names>O</given-names></name><name><surname>Carey</surname><given-names>BW</given-names></name><name><surname>Cassady</surname><given-names>JP</given-names></name><name><surname>Cabili</surname><given-names>MN</given-names></name><name><surname>Jaenisch</surname><given-names>R</given-names></name><name><surname>Mikkelsen</surname><given-names>TS</given-names></name><name><surname>Jacks</surname><given-names>T</given-names></name><name><surname>Hacohen</surname><given-names>N</given-names></name><name><surname>Bernstein</surname><given-names>BE</given-names></name><name><surname>Kellis</surname><given-names>M</given-names></name><name><surname>Regev</surname><given-names>A</given-names></name><name><surname>Rinn</surname><given-names>JL</given-names></name><name><surname>Lander</surname><given-names>ES</given-names></name></person-group><year>2009</year><article-title>Chromatin signature reveals over a thousand highly conserved large non-coding RNAs in mammals</article-title><source>Nature</source><volume>458</volume><fpage>223</fpage><lpage>227</lpage><pub-id pub-id-type="doi">10.1038/nature07672</pub-id></element-citation></ref><ref id="bib13"><element-citation publication-type="journal"><person-group 
person-group-type="author"><name><surname>Heidemann</surname><given-names>M</given-names></name><name><surname>Hintermair</surname><given-names>C</given-names></name><name><surname>Voß</surname><given-names>K</given-names></name><name><surname>Eick</surname><given-names>D</given-names></name></person-group><year>2012</year><article-title>Dynamic phosphorylation patterns of RNA polymerase II CTD during transcription</article-title><source>Biochimica et Biophysica Acta</source><volume>1829</volume><fpage>55</fpage><lpage>62</lpage><pub-id pub-id-type="doi">10.1016/j.bbagrm.2012.08.013</pub-id></element-citation></ref><ref id="bib14"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Hintermair</surname><given-names>C</given-names></name><name><surname>Heidemann</surname><given-names>M</given-names></name><name><surname>Koch</surname><given-names>F</given-names></name><name><surname>Descostes</surname><given-names>N</given-names></name><name><surname>Gut</surname><given-names>M</given-names></name><name><surname>Gut</surname><given-names>I</given-names></name><name><surname>Fenouil</surname><given-names>R</given-names></name><name><surname>Ferrier</surname><given-names>P</given-names></name><name><surname>Flatley</surname><given-names>A</given-names></name><name><surname>Kremmer</surname><given-names>E</given-names></name><name><surname>Chapman</surname><given-names>RD</given-names></name><name><surname>Andrau</surname><given-names>JC</given-names></name><name><surname>Eick</surname><given-names>D</given-names></name></person-group><year>2012</year><article-title>Threonine-4 of mammalian RNA polymerase II CTD is targeted by Polo-like kinase 3 and required for transcriptional elongation</article-title><source>The EMBO Journal</source><volume>31</volume><fpage>2784</fpage><lpage>2797</lpage><pub-id pub-id-type="doi">10.1038/emboj.2012.123</pub-id></element-citation></ref><ref id="bib16"><element-citation 
publication-type="journal"><person-group person-group-type="author"><name><surname>Hsin</surname><given-names>JP</given-names></name><name><surname>Li</surname><given-names>W</given-names></name><name><surname>Hoque</surname><given-names>M</given-names></name><name><surname>Tian</surname><given-names>B</given-names></name><name><surname>Manley</surname><given-names>JL</given-names></name></person-group><year>2014</year><article-title>RNAP II CTD tyrosine 1 performs multiple functions in vertebrate cells</article-title><source>eLife</source><volume>3</volume><fpage>e02112</fpage><pub-id pub-id-type="doi">10.7554/eLife.02112</pub-id></element-citation></ref><ref id="bib15"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Hsin</surname><given-names>JP</given-names></name><name><surname>Sheth</surname><given-names>A</given-names></name><name><surname>Manley</surname><given-names>JL</given-names></name></person-group><year>2011</year><article-title>RNAP II CTD phosphorylated on threonine-4 is required for histone mRNA 3' end processing</article-title><source>Science</source><volume>334</volume><fpage>683</fpage><lpage>686</lpage><pub-id pub-id-type="doi">10.1126/science.1206034</pub-id></element-citation></ref><ref id="bib17"><element-citation publication-type="journal"><person-group 
person-group-type="author"><name><surname>Kim</surname><given-names>TK</given-names></name><name><surname>Hemberg</surname><given-names>M</given-names></name><name><surname>Gray</surname><given-names>JM</given-names></name><name><surname>Costa</surname><given-names>AM</given-names></name><name><surname>Bear</surname><given-names>DM</given-names></name><name><surname>Wu</surname><given-names>J</given-names></name><name><surname>Harmin</surname><given-names>DA</given-names></name><name><surname>Laptewicz</surname><given-names>M</given-names></name><name><surname>Barbara-Haley</surname><given-names>K</given-names></name><name><surname>Kuersten</surname><given-names>S</given-names></name><name><surname>Markenscoff-Papadimitriou</surname><given-names>E</given-names></name><name><surname>Kuhl</surname><given-names>D</given-names></name><name><surname>Bito</surname><given-names>H</given-names></name><name><surname>Worley</surname><given-names>PF</given-names></name><name><surname>Kreiman</surname><given-names>G</given-names></name><name><surname>Greenberg</surname><given-names>ME</given-names></name></person-group><year>2010</year><article-title>Widespread transcription at neuronal activity-regulated enhancers</article-title><source>Nature</source><volume>465</volume><fpage>182</fpage><lpage>187</lpage><pub-id pub-id-type="doi">10.1038/nature09033</pub-id></element-citation></ref><ref id="bib18"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Koch</surname><given-names>F</given-names></name><name><surname>Fenouil</surname><given-names>R</given-names></name><name><surname>Gut</surname><given-names>M</given-names></name><name><surname>Cauchy</surname><given-names>P</given-names></name><name><surname>Albert</surname><given-names>TK</given-names></name><name><surname>Zacarias-Cabeza</surname><given-names>J</given-names></name><name><surname>Spicuglia</surname><given-names>S</given-names></name><name><surname>de la 
Chapelle</surname><given-names>AL</given-names></name><name><surname>Heidemann</surname><given-names>M</given-names></name><name><surname>Hintermair</surname><given-names>C</given-names></name><name><surname>Eick</surname><given-names>D</given-names></name><name><surname>Gut</surname><given-names>I</given-names></name><name><surname>Ferrier</surname><given-names>P</given-names></name><name><surname>Andrau</surname><given-names>JC</given-names></name></person-group><year>2011</year><article-title>Transcription initiation platforms and GTF recruitment at tissue-specific enhancers and promoters</article-title><source>Nature Structural &amp; Molecular Biology</source><volume>18</volume><fpage>956</fpage><lpage>963</lpage><pub-id pub-id-type="doi">10.1038/nsmb.2085</pub-id></element-citation></ref><ref id="bib19"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Langmead</surname><given-names>B</given-names></name><name><surname>Trapnell</surname><given-names>C</given-names></name><name><surname>Pop</surname><given-names>M</given-names></name><name><surname>Salzberg</surname><given-names>SL</given-names></name></person-group><year>2009</year><article-title>Ultrafast and memory-efficient alignment of short DNA sequences to the human genome</article-title><source>Genome Biology</source><volume>10</volume><fpage>R25</fpage><pub-id pub-id-type="doi">10.1186/gb-2009-10-3-r25</pub-id></element-citation></ref><ref id="bib20"><element-citation publication-type="journal"><person-group 
person-group-type="author"><name><surname>Li</surname><given-names>G</given-names></name><name><surname>Ruan</surname><given-names>X</given-names></name><name><surname>Auerbach</surname><given-names>RK</given-names></name><name><surname>Sandhu</surname><given-names>KS</given-names></name><name><surname>Zheng</surname><given-names>M</given-names></name><name><surname>Wang</surname><given-names>P</given-names></name><name><surname>Poh</surname><given-names>HM</given-names></name><name><surname>Goh</surname><given-names>Y</given-names></name><name><surname>Lim</surname><given-names>J</given-names></name><name><surname>Zhang</surname><given-names>J</given-names></name><name><surname>Sim</surname><given-names>HS</given-names></name><name><surname>Peh</surname><given-names>SQ</given-names></name><name><surname>Mulawadi</surname><given-names>FH</given-names></name><name><surname>Ong</surname><given-names>CT</given-names></name><name><surname>Orlov</surname><given-names>YL</given-names></name><name><surname>Hong</surname><given-names>S</given-names></name><name><surname>Zhang</surname><given-names>Z</given-names></name><name><surname>Landt</surname><given-names>S</given-names></name><name><surname>Raha</surname><given-names>D</given-names></name><name><surname>Euskirchen</surname><given-names>G</given-names></name><name><surname>Wei</surname><given-names>CL</given-names></name><name><surname>Ge</surname><given-names>W</given-names></name><name><surname>Wang</surname><given-names>H</given-names></name><name><surname>Davis</surname><given-names>C</given-names></name><name><surname>Fisher-Aylor</surname><given-names>KI</given-names></name><name><surname>Mortazavi</surname><given-names>A</given-names></name><name><surname>Gerstein</surname><given-names>M</given-names></name><name><surname>Gingeras</surname><given-names>T</given-names></name><name><surname>Wold</surname><given-names>B</given-names></name><name><surname>Sun</surname><given-names>Y</given-names></name><name><surna
me>Fullwood</surname><given-names>MJ</given-names></name><name><surname>Cheung</surname><given-names>E</given-names></name><name><surname>Liu</surname><given-names>E</given-names></name><name><surname>Sung</surname><given-names>WK</given-names></name><name><surname>Snyder</surname><given-names>M</given-names></name><name><surname>Ruan</surname><given-names>Y</given-names></name></person-group><year>2012</year><article-title>Extensive promoter-centered chromatin interactions provide a topological basis for transcription regulation</article-title><source>Cell</source><volume>148</volume><fpage>84</fpage><lpage>98</lpage><pub-id pub-id-type="doi">10.1016/j.cell.2011.12.014</pub-id></element-citation></ref><ref id="bib21"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Mayer</surname><given-names>A</given-names></name><name><surname>Heidemann</surname><given-names>M</given-names></name><name><surname>Lidschreiber</surname><given-names>M</given-names></name><name><surname>Schreieck</surname><given-names>A</given-names></name><name><surname>Sun</surname><given-names>M</given-names></name><name><surname>Hintermair</surname><given-names>C</given-names></name><name><surname>Kremmer</surname><given-names>E</given-names></name><name><surname>Eick</surname><given-names>D</given-names></name><name><surname>Cramer</surname><given-names>P</given-names></name></person-group><year>2012</year><article-title>CTD tyrosine phosphorylation impairs termination factor recruitment to RNA polymerase II</article-title><source>Science</source><volume>336</volume><fpage>1723</fpage><lpage>1725</lpage><pub-id pub-id-type="doi">10.1126/science.1219651</pub-id></element-citation></ref><ref id="bib22"><element-citation publication-type="journal"><person-group 
person-group-type="author"><name><surname>Natoli</surname><given-names>G</given-names></name><name><surname>Andrau</surname><given-names>JC</given-names></name></person-group><year>2012</year><article-title>Noncoding transcription at enhancers: general principles and functional models</article-title><source>Annual Review of Genetics</source><volume>46</volume><fpage>1</fpage><lpage>19</lpage><pub-id pub-id-type="doi">10.1146/annurev-genet-110711-155459</pub-id></element-citation></ref><ref id="bib23"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Pekowska</surname><given-names>A</given-names></name><name><surname>Benoukraf</surname><given-names>T</given-names></name><name><surname>Zacarias-Cabeza</surname><given-names>J</given-names></name><name><surname>Belhocine</surname><given-names>M</given-names></name><name><surname>Koch</surname><given-names>F</given-names></name><name><surname>Holota</surname><given-names>H</given-names></name><name><surname>Imbert</surname><given-names>J</given-names></name><name><surname>Andrau</surname><given-names>JC</given-names></name><name><surname>Ferrier</surname><given-names>P</given-names></name><name><surname>Spicuglia</surname><given-names>S</given-names></name></person-group><year>2011</year><article-title>H3K4 tri-methylation provides an epigenetic signature of active enhancers</article-title><source>The EMBO Journal</source><volume>30</volume><fpage>4198</fpage><lpage>4210</lpage><pub-id pub-id-type="doi">10.1038/emboj.2011.295</pub-id></element-citation></ref><ref id="bib24"><element-citation publication-type="journal"><person-group 
person-group-type="author"><name><surname>Preker</surname><given-names>P</given-names></name><name><surname>Nielsen</surname><given-names>J</given-names></name><name><surname>Kammler</surname><given-names>S</given-names></name><name><surname>Lykke-Andersen</surname><given-names>S</given-names></name><name><surname>Christensen</surname><given-names>MS</given-names></name><name><surname>Mapendano</surname><given-names>CK</given-names></name><name><surname>Schierup</surname><given-names>MH</given-names></name><name><surname>Jensen</surname><given-names>TH</given-names></name></person-group><year>2008</year><article-title>RNA exosome depletion reveals transcription upstream of active human promoters</article-title><source>Science</source><volume>322</volume><fpage>1851</fpage><lpage>1854</lpage><pub-id pub-id-type="doi">10.1126/science.1164096</pub-id></element-citation></ref><ref id="bib25"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Saldanha</surname><given-names>AJ</given-names></name></person-group><year>2004</year><article-title>Java Treeview–extensible visualization of microarray data</article-title><source>Bioinformatics</source><volume>20</volume><fpage>3246</fpage><lpage>3248</lpage><pub-id pub-id-type="doi">10.1093/bioinformatics/bth349</pub-id></element-citation></ref><ref id="bib26"><element-citation publication-type="journal"><person-group 
person-group-type="author"><name><surname>Seila</surname><given-names>AC</given-names></name><name><surname>Calabrese</surname><given-names>JM</given-names></name><name><surname>Levine</surname><given-names>SS</given-names></name><name><surname>Yeo</surname><given-names>GW</given-names></name><name><surname>Rahl</surname><given-names>PB</given-names></name><name><surname>Flynn</surname><given-names>RA</given-names></name><name><surname>Young</surname><given-names>RA</given-names></name><name><surname>Sharp</surname><given-names>PA</given-names></name></person-group><year>2008</year><article-title>Divergent transcription from active promoters</article-title><source>Science</source><volume>322</volume><fpage>1849</fpage><lpage>1851</lpage><pub-id pub-id-type="doi">10.1126/science.1162253</pub-id></element-citation></ref><ref id="bib27"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Su</surname><given-names>AI</given-names></name><name><surname>Wiltshire</surname><given-names>T</given-names></name><name><surname>Batalov</surname><given-names>S</given-names></name><name><surname>Lapp</surname><given-names>H</given-names></name><name><surname>Ching</surname><given-names>KA</given-names></name><name><surname>Block</surname><given-names>D</given-names></name><name><surname>Zhang</surname><given-names>J</given-names></name><name><surname>Soden</surname><given-names>R</given-names></name><name><surname>Hayakawa</surname><given-names>M</given-names></name><name><surname>Kreiman</surname><given-names>G</given-names></name><name><surname>Cooke</surname><given-names>MP</given-names></name><name><surname>Walker</surname><given-names>JR</given-names></name><name><surname>Hogenesch</surname><given-names>JB</given-names></name></person-group><year>2004</year><article-title>A gene atlas of the mouse and human protein-encoding transcriptomes</article-title><source>Proceedings of the National Academy of Sciences of the United 
States of America</source><volume>101</volume><fpage>6062</fpage><lpage>6067</lpage><pub-id pub-id-type="doi">10.1073/pnas.0400782101</pub-id></element-citation></ref><ref id="bib28"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Turatsinze</surname><given-names>JV</given-names></name><name><surname>Thomas-Chollier</surname><given-names>M</given-names></name><name><surname>Defrance</surname><given-names>M</given-names></name><name><surname>van Helden</surname><given-names>J</given-names></name></person-group><year>2008</year><article-title>Using RSAT to scan genome sequences for transcription factor binding sites and cis-regulatory modules</article-title><source>Nature Protocols</source><volume>3</volume><fpage>1578</fpage><lpage>1588</lpage><pub-id pub-id-type="doi">10.1038/nprot.2008.97</pub-id></element-citation></ref><ref id="bib29"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Zhu</surname><given-names>LJ</given-names></name><name><surname>Gazin</surname><given-names>C</given-names></name><name><surname>Lawson</surname><given-names>ND</given-names></name><name><surname>Pagès</surname><given-names>H</given-names></name><name><surname>Lin</surname><given-names>SM</given-names></name><name><surname>Lapointe</surname><given-names>DS</given-names></name><name><surname>Green</surname><given-names>MR</given-names></name></person-group><year>2010</year><article-title>ChIPpeakAnno: a Bioconductor package to annotate ChIP-seq and ChIP-chip data</article-title><source>BMC Bioinformatics</source><volume>11</volume><fpage>237</fpage><pub-id pub-id-type="doi">10.1186/1471-2105-11-237</pub-id></element-citation></ref></ref-list></back></article>