Permalink
Cannot retrieve contributors at this time
Fetching contributors…
| <?xml version="1.0" encoding="UTF-8"?><!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Archiving and Interchange DTD v1.1d1 20130915//EN" "JATS-archivearticle1.dtd"><article article-type="research-article" dtd-version="1.1d1" xmlns:xlink="http://www.w3.org/1999/xlink"><front><journal-meta><journal-id journal-id-type="nlm-ta">elife</journal-id><journal-id journal-id-type="hwp">eLife</journal-id><journal-id journal-id-type="publisher-id">eLife</journal-id><journal-title-group><journal-title>eLife</journal-title></journal-title-group><issn publication-format="electronic">2050-084X</issn><publisher><publisher-name>eLife Sciences Publications, Ltd</publisher-name></publisher></journal-meta><article-meta><article-id pub-id-type="publisher-id">00569</article-id><article-id pub-id-type="doi">10.7554/eLife.00569</article-id><article-categories><subj-group subj-group-type="display-channel"><subject>Research article</subject></subj-group><subj-group subj-group-type="heading"><subject>Developmental biology and stem cells</subject></subj-group><subj-group subj-group-type="heading"><subject>Genomics and evolutionary biology</subject></subj-group></article-categories><title-group><article-title>The genome sequence of the colonial chordate, <italic>Botryllus schlosseri</italic></article-title></title-group><contrib-group><contrib contrib-type="author" corresp="yes" id="author-3790"><name><surname>Voskoboynik</surname><given-names>Ayelet</given-names></name><xref ref-type="aff" rid="aff1"/><xref ref-type="aff" rid="aff2"/><xref ref-type="corresp" rid="cor1">*</xref><xref ref-type="other" rid="par-1"/><xref ref-type="other" rid="par-2"/><xref ref-type="other" rid="par-3"/><xref ref-type="fn" rid="con1"/><xref ref-type="fn" rid="conf1"/><xref ref-type="other" rid="dataro1"/><xref ref-type="other" rid="dataro2"/><xref ref-type="other" rid="dataro3"/></contrib><contrib contrib-type="author" equal-contrib="yes" id="author-3870"><name><surname>Neff</surname><given-names>Norma F</given-names></name><xref ref-type="aff" rid="aff3"/><xref ref-type="fn" rid="equal-contrib">†</xref><xref ref-type="fn" rid="con2"/><xref ref-type="fn" rid="conf2"/><xref ref-type="other" rid="dataro1"/><xref ref-type="other" rid="dataro2"/><xref ref-type="other" rid="dataro3"/></contrib><contrib contrib-type="author" equal-contrib="yes" id="author-3871"><name><surname>Sahoo</surname><given-names>Debashis</given-names></name><xref ref-type="aff" rid="aff1"/><xref ref-type="fn" rid="equal-contrib">†</xref><xref ref-type="other" rid="par-5"/><xref ref-type="other" rid="par-6"/><xref ref-type="other" rid="par-7"/><xref ref-type="fn" rid="con3"/><xref ref-type="fn" rid="conf2"/><xref ref-type="other" rid="dataro1"/><xref ref-type="other" rid="dataro2"/><xref ref-type="other" rid="dataro3"/></contrib><contrib contrib-type="author" equal-contrib="yes" id="author-3872"><name><surname>Newman</surname><given-names>Aaron M</given-names></name><xref ref-type="aff" rid="aff1"/><xref ref-type="fn" rid="equal-contrib">†</xref><xref ref-type="other" rid="par-6"/><xref ref-type="fn" rid="con4"/><xref ref-type="fn" rid="conf2"/><xref ref-type="other" rid="dataro1"/><xref ref-type="other" rid="dataro2"/><xref ref-type="other" rid="dataro3"/></contrib><contrib contrib-type="author" equal-contrib="yes" id="author-3873"><name><surname>Pushkarev</surname><given-names>Dmitry</given-names></name><xref ref-type="aff" rid="aff3"/><xref ref-type="fn" rid="equal-contrib">†</xref><xref ref-type="fn" rid="con5"/><xref ref-type="fn" rid="conf1"/><xref ref-type="other" rid="dataro1"/><xref ref-type="other" rid="dataro2"/><xref ref-type="other" rid="dataro3"/></contrib><contrib contrib-type="author" equal-contrib="yes" id="author-3874"><name><surname>Koh</surname><given-names>Winston</given-names></name><xref ref-type="aff" rid="aff3"/><xref ref-type="fn" rid="equal-contrib">†</xref><xref ref-type="fn" rid="con6"/><xref ref-type="fn" rid="conf2"/><xref ref-type="other" rid="dataro1"/><xref ref-type="other" rid="dataro2"/><xref ref-type="other" rid="dataro3"/></contrib><contrib contrib-type="author" id="author-3875"><name><surname>Passarelli</surname><given-names>Benedetto</given-names></name><xref ref-type="aff" rid="aff3"/><xref ref-type="fn" rid="con7"/><xref ref-type="fn" rid="conf2"/><xref ref-type="other" rid="dataro1"/><xref ref-type="other" rid="dataro2"/><xref ref-type="other" rid="dataro3"/></contrib><contrib contrib-type="author" id="author-3876"><name><surname>Fan</surname><given-names>H Christina</given-names></name><xref ref-type="aff" rid="aff3"/><xref ref-type="fn" rid="con8"/><xref ref-type="fn" rid="conf2"/><xref ref-type="other" rid="dataro1"/><xref ref-type="other" rid="dataro2"/><xref ref-type="other" rid="dataro3"/></contrib><contrib contrib-type="author" id="author-3877"><name><surname>Mantalas</surname><given-names>Gary L</given-names></name><xref ref-type="aff" rid="aff3"/><xref ref-type="fn" rid="con9"/><xref ref-type="fn" rid="conf2"/><xref ref-type="other" rid="dataro1"/><xref ref-type="other" rid="dataro2"/><xref ref-type="other" rid="dataro3"/></contrib><contrib contrib-type="author" id="author-3878"><name><surname>Palmeri</surname><given-names>Karla J</given-names></name><xref ref-type="aff" rid="aff1"/><xref ref-type="aff" rid="aff2"/><xref ref-type="fn" rid="con10"/><xref ref-type="fn" rid="conf2"/><xref ref-type="other" rid="dataro1"/><xref ref-type="other" rid="dataro2"/><xref ref-type="other" rid="dataro3"/></contrib><contrib contrib-type="author" id="author-3879"><name><surname>Ishizuka</surname><given-names>Katherine J</given-names></name><xref ref-type="aff" rid="aff1"/><xref ref-type="aff" rid="aff2"/><xref ref-type="fn" rid="con11"/><xref ref-type="fn" rid="conf2"/><xref ref-type="other" rid="dataro1"/><xref ref-type="other" rid="dataro2"/><xref ref-type="other" rid="dataro3"/></contrib><contrib contrib-type="author" id="author-3880"><name><surname>Gissi</surname><given-names>Carmela</given-names></name><xref ref-type="aff" rid="aff4"/><xref ref-type="other" rid="par-4"/><xref ref-type="fn" rid="con12"/><xref ref-type="fn" rid="conf2"/><xref ref-type="other" rid="dataro1"/><xref ref-type="other" rid="dataro2"/><xref ref-type="other" rid="dataro3"/></contrib><contrib contrib-type="author" id="author-3881"><name><surname>Griggio</surname><given-names>Francesca</given-names></name><xref ref-type="aff" rid="aff4"/><xref ref-type="fn" rid="con13"/><xref ref-type="fn" rid="conf2"/><xref ref-type="other" rid="dataro1"/><xref ref-type="other" rid="dataro2"/><xref ref-type="other" rid="dataro3"/></contrib><contrib contrib-type="author" id="author-3882"><name><surname>Ben-Shlomo</surname><given-names>Rachel</given-names></name><xref ref-type="aff" rid="aff5"/><xref ref-type="fn" rid="con14"/><xref ref-type="fn" rid="conf2"/><xref ref-type="other" rid="dataro1"/><xref ref-type="other" rid="dataro2"/><xref ref-type="other" rid="dataro3"/></contrib><contrib contrib-type="author" id="author-3864"><name><surname>Corey</surname><given-names>Daniel M</given-names></name><xref ref-type="aff" rid="aff1"/><xref ref-type="fn" rid="con15"/><xref ref-type="fn" rid="conf2"/><xref ref-type="other" rid="dataro1"/><xref ref-type="other" rid="dataro2"/><xref ref-type="other" rid="dataro3"/></contrib><contrib contrib-type="author" id="author-3883"><name><surname>Penland</surname><given-names>Lolita</given-names></name><xref ref-type="aff" rid="aff3"/><xref ref-type="fn" rid="con16"/><xref ref-type="fn" rid="conf2"/><xref ref-type="other" rid="dataro1"/><xref ref-type="other" rid="dataro2"/><xref ref-type="other" rid="dataro3"/></contrib><contrib contrib-type="author" id="author-3884"><name><surname>White</surname><given-names>Richard A</given-names><suffix>III</suffix></name><xref ref-type="aff" rid="aff3"/><xref ref-type="fn" rid="con17"/><xref ref-type="fn" rid="conf2"/><xref ref-type="other" rid="dataro1"/><xref ref-type="other" rid="dataro2"/><xref ref-type="other" rid="dataro3"/></contrib><contrib contrib-type="author" corresp="yes" id="author-3885"><name><surname>Weissman</surname><given-names>Irving L</given-names></name><xref ref-type="aff" rid="aff1"/><xref ref-type="aff" rid="aff2"/><xref ref-type="aff" rid="aff6"/><xref ref-type="corresp" rid="cor2">*</xref><xref ref-type="other" rid="par-1"/><xref ref-type="other" rid="par-2"/><xref ref-type="other" rid="par-3"/><xref ref-type="other" rid="par-8"/><xref ref-type="fn" rid="con18"/><xref ref-type="fn" rid="conf2"/><xref ref-type="other" rid="dataro1"/><xref ref-type="other" rid="dataro2"/><xref ref-type="other" rid="dataro3"/></contrib><contrib contrib-type="author" corresp="yes" id="author-3886"><name><surname>Quake</surname><given-names>Stephen R</given-names></name><xref ref-type="aff" rid="aff3"/><xref ref-type="corresp" rid="cor3">*</xref><xref ref-type="other" rid="par-1"/><xref ref-type="other" rid="par-2"/><xref ref-type="other" rid="par-3"/><xref ref-type="fn" rid="con19"/><xref ref-type="fn" rid="conf1"/><xref ref-type="other" rid="dataro1"/><xref ref-type="other" rid="dataro2"/><xref ref-type="other" rid="dataro3"/></contrib><aff id="aff1"><institution content-type="dept">Department of Pathology</institution>, <institution>Institute for Stem Cell Biology and Regenerative Medicine, Stanford University</institution>, <addr-line><named-content content-type="city">Stanford</named-content></addr-line>, <country>United States</country></aff><aff id="aff2"><institution content-type="dept">Hopkins Marine Station</institution>, <institution>Stanford University</institution>, <addr-line><named-content content-type="city">Pacific Grove</named-content></addr-line>, <country>United States</country></aff><aff id="aff3"><institution content-type="dept">Departments of Applied Physics and Bioengineering</institution>, <institution>Howard Hughes Medical Institute, Stanford University</institution>, <addr-line><named-content content-type="city">Stanford</named-content></addr-line>, <country>United States</country></aff><aff id="aff4"><institution content-type="dept">Dipartimento di Bioscienze</institution>, <institution>Università degli Studi di Milano</institution>, <addr-line><named-content content-type="city">Milano</named-content></addr-line>, <country>Italy</country></aff><aff id="aff5"><institution content-type="dept">Department of Biology</institution>, <institution>University of Haifa-Oranim</institution>, <addr-line><named-content content-type="city">Tivon</named-content></addr-line>, <country>Israel</country></aff><aff id="aff6"><institution content-type="dept">Ludwig Center for Cancer Stem Cell Research and Medicine</institution>, <institution>Stanford University School of Medicine</institution>, <addr-line><named-content content-type="city">Stanford</named-content></addr-line>, <country>United States</country></aff></contrib-group><contrib-group content-type="section"><contrib contrib-type="editor"><name><surname>Bronner</surname><given-names>Marianne E</given-names></name><role>Reviewing editor</role><aff><institution>California Institute of Technology</institution>, <country>United States</country></aff></contrib></contrib-group><author-notes><corresp id="cor1"><label>*</label>For correspondence: <email>ayeletv@stanford.edu</email> (AV);</corresp><corresp id="cor2"><label>*</label>For correspondence: <email>irv@stanford.edu</email> (ILW);</corresp><corresp id="cor3"><label>*</label>For correspondence: <email>quake@stanford.edu</email> (SRQ)</corresp><fn fn-type="con" id="equal-contrib"><label>†</label><p>These authors contributed equally to this work</p></fn></author-notes><pub-date date-type="pub" publication-format="electronic"><day>02</day><month>07</month><year>2013</year></pub-date><pub-date pub-type="collection"><year>2013</year></pub-date><volume>2</volume><elocation-id>e00569</elocation-id><history><date date-type="received"><day>22</day><month>01</month><year>2013</year></date><date date-type="accepted"><day>28</day><month>05</month><year>2013</year></date></history><permissions><copyright-statement>© 2013, Voskoboynik et al</copyright-statement><copyright-year>2013</copyright-year><copyright-holder>Voskoboynik et al</copyright-holder><license xlink:href="http://creativecommons.org/licenses/by/3.0/"><license-p>This article is distributed under the terms of the <ext-link ext-link-type="uri" xlink:href="http://creativecommons.org/licenses/by/3.0/">Creative Commons Attribution License</ext-link>, which permits unrestricted use and redistribution provided that the original author and source are credited.</license-p></license></permissions><self-uri content-type="pdf" xlink:href="elife00569.pdf"/><abstract><object-id pub-id-type="doi">10.7554/eLife.00569.001</object-id><p><italic>Botryllus schlosseri</italic> is a colonial urochordate that follows the chordate plan of development following sexual reproduction, but invokes a stem cell-mediated budding program during subsequent rounds of asexual reproduction. As urochordates are considered to be the closest living invertebrate relatives of vertebrates, they are ideal subjects for whole genome sequence analyses. Using a novel method for high-throughput sequencing of eukaryotic genomes, we sequenced and assembled 580 Mbp of the <italic>B. schlosseri</italic> genome. The genome assembly is comprised of nearly 14,000 intron-containing predicted genes, and 13,500 intron-less predicted genes, 40% of which could be confidently parceled into 13 (of 16 haploid) chromosomes. A comparison of homologous genes between <italic>B. schlosseri</italic> and other diverse taxonomic groups revealed genomic events underlying the evolution of vertebrates and lymphoid-mediated immunity. The <italic>B. schlosseri</italic> genome is a community resource for studying alternative modes of reproduction, natural transplantation reactions, and stem cell-mediated regeneration.</p><p><bold>DOI:</bold> <ext-link ext-link-type="doi" xlink:href="10.7554/eLife.00569.001">http://dx.doi.org/10.7554/eLife.00569.001</ext-link></p></abstract><abstract abstract-type="executive-summary"><object-id pub-id-type="doi">10.7554/eLife.00569.002</object-id><title>eLife Digest</title><p>The tunicates are an evolutionary group that includes species such as sea squirts and sea tulips. Their name comes from the structure known as a ‘tunic’ that surrounds their sac-like bodies. As marine filter feeders, tunicates obtain nutrients by straining food particles from water, and they can live either alone or in colonies depending on the species. Charles Darwin suggested that tunicates may be the key to understanding the evolution of vertebrates, and indeed today they are regarded as the closest living relatives of this group.</p><p>Colonial tunicates can reproduce either sexually, or asexually by budding. Compatible colonies have the ability to recognize one another and to fuse their blood vessels to form a single organism, whereas incompatible colonies reject one another and remain separate. This recognition process bears some resemblance to the rejection of foreign organ transplants in mammals.</p><p>Here, Voskoboynik and co-workers present the first genome sequence of a colonial tunicate, <italic>Botryllus schlosseri.</italic> They used a novel sequencing approach that significantly increased the length of a DNA molecule that can be determined by next-generation sequencing, and allowed large DNA repeat regions to be easily resolved. In total, they sequenced 580 million base pairs of DNA, which they estimate contains roughly 27,000 genes.</p><p>By comparing the <italic>B. schlosseri</italic> genome with those of a number of vertebrates, Voskoboynik et al. identified multiple <italic>B. schlosseri</italic> genes that also participate in the development and functioning of the vertebrate eye, heart, and auditory system, as well as others that may have contributed to the evolution of the immune system and of blood cells. The genome of <italic>B. schlosseri</italic> thus provides an important new tool for studying the genetic basis of the evolution of vertebrates.</p><p><bold>DOI:</bold> <ext-link ext-link-type="doi" xlink:href="10.7554/eLife.00569.002">http://dx.doi.org/10.7554/eLife.00569.002</ext-link></p></abstract><kwd-group kwd-group-type="author-keywords"><title>Author keywords</title><kwd>Botryllus schlosseri</kwd><kwd>tunicates</kwd><kwd>stem cell</kwd><kwd>hematopoiesis</kwd><kwd>vertebrate evolution</kwd><kwd>genome</kwd></kwd-group><kwd-group kwd-group-type="research-organism"><title>Research organism</title><kwd>Other</kwd></kwd-group><funding-group><award-group id="par-1"><funding-source><institution-wrap><institution>National Institutes of Health</institution></institution-wrap></funding-source><award-id>1R56AI089968-01</award-id><principal-award-recipient><name><surname>Voskoboynik</surname><given-names>Ayelet</given-names></name><name><surname>Weissman</surname><given-names>Irving L</given-names></name><name><surname>Quake</surname><given-names>Stephen R</given-names></name></principal-award-recipient></award-group><award-group id="par-2"><funding-source><institution-wrap><institution>National Institutes of Health</institution></institution-wrap></funding-source><award-id>RO1GM100315-01</award-id><principal-award-recipient><name><surname>Voskoboynik</surname><given-names>Ayelet</given-names></name><name><surname>Weissman</surname><given-names>Irving L</given-names></name><name><surname>Quake</surname><given-names>Stephen R</given-names></name></principal-award-recipient></award-group><award-group id="par-3"><funding-source><institution-wrap><institution>National Institutes of Health</institution></institution-wrap></funding-source><award-id>1R01AG037968-01</award-id><principal-award-recipient><name><surname>Voskoboynik</surname><given-names>Ayelet</given-names></name><name><surname>Weissman</surname><given-names>Irving L</given-names></name><name><surname>Quake</surname><given-names>Stephen R</given-names></name></principal-award-recipient></award-group><award-group id="par-4"><funding-source><institution-wrap><institution>PRIN</institution></institution-wrap></funding-source><award-id>PRIN2009</award-id><principal-award-recipient><name><surname>Gissi</surname><given-names>Carmela</given-names></name></principal-award-recipient></award-group><award-group id="par-5"><funding-source><institution-wrap><institution>National Institutes of Health</institution></institution-wrap></funding-source><award-id>K99CA151673-01A1</award-id><principal-award-recipient><name><surname>Sahoo</surname><given-names>Debashis</given-names></name></principal-award-recipient></award-group><award-group id="par-6"><funding-source><institution-wrap><institution>Siebel Foundation</institution></institution-wrap></funding-source><award-id>Siebel Stem Cell Institute and the Thomas and Stacey Siebel Foundation</award-id><principal-award-recipient><name><surname>Sahoo</surname><given-names>Debashis</given-names></name><name><surname>Newman</surname><given-names>Aaron M</given-names></name></principal-award-recipient></award-group><award-group id="par-7"><funding-source><institution-wrap><institution>Department of Defense Grant</institution></institution-wrap></funding-source><award-id>W81XWH-10-1-0500</award-id><principal-award-recipient><name><surname>Sahoo</surname><given-names>Debashis</given-names></name></principal-award-recipient></award-group><award-group id="par-8"><funding-source><institution-wrap><institution>The Virginia and D K Ludwig Fund for Cancer Research</institution></institution-wrap></funding-source><principal-award-recipient><name><surname>Weissman</surname><given-names>Irving L</given-names></name></principal-award-recipient></award-group><funding-statement>The funders had no role in study design, data collection and interpretation, or the decision to submit the work for publication.</funding-statement></funding-group><custom-meta-group><custom-meta><meta-name>elife-xml-version</meta-name><meta-value>2</meta-value></custom-meta><custom-meta specific-use="meta-only"><meta-name>Author impact statement</meta-name><meta-value>The <italic>Botryllus schlosseri</italic> genome yields insights into the evolution of hematopoiesis.</meta-value></custom-meta></custom-meta-group></article-meta></front><body><sec id="s1" sec-type="intro"><title>Introduction</title><p>In 1866, Russian embryologist Alexander Kowalevsky wrote to Charles Darwin about the extensive developmental and morphological similarities between ascidian larvae and vertebrates, leading Darwin to hypothesize that ascidians (belonging to urochordates or tunicates) might be crucial to understanding the origin of the vertebrate phylum (<xref ref-type="bibr" rid="bib15">Darwin, 1874</xref>). Indeed, tunicates are the closest extant relatives of vertebrates (<xref ref-type="bibr" rid="bib19">Delsuc et al., 2006</xref>), and represent an investigative model for evolutionary events leading to adaptive immunity (<xref ref-type="bibr" rid="bib66">Sabbadin, 1962</xref>; <xref ref-type="bibr" rid="bib70">Scofield et al., 1982</xref>) and vertebrate-specific organ/tissue complexity (<xref ref-type="bibr" rid="bib18">Dehal et al., 2002</xref>; <xref ref-type="bibr" rid="bib34">Jeffery et al., 2004</xref>; <xref ref-type="bibr" rid="bib2">Abitua et al., 2012</xref>). The colonial tunicate species, <italic>Botryllus schlosseri</italic>, represents an important model organism for studying unique aspects of a pre-vertebrate colonial lifestyle, such as self recognition (<xref ref-type="bibr" rid="bib66">Sabbadin, 1962</xref>; <xref ref-type="bibr" rid="bib70">Scofield et al., 1982</xref>), vasculature and blood development (<xref ref-type="bibr" rid="bib69">Schlumpberger et al., 1984</xref>; <xref ref-type="bibr" rid="bib28">Gasparini et al., 2008</xref>; <xref ref-type="bibr" rid="bib83">Tiozzo et al., 2008</xref>), apoptosis (<xref ref-type="bibr" rid="bib45">Lauzon et al., 1993</xref>; <xref ref-type="bibr" rid="bib13">Cima et al., 2009</xref>), and alternative reproduction pathways (<xref ref-type="bibr" rid="bib67">Sabbadin et al., 1975</xref>; <xref ref-type="bibr" rid="bib49">Manni and Burighel, 2006</xref>; <xref ref-type="bibr" rid="bib87">Voskoboynik et al., 2007</xref>; <xref ref-type="bibr" rid="bib46">Lemaire, 2011</xref>), including stem cell-mediated regeneration of complete individuals within a colony unit (<xref ref-type="bibr" rid="bib41">Laird et al., 2005</xref>; <xref ref-type="bibr" rid="bib88">Voskoboynik et al., 2008</xref>; <xref ref-type="bibr" rid="bib64">Rinkevich et al., 2013</xref>).</p><p><italic>Botryllus schlosseri</italic> is an invasive colonial urochordate, living in large communities consisting of multiple colonies organized into expansive mats that coat a variety of marine surfaces, such as rocks, molluscs, multicellular algae, and ship hulls (<xref ref-type="bibr" rid="bib80">Stoner et al., 2002</xref>). Communities develop among compatible colonies, governed by a genetically encoded histocompatibility system (<xref ref-type="bibr" rid="bib66">Sabbadin, 1962</xref>; <xref ref-type="bibr" rid="bib70">Scofield et al., 1982</xref>). The progeny of each colony usually represents a clone of the vascularly connected, asexually reproducing individuals (zooids) derived from a single planktonic larva (<xref ref-type="bibr" rid="bib49">Manni and Burighel, 2006</xref>; <xref ref-type="fig" rid="fig1">Figure 1A–D</xref>). Compatible colonies fuse their blood vessels to generate a chimera, while incompatible colonies reject one another, maintaining individuality (<xref ref-type="bibr" rid="bib66">Sabbadin, 1962</xref>; <xref ref-type="bibr" rid="bib70">Scofield et al., 1982</xref>; <xref ref-type="bibr" rid="bib97">Voskoboynik et al., 2013</xref>). Following the fusion of blood vessels between colonies, the circulating stem cells of one partner colony can compete and replace the germline and/or the soma of the other partner (<xref ref-type="bibr" rid="bib78">Stoner and Weissman, 1996</xref>; <xref ref-type="bibr" rid="bib79">Stoner et al., 1999</xref>; <xref ref-type="bibr" rid="bib41">Laird et al., 2005</xref>; <xref ref-type="bibr" rid="bib88">Voskoboynik et al., 2008</xref>; <xref ref-type="bibr" rid="bib64">Rinkevich et al., 2013</xref>), a phenomenon analogous to allogeneic transplantation.<fig-group><fig id="fig1" position="float"><object-id pub-id-type="doi">10.7554/eLife.00569.003</object-id><label>Figure 1.</label><caption><title><italic>Botryllus schlosseri</italic> anatomy, life cycle, and phylogeny.</title><p><italic>B. schlosseri</italic> reproduces both through sexual and asexual (budding) pathways, giving rise to virtually identical adult body plans. Upon settlement, the tadpole phase of the <italic>B. schlosseri</italic> lifecycle (<bold>A</bold>) will metamorphose into a founder individual (oozooid) (<bold>B</bold>), which through asexual budding, generates a colony. The colony includes three overlapping generations: an adult zooid, a primary bud, and a secondary bud, all of which are connected via a vascular network (bv) embedded within a gelatinous matrix (termed tunic). The common vasculature terminates in finger-like protrusions (termed ampullae; <bold>B</bold>–<bold>D</bold>). Bud development commences in stage A (<bold>C</bold>). Through budding, <italic>B. schlosseri</italic> generates its entire body, including digestive (ds) and respiratory (brs) systems, a simple tube-like heart (h), an endostyle (en) that harbors a stem cell niche, a primitive neural complex, and siphons used for feeding, waste, and releasing larvae (<bold>B</bold>–<bold>D</bold>). Each week, successive buds grow large (<bold>D</bold>) and complete replication of all zooids in the colony, ultimately replacing the previous generation’s zooids, which die through a massive apoptosis. (<bold>E</bold>) A phylogenomic tree produced from analysis of 521 nuclear genes (40,798 aligned amino acids) from 15 species, including <italic>B. schlosseri</italic>. Scale bar-1 mm.</p><p><bold>DOI:</bold> <ext-link ext-link-type="doi" xlink:href="10.7554/eLife.00569.003">http://dx.doi.org/10.7554/eLife.00569.003</ext-link></p></caption><graphic xlink:href="elife00569f001"/></fig><fig id="fig1s1" position="float" specific-use="child-fig"><object-id pub-id-type="doi">10.7554/eLife.00569.004</object-id><label>Figure 1—figure supplement 1.</label><caption><title>Mitogenomic analysis of tunicates and deuterostomes.</title><p>Based on the 13 mitochondrially-encoded proteins. The tree was inferred by PhyloBayes under a GTR+G+CAT model. Support values at nodes represents Bayesian Posterior Probability (PP) and are reported only when >0.5 and <0.95. Nodes with PP < 0.5 were collapsed. The tree was rooted with the non-deuterostome <italic>Drosophila</italic> and <italic>Aplysia</italic> species. The main deuterostome lineages are represented in different colours. Abbreviations for tunicate orders: Stolido: Stolidobranchia; Phlebo: Phlebobranchia; Aplouso: Aplousobranchia. Colonial tunicates are indicated by an asterisk and include <italic>Botryllus schlosseri</italic>, all Aplousobranchia ascidians, and the thaliacean <italic>Doliolum nationalis</italic>.</p><p><bold>DOI:</bold> <ext-link ext-link-type="doi" xlink:href="10.7554/eLife.00569.004">http://dx.doi.org/10.7554/eLife.00569.004</ext-link></p></caption><graphic xlink:href="elife00569fs001"/></fig></fig-group></p><p>Tunicates are classified as chordates because their planktonic larva stage (<xref ref-type="fig" rid="fig1">Figure 1A</xref>) shares structural characteristics with all chordates: a notochord, dorsal neural tube, segmented musculature, and gill slits (<xref ref-type="bibr" rid="bib15">Darwin, 1874</xref>; <xref ref-type="bibr" rid="bib18">Dehal et al., 2002</xref>). Larvae settle in response to light and metamorphose into sessile individuals (<xref ref-type="fig" rid="fig1">Figure 1B</xref>), which lose most of their chordate phenotypes (<xref ref-type="bibr" rid="bib15">Darwin, 1874</xref>; <xref ref-type="bibr" rid="bib18">Dehal et al., 2002</xref>). Tunicates reproduce either sexually (solitary tunicates; <xref ref-type="bibr" rid="bib18">Dehal et al., 2002</xref>; <xref ref-type="bibr" rid="bib46">Lemaire, 2011</xref>), or sexually and asexually (colonial tunicates; <xref ref-type="bibr" rid="bib49">Manni and Burighel, 2006</xref>; <xref ref-type="bibr" rid="bib46">Lemaire, 2011</xref>). These two reproductive modes give rise to nearly identical complex adult body plans, including digestive and respiratory systems, a simple tube-like heart, siphons, an endostyle, a neural complex, ovary and testis (<xref ref-type="bibr" rid="bib49">Manni and Burighel, 2006</xref>; <xref ref-type="fig" rid="fig1">Figure 1A–D</xref>).</p><p>The ability to reproduce asexually renders colonial tunicates robust survivors, capable of rapid proliferation and whole body regeneration. These unique features of colonial tunicates coupled with their key evolutionary position and long history of scientific study prompted us to sequence the <italic>B. schlosseri</italic> genome.</p></sec><sec id="s2" sec-type="results|discussion"><title>Results and discussion</title><sec id="s2-1"><title>A novel genome sequencing method for deciphering repeat-rich genomes</title><p>The <italic>B. schlosseri</italic> genome was previously estimated to be 725 Mb based on flow cytometry analysis (<xref ref-type="bibr" rid="bib17">De Tomaso et al., 1998</xref>), and metaphase spreads suggested that it is organized into 16 chromosomes (<xref ref-type="bibr" rid="bib14">Colombera, 1963</xref>). To accurately assemble this relatively large genome, we developed a novel method to accurately sequence many large fragments in parallel. This long read sequencing approach (LRseq) effectively increases the read length of a next generation sequencer by 50-fold, while decreasing the error rate by orders of magnitude (<xref ref-type="fig" rid="fig2">Figure 2</xref>; ‘Materials and methods’ under ‘Genome sequencing and assembly’). Our approach began with genomic DNA sheared to 6–8 kb fragments. Limiting dilution was used to create aliquots of a few hundred to a few thousand DNA molecules. Each aliquot was amplified with PCR, fragmented (600–800 bp), barcoded, and sequenced by Illumina HiSeq 2000 (<xref ref-type="fig" rid="fig2">Figure 2</xref>). The Velvet assembler (<xref ref-type="bibr" rid="bib96">Zerbino, 2010</xref>) was used to assemble short paired-end reads from each barcode (i.e., well) separately, thus simplifying the assembly problem and creating effective read lengths corresponding to the original large fragment sizes (<xref ref-type="fig" rid="fig2">Figure 2B</xref>; <xref ref-type="supplementary-material" rid="SD3-data">Supplementary file 2A</xref>, <xref ref-type="supplementary-material" rid="SD3-data">Supplementary file 2B</xref>). Limiting the number of DNA molecules per well greatly reduces or eliminates chances of having a repeated or duplicate sequence within a defined partition. Furthermore, since each well was over-sequenced, the error rate is reduced by the coverage and is substantially improved from the intrinsic error rate of the sequencer (<xref ref-type="supplementary-material" rid="SD3-data">Supplementary file 2C</xref>). This procedure is amenable to automation in multiwell plates, and we obtained data from twelve 96-well plates (<xref ref-type="supplementary-material" rid="SD3-data">Supplementary file 2A</xref>, <xref ref-type="supplementary-material" rid="SD3-data">Supplementary file 2B</xref>). We validated this method on human genomic DNA, for which an independent reference is available (<xref ref-type="fig" rid="fig2s1">Figure 2—figure supplement 1</xref>).<fig-group><fig id="fig2" position="float"><object-id pub-id-type="doi">10.7554/eLife.00569.005</object-id><label>Figure 2.</label><caption><title>A novel short read genome sequencing and assembly method for complex, repeat-rich genomes.</title><p>(<bold>A</bold>) Genomic DNA is sheared into 6–8 kb fragments, partitioned into twelve 96-well plates, further fragmented to 600–800 bp, barcoded and sequenced separately for each well (Illumina HiSeq 2000 2x100bp), and assembled by Velvet. (<bold>B</bold>) Size distribution of contigs assembled from a representative library preparation (BL5). (<bold>C</bold>) Limiting the number of amplifiable molecules per well (barcode) to the level that almost 100% of all amplifiable molecules are present as single copies (<1000 gDNA molecules) greatly reduces the chance of having a repeated or homologous sequence within a well. Thus, sample complexity is significantly reduced, which reduces ambiguity in the reconstruction of a consensus sequence. As an example, two different predicted repeat-containing genes (g2001,1189bp; and g2002, 688bp) were assembled from two different wells (005 and 145 respectively). Although they contain highly homologous repeats (represented as a Dot Matrix plot, (<bold>D</bold>) these repetitive genes were resolved and reconstructed properly in the final assembly.</p><p><bold>DOI:</bold> <ext-link ext-link-type="doi" xlink:href="10.7554/eLife.00569.005">http://dx.doi.org/10.7554/eLife.00569.005</ext-link></p></caption><graphic xlink:href="elife00569f002"/></fig><fig id="fig2s1" position="float" specific-use="child-fig"><object-id pub-id-type="doi">10.7554/eLife.00569.006</object-id><label>Figure 2—figure supplement 1.</label><caption><title>Validation of LRseq approach on human genomic DNA.</title><p>Genomic DNA from HapMap NA7019 was prepared for LRseq. These figures show LRseq assembly statistics, obtained by mapping sequenced reads to human genome reference 36. These data were also used to estimate the concentration of amplifiable molecules in <italic>B. schlosseri</italic> 356a DNA samples prepared by an identical protocol.</p><p><bold>DOI:</bold> <ext-link ext-link-type="doi" xlink:href="10.7554/eLife.00569.006">http://dx.doi.org/10.7554/eLife.00569.006</ext-link></p></caption><graphic xlink:href="elife00569fs002"/></fig><fig id="fig2s2" position="float" specific-use="child-fig"><object-id pub-id-type="doi">10.7554/eLife.00569.007</object-id><label>Figure 2—figure supplement 2.</label><caption><title>Clonality confirmation of the genome of clone Sc6a-b and clone 356a.</title><p>(<bold>A</bold>) Sc6a-b clone, a long lived (7 years old when sampled), highly regenerative colony was chosen to be sequenced. Sc6a-b subclones were starved for 48 hr prior to sampling, and 400 individuals (zooids) were sampled for sequencing. Subclones of this colony are still alive and maintained in our mariculture facility. (<bold>B</bold>) A few zooids were taken from every sample set and tested via AFLP’s genotyping analysis, confirming that all zooids belong to one genotype. (<bold>C</bold> and <bold>D)</bold>. Sc6a-b microsatellite loci were homozygous (2 loci) and heterozygous (1 loci) confirming one genotype. (<bold>E</bold> and <bold>F</bold>) 356a clone was a highly regenerative long lived colony. 150 individuals were sampled and their gDNA was sequenced. Microsatellite loci were homozygous (<bold>E</bold> and <bold>F</bold>), confirming one genotype. Scale bar-1 mm</p><p><bold>DOI:</bold> <ext-link ext-link-type="doi" xlink:href="10.7554/eLife.00569.007">http://dx.doi.org/10.7554/eLife.00569.007</ext-link></p></caption><graphic xlink:href="elife00569fs003"/></fig><fig id="fig2s3" position="float" specific-use="child-fig"><object-id pub-id-type="doi">10.7554/eLife.00569.008</object-id><label>Figure 2—figure supplement 3.</label><caption><title>Statistics for 356a assembly.</title><p>(<bold>A</bold>) Contig length distribution. (<bold>B</bold>) Distribution of coverage of 356a assembled Celera contigs by Velvet assembled fragments.</p><p><bold>DOI:</bold> <ext-link ext-link-type="doi" xlink:href="10.7554/eLife.00569.008">http://dx.doi.org/10.7554/eLife.00569.008</ext-link></p></caption><graphic xlink:href="elife00569fs004"/></fig><fig id="fig2s4" position="float" specific-use="child-fig"><object-id pub-id-type="doi">10.7554/eLife.00569.009</object-id><label>Figure 2—figure supplement 4.</label><caption><title>Interspersed and tandem repeats distribution in the <italic>B. schlosseri</italic> genome.</title><p>(<bold>A</bold>) RepeatScout (version 1.0.5; <xref ref-type="bibr" rid="bib60">Price et al., 2005</xref>) was used to identify interspersed repeat elements de novo using a k-mer length of 14. All identified repeats were subsequently filtered for tandem repeat and low complexity content, using RepeatScout. Genome-wide interspersed repeats were catalogued using RepeatMasker (version open-4.0; <xref ref-type="bibr" rid="bib74">Smit et al., 1996-2010</xref>). The distribution of large interspersed repeats families (≥1kb) ordered by copy number is presented. (<bold>B</bold>) To identify both perfect (100% sequence identity) and degenerate genomic tandem repeats, we used XSTREAM (<xref ref-type="bibr" rid="bib54">Newman and Cooper, 2007</xref>), with a minimum repeat length of 20 bp, minimum word match of 0.8, and otherwise default parameters. 3,183,988 tandem repeats were identified, period range: 1–6525 bp, copy number range: 2.7–1096x</p><p><bold>DOI:</bold> <ext-link ext-link-type="doi" xlink:href="10.7554/eLife.00569.009">http://dx.doi.org/10.7554/eLife.00569.009</ext-link></p></caption><graphic xlink:href="elife00569fs005"/></fig><fig id="fig2s5" position="float" specific-use="child-fig"><object-id pub-id-type="doi">10.7554/eLife.00569.010</object-id><label>Figure 2—figure supplement 5.</label><caption><title>Coverage of 4 fosmids by the <italic>B. schlosseri</italic> assembly.</title><p>Fosmid sequences (red lines; gi; ac numbers are shown, number=bp), were compared with <italic>B. schlosseri</italic> contigs using blast (e-value < e<sup>−10</sup>). Best alignments between contigs >500bp (black lines) are shown. Repetitive regions are marked (blue).</p><p><bold>DOI:</bold> <ext-link ext-link-type="doi" xlink:href="10.7554/eLife.00569.010">http://dx.doi.org/10.7554/eLife.00569.010</ext-link></p></caption><graphic xlink:href="elife00569fs006"/></fig><fig id="fig2s6" position="float" specific-use="child-fig"><object-id pub-id-type="doi">10.7554/eLife.00569.011</object-id><label>Figure 2—figure supplement 6.</label><caption><title>Validation of putative <italic>B. schlosseri</italic> genes.</title><p>We experimentally validated 145 <italic>B. schlosseri</italic> predicted genes. Genes were validated by observing expression in <italic>B. schlosseri</italic> cDNAs and gDNA via PCR and qPCR assays and resequencing them on Sanger. (<bold>A</bold>) cDNA PCR product of several early erythroid and HSC putative genes identified in <italic>B. schlosseri</italic> tissues (endostyle, blood or zooid). Names of the putative genes and the tissues that were tested in this experiment are indicated on the gel image. (<bold>B</bold>) qPCR expression in <italic>B. schlosseri</italic> blood of six putative immunity genes.</p><p><bold>DOI:</bold> <ext-link ext-link-type="doi" xlink:href="10.7554/eLife.00569.011">http://dx.doi.org/10.7554/eLife.00569.011</ext-link></p></caption><graphic xlink:href="elife00569fs007"/></fig></fig-group></p><p>Genomic DNA (gDNA) was extracted from tissue from two long-lived <italic>B. schlosseri</italic> colonies (Sc6a-b and 356a) raised in our mariculture facility (‘Materials and methods’ under ‘Animals and genomic DNA sample collection’). Microsatellite heterogeneity confirmed clonality (<xref ref-type="fig" rid="fig2s2">Figure 2—figure supplement 2</xref>). Each colony was sequenced and assembled separately. We first attempted conventional sequencing and assembly from colony Sc6a-b DNA using Roche 454 Titanium (Branford, USA) and Illumina GAII (San Diego, USA) sequences (<xref ref-type="supplementary-material" rid="SD3-data">Supplementary file 2C</xref>, ‘Materials and methods’ under ‘Genome sequencing and assembly’). This Sc6a-b assembly achieved an average N50 of 1 kb, yielding short contigs that were insufficient for whole genome assembly (<xref ref-type="supplementary-material" rid="SD3-data">Supplementary file 2D</xref>). By contrast, when we applied LRseq to the 356a clone, we obtained a 566 Mbp assembly with a dramatically improved N50 of 7kb (<xref ref-type="supplementary-material" rid="SD3-data">Supplementary file 2D</xref>; <xref ref-type="fig" rid="fig2s3">Figure 2—figure supplement 3</xref>). This approach not only simplified the assembly of a complex eukaryotic genome, but also reduced the confounding impact of repetitive DNA on contig assembly (<xref ref-type="fig" rid="fig2">Figure 2C–D</xref>; <xref ref-type="fig" rid="fig2s3">Figure 2—figure supplement 3</xref>).</p></sec><sec id="s2-2"><title>Chromosome assignments, repeats, and gene content</title><p>We sought to determine the chromosomal organization of the <italic>B. schlosseri</italic> genome. Using embryos from a wild <italic>B. schlosseri</italic> colony from Monterey Bay, we loaded a dilute solution of dispersed metaphase chromosomes into a microfluidic device as previously described (<xref ref-type="bibr" rid="bib24">Fan et al., 2011</xref>). The isolated metaphase chromosome mixtures from 21 individual wells were amplified, barcoded, and sequenced separately (‘Materials and methods’ under ‘Chromosome sequencing, assignment and assembly’; <xref ref-type="bibr" rid="bib24">Fan et al., 2011</xref>; <xref ref-type="bibr" rid="bib92">Xu et al., 2011</xref>). Using the 21 chromosome mixtures, containing between 1 and 4 chromosomes each, 356a genomic contigs larger than 7 kb were aligned to the chromosome reads using BWA. Then, scaffolds were assigned to chromosome clusters by iterative K-means clustering on the correlation matrix between each scaffold (<xref ref-type="fig" rid="fig3">Figure 3</xref>; ‘Materials and methods’ under ‘Chromosome sequencing, assignment and assembly’). Assuming that <italic>B. schlosseri</italic> carries 16x2 chromosomes (<xref ref-type="bibr" rid="bib14">Colombera, 1963</xref>), this approach clearly resolves 13 chromosomes with a mean chromosome meta-scaffold size of 16,234 kb and a mean N50 of 38 kb (<xref ref-type="fig" rid="fig3">Figure 3</xref>; <xref ref-type="fig" rid="fig3s1">Figure 3—figure supplement 1</xref>; <xref ref-type="supplementary-material" rid="SD3-data">Supplementary file 2D</xref>). Finally, we attempted to improve our genomic assembly by incorporating the additional 21 chromosome assemblies into a hybrid assembly (‘Materials and methods’ under ‘Chromosome sequencing, assignment and assembly’; <xref ref-type="fig" rid="fig3s2">Figure 3—figure supplement 2</xref>; <xref ref-type="fig" rid="fig3s1">Figure 3—figure supplement 1</xref>). An overall improvement in N50 was achieved, yielding a final 580 Mbp draft assembly (<xref ref-type="supplementary-material" rid="SD3-data">Supplementary file 2D</xref>).<fig-group><fig id="fig3" position="float"><object-id pub-id-type="doi">10.7554/eLife.00569.012</object-id><label>Figure 3.</label><caption><title>Clustering and assignment of <italic>B.schlosseri</italic> chromosomes.</title><p>(<bold>A</bold>) We isolated and sequenced 21 metaphase chromosome mixtures using a microfluidic device. Each chromosome mixtures was amplified, barcoded and sequenced separately (IlluminaHiSeq). Genomic contigs larger than 7 kb were aligned to the chromosome reads using BWA. Subsequently, assignment of scaffolds to chromosome cluster was performed using iterative K-means clustering on the correlation matrix between each scaffold. In addition, to find the number of clusters/chromosomes we performed k-means clustering iteratively across different cluster numbers. This plot demonstrates that increasing beyond 13 clusters does little to reduce the error; therefore 13 chromosomes were successfully resolved. (<bold>B</bold>) To estimate the configuration after the clustering step, 17 out of the 21 wells were deduced to contain information that is used in the clustering process. The average number of normalized reads counts from each metaphase chromosome mixture (well) that align to each scaffold in a cluster group was calculated and plotted. Each peak represented can be inferred to denote the presence of a specific chromosome in the well. Examples of four representative wells are presented, metaphase chromosome mixtures contained between 1–4 chromosomes (see also <xref ref-type="fig" rid="fig3s1">Figure 3—figure supplement 1</xref>).</p><p><bold>DOI:</bold> <ext-link ext-link-type="doi" xlink:href="10.7554/eLife.00569.012">http://dx.doi.org/10.7554/eLife.00569.012</ext-link></p></caption><graphic xlink:href="elife00569f003"/></fig><fig id="fig3s1" position="float" specific-use="child-fig"><object-id pub-id-type="doi">10.7554/eLife.00569.013</object-id><label>Figure 3—figure supplement 1.</label><caption><title>Distribution of <italic>B. schlosseri</italic> chromosome groups across different wells.</title><p>We isolated and sequenced metaphase diluted chromosome mixtures using a microfluidic device. Each chromosome mixture was amplified, barcoded and sequenced separately (IlluminaHiSeq). The average number of normalized reads counts from each diluted chromosome mixture (well) that align to each scaffold in a cluster group was calculated and plotted. Each peak represents the presence of a specific chromosome in the well. In the 17 wells presented above, chromosome mixtures contained between 1–4 chromosomes.</p><p><bold>DOI:</bold> <ext-link ext-link-type="doi" xlink:href="10.7554/eLife.00569.013">http://dx.doi.org/10.7554/eLife.00569.013</ext-link></p></caption><graphic xlink:href="elife00569fs008"/></fig><fig id="fig3s2" position="float" specific-use="child-fig"><object-id pub-id-type="doi">10.7554/eLife.00569.014</object-id><label>Figure 3—figure supplement 2.</label><caption><title>Pipeline for the assignment of chromosome scaffolds and the 356a–chromosomes hybrid assembly process.</title><p><bold>DOI:</bold> <ext-link ext-link-type="doi" xlink:href="10.7554/eLife.00569.014">http://dx.doi.org/10.7554/eLife.00569.014</ext-link></p></caption><graphic xlink:href="elife00569fs009"/></fig><fig id="fig3s3" position="float" specific-use="child-fig"><object-id pub-id-type="doi">10.7554/eLife.00569.015</object-id><label>Figure 3—figure supplement 3.</label><caption><title>356a-Chromosome hybrid assembly of <italic>B. schlosseri</italic>.</title><p>Reads from each of the individual chromosome sample preparations were subsequently assembled using Velvet. The resulting chromosome level contigs were then merged with the 356a assembly to create a 356a-chromosome hybrid assembly.</p><p><bold>DOI:</bold> <ext-link ext-link-type="doi" xlink:href="10.7554/eLife.00569.015">http://dx.doi.org/10.7554/eLife.00569.015</ext-link></p></caption><graphic xlink:href="elife00569fs010"/></fig><fig id="fig3s4" position="float" specific-use="child-fig"><object-id pub-id-type="doi">10.7554/eLife.00569.016</object-id><label>Figure 3—figure supplement 4.</label><caption><title>The fraction of <italic>B. schlosseri</italic> predicted intron-less genes (blue) and genes with introns (red) in the different chromosomes.</title><p><bold>DOI:</bold> <ext-link ext-link-type="doi" xlink:href="10.7554/eLife.00569.016">http://dx.doi.org/10.7554/eLife.00569.016</ext-link></p></caption><graphic xlink:href="elife00569fs011"/></fig></fig-group></p><p>Repetitive elements can confound traditional genome assembly methods (<xref ref-type="bibr" rid="bib68">Salzberg et al., 2012</xref>), and are often removed to avoid assembly errors (e.g., <xref ref-type="bibr" rid="bib18">Dehal et al., 2002</xref>; <xref ref-type="bibr" rid="bib61">Putnam et al., 2007</xref>; <xref ref-type="bibr" rid="bib72">Shinzato et al., 2011</xref>; <xref ref-type="supplementary-material" rid="SD3-data">Supplementary file 2H</xref>). However, because LRSeq was designed to explicitly resolve long read sequences even in the presence of repeats, we further evaluated LRSeq performance by enumerating two major repeat classes in the assembly, interspersed repeats and tandem repeats. We used RepeatScout for de novo identification of interspersed elements (<xref ref-type="bibr" rid="bib60">Price et al., 2005</xref>), and RepeatMasker (<xref ref-type="bibr" rid="bib74">Smit et al., 1996–2010</xref>) for analysis of genome-wide repeat demographics. We identified 6601 interspersed repeat families, each present in at least three copies, that together cover ∼65% of the <italic>B. schlosseri</italic> genome assembly (<xref ref-type="supplementary-material" rid="SD3-data">Supplementary file 2E</xref>). We also identified 1400 large repeat families, defined as interspersed repeats with genomic alignments of at least 1 kb. Notably, large interspersed repeats are found in a median of four chromosomes (of 13 chromosome assignments), and >10% of large interspersed repeat families occur in over 100 copies (<xref ref-type="supplementary-material" rid="SD3-data">Supplementary file 2E</xref>; <xref ref-type="fig" rid="fig2s4">Figure 2—figure supplement 4A</xref>). Despite considerable repetitive content, we observed a strong concordance between genomic contigs and Sanger fosmid sequences, supporting the effectiveness of the LRseq approach (e.g., see <xref ref-type="fig" rid="fig2s5">Figure 2—figure supplement 5</xref>). As a further validation, we interrogated our former sc6ab 380 Mb assembly for the same interspersed repeat elements, with the expectation of recovering less repeats. Indeed, only 52.27% of sc6ab base pairs were masked using the same repeat library. These results validate the repeat families and support their widespread presence in the <italic>B. schlosseri</italic> genome. Finally, we analyzed the assembly for perfect (100% sequence identity) and degenerate tandem repeat content using XSTREAM (<xref ref-type="bibr" rid="bib54">Newman and Cooper, 2007</xref>). In all, ∼3.2 million tandem repeats were identified, with periods ranging from 1–6525 bp and copy numbers ranging from 2–1096x (<xref ref-type="fig" rid="fig2s4">Figure 2—figure supplement 4B</xref>). By comparison, the human genome was assembled to a very high standard using conventional Sanger technology and later Illumina technology, and was found to contain over 50% repeats (<xref ref-type="bibr" rid="bib37">de Konning et al., 2011</xref>). The considerable repeat content and diversity in the <italic>B. schlosseri</italic> genome indicates that LRseq may have general utility for resolving repeat architectures in diverse eukaryotic genomes.</p><p>We further validated the assembly by comparison to a variety of independently generated <italic>B. schlosseri</italic> sequence data. All <italic>B. schlosseri</italic> genes (n = 66), fosmid sequences (n = 11) and most of the 98,611 expressed sequence tags (ESTs) available from NCBI aligned with the <italic>B. schlosseri</italic> draft assembly (<xref ref-type="supplementary-material" rid="SD3-data">Supplementary file 2F</xref>, <xref ref-type="fig" rid="fig2s5">Figure 2—figure supplement 5</xref>; ‘Materials and methods’ under ‘Evaluation of 365a-chromosomes hybrid assembly’). Moreover, nearly all of the independently sequenced and assembled Roche 454 Sc6a-b contigs (93%) were successfully mapped to the assembly (<xref ref-type="supplementary-material" rid="SD3-data">Supplementary files 2F</xref>; ‘Materials and methods’ under ‘Evaluation of 365a-chromosomes hybrid assembly’). Taken together, these data represent independent validation of the quality and integrity of the <italic>B. schlosseri</italic> draft assembly which compares favorably to, and in some cases exceeds, existing wild type genomes with respect to ungapped chromosome contig N50, chromosome assignments, and repeat sequence integration (e.g., see <xref ref-type="supplementary-material" rid="SD3-data">Supplementary file 2G</xref>).</p><p>Next, to identify protein-encoding genes, we generated RNA-Seq data (88 Gb; <xref ref-type="supplementary-material" rid="SD3-data">Supplementary file 2C</xref>) from 19 different colonies to guide the gene prediction program Augustus (<xref ref-type="bibr" rid="bib77">Stanke et al., 2008</xref>). In total, 38,730 putative protein-coding loci were identified, all of which have at least 30% transcript support (‘Materials and methods’ under ‘RNA sequencing’, ‘Gene prediction’, ‘Gene annotation’; <xref ref-type="supplementary-material" rid="SD3-data">Supplementary file 2I</xref>). Among these predicted genes, 27,463 include a start and stop codon, 13,910 genes have at least one intron, and 13,553 are intron-less (<xref ref-type="supplementary-material" rid="SD3-data">Supplementary file 2H</xref>). Moreover, for each of the <italic>B. schlosseri</italic> chromosomes 55% of genes have at least one intron while ∼45% are intron-less (<xref ref-type="fig" rid="fig3s4">Figure 3—figure supplement 4</xref>). In addition, the mean <italic>B. schlosseri</italic> gene length is predicted to be 3.6 kbp with a mean exon length of 170 bp (<xref ref-type="supplementary-material" rid="SD3-data">Supplementary file 2H</xref>). We tested a set of 145 genes by PCR and Sanger-sequencing, and were able to confirm 144 of them (99.3%), further validating the genome assembly (<xref ref-type="fig" rid="fig2s6">Figure 2—figure supplement 6</xref>, ‘Materials and methods’ under ‘Evaluation of genes’).</p><p>Using these predicted genes, we investigated the evolutionary position of <italic>B. schlosseri</italic>. Phylogenomic analysis of 425 conserved homologous genes across 15 diverse species, and mitogenomic analysis of 65 species both support the phylogenic position of tunicates within Chordata (<xref ref-type="bibr" rid="bib19">Delsuc et al., 2006</xref>; <xref ref-type="fig" rid="fig1">Figure 1E</xref>; <xref ref-type="fig" rid="fig1s1">Figure 1—figure supplement 1</xref>, <xref ref-type="supplementary-material" rid="SD2-data">Supplementary file 1</xref>; ‘Materials and methods’ under ‘Mitochondrial phylogeny’, ‘Phylogenomic analyses’), and provide strong evidence that colonial and solitary tunicates represent the closest living relative of vertebrates.</p></sec><sec id="s2-3"><title><italic>B. schlosseri</italic> and the emergence of vertebrate phenotypes</title><p>We investigated the <italic>B. schlosseri</italic> genome for molecular events underlying the emergence and early diversification of vertebrates. Protein-encoding genes in <italic>B. schlosseri</italic> were compared to a diverse sampling of 18 well-annotated genomes from other species, and for each genome, we assessed the presence or absence of significant homology to human or mouse proteins (<xref ref-type="supplementary-material" rid="SD1-data">Figure 4—source data 1A</xref>; ‘Materials and methods’ under ‘Evolution analysis’). All proteomes were combined into a single data set (of constant size) for blast analysis. As such, differences in the number of genes per genome would not have impacted our results. An e-value cutoff of e<sup>−10</sup> was selected to strike a balance between statistical significance and the detection of remote homology (‘Materials and methods’ under ‘Evolution analysis’). Among the analyzed species, we found that 77% of human genes could be traced back to protochordates with at least some homology (e-value ≤ e<sup>−10</sup>), around 10% less than chicken (85%) and frog (86%) genomes, indicating that the common ancestral genome of tunicates and vertebrates had homology to at least 77% of the human gene repertoire. This list includes about 660 genes present in the common ancestor, but absent in non-chordate species (<xref ref-type="supplementary-material" rid="SD1-data">Figure 4—source data 1B</xref>).</p><p>Among the genes found in <italic>B. schlosseri</italic> (either alone or in combination with other protochordate species) and vertebrates (<xref ref-type="supplementary-material" rid="SD1-data">Figure 4—source data 1B</xref>, <xref ref-type="supplementary-material" rid="SD1-data">Figure 4—source data 1C</xref>), we found genes that are critical to the development and function of the vertebrate heart (e.g., <italic>ALPK3</italic>, <italic>TNNT2</italic>; <xref ref-type="bibr" rid="bib32">Hosoda et al., 2001</xref>; <xref ref-type="bibr" rid="bib26">Frey et al., 2012</xref>), and eye (gamma and beta crystallins; <xref ref-type="bibr" rid="bib81">Sun et al., 2011</xref>), and the ability to hear (<italic>GJB</italic>2/3/6 <italic>CLDN</italic>; <xref ref-type="bibr" rid="bib63">Rabionet et al., 2000</xref>; <xref ref-type="bibr" rid="bib91">Wilcox et al., 2001</xref>; <xref ref-type="fig" rid="fig4">Figure 4</xref>, <xref ref-type="supplementary-material" rid="SD1-data">Figure 4—source data 1C</xref>). Mutations in these genes are implicated in a variety of human diseases and disorders, including heart diseases (<xref ref-type="bibr" rid="bib26">Frey et al., 2012</xref>), cataracts (<xref ref-type="bibr" rid="bib81">Sun et al., 2011</xref>), deafness (<xref ref-type="bibr" rid="bib63">Rabionet et al., 2000</xref>; <xref ref-type="bibr" rid="bib91">Wilcox et al., 2001</xref>), and nemaline myopathy (<xref ref-type="bibr" rid="bib35">Johnston et al., 2000</xref>; <xref ref-type="fig" rid="fig4">Figure 4</xref>, <xref ref-type="supplementary-material" rid="SD1-data">Figure 4—source data 1C</xref>). In addition, <italic>B. schlosseri</italic> was the only protochordate in our analysis with proteins homologous to pregnancy-specific glycoproteins (PSGs). PSGs are the major placental polypeptides, and complications in pregnancies and spontaneous abortions have been associated with abnormally low levels of PSGs in the maternal blood (<xref ref-type="bibr" rid="bib9">Camolotto et al., 2010</xref>). Analogous to mammalian pregnancies, a common blood supply among kin is established and tolerated in <italic>B. schlosseri</italic> chimeras (<xref ref-type="bibr" rid="bib89">Voskoboynik et al., 2009</xref>). Thus, by studying PSG-like proteins in <italic>B. schlosseri</italic>, new insights might be gained into maternal and fetal medicine.<fig id="fig4" position="float"><object-id pub-id-type="doi">10.7554/eLife.00569.017</object-id><label>Figure 4.</label><caption><title>Innovations underlying the emergence and early diversification of vertebrates.</title><p>Protein-encoding genes in <italic>B. schlosseri</italic> were compared to a diverse sampling of 18 well-annotated genomes from other species, and for each genome, the presence or absence of homology to human or mouse proteins was assessed (all vs all blastp e-value threshold of 1e<sup>−10</sup>; <xref ref-type="supplementary-material" rid="SD1-data">Figure 4—source data 1A</xref>). Our data indicate that homologs of ∼660 human/mouse genes were present in the common ancestor of tunicates and vertebrates, but not non-chordate species <xref ref-type="supplementary-material" rid="SD1-data">Figure 4—source data 1B</xref>). Among them are genes associated with the development, function, and pathology of vertebrate features, including heart, eye, hearing, immunity, pregnancy and cancer (<xref ref-type="supplementary-material" rid="SD1-data">Figure 4—source data 1C</xref>). Gray box = no homology; Yellow box = homology.</p><p><bold>DOI:</bold> <ext-link ext-link-type="doi" xlink:href="10.7554/eLife.00569.017">http://dx.doi.org/10.7554/eLife.00569.017</ext-link></p><p><supplementary-material id="SD1-data"><object-id pub-id-type="doi">10.7554/eLife.00569.018</object-id><label>Figure 4—source data 1.</label><caption><title>Vertebrates evolution.</title><p>(<bold>A</bold>) Innovations that underline the emergence and early diversification of vertebrates. We compared protein-encoding genes in <italic>B. schlosseri</italic> to a diverse sampling of 18 well-annotated genomes from other species. All protein sequences were compared by blastp against all other protein sequences. Based on this data set a list was generated of genes known from human and mouse and their existence (1) or absence (0) in the tested species (e-value < e<sup>−10</sup>). (<bold>B</bold>) The 660 putative genes present in protochordates, human and mouse, but absent in non-chordate species. This list was generated from <xref ref-type="supplementary-material" rid="SD1-data">Figure 4—source data 1A</xref>. Per every species, or species group we filtered for genes that were present in the tested species/species group and in human or mouse, but were absent in non-chordate species. (<bold>C</bold>) Innovations that underline the emergence and early diversification of vertebrates. This table is based on data gathered in <xref ref-type="supplementary-material" rid="SD1-data">Figure 4—source data 1B</xref> and is focused on the genes that are present in <italic>B. schlosseri</italic> and vertebrates (either alone or in combination with other protochordate species) but are absent in non-chordate species. A ToppGene analysis is presented of these sets of genes which summarized their molecular functions, biological processes, human and mouse phenotypes, and pathways they are involved in, gene families, drugs and human diseases.</p><p><bold>DOI:</bold> <ext-link ext-link-type="doi" xlink:href="10.7554/eLife.00569.018">http://dx.doi.org/10.7554/eLife.00569.018</ext-link></p></caption><media mime-subtype="xlsx" mimetype="application" xlink:href="elife00569s001.xlsx"/></supplementary-material></p></caption><graphic xlink:href="elife00569f004"/></fig></p><p>Numerous genes predicted to have evolved in a common ancestor of <italic>B. schlosseri</italic> and vertebrates are essential to the immune system and hematopoiesis (<xref ref-type="fig" rid="fig4">Figure 4</xref>, <xref ref-type="supplementary-material" rid="SD1-data">Figure 4—source data 1B</xref>, <xref ref-type="supplementary-material" rid="SD1-data">Figure 4—source data 1C</xref>). Six genes unique to <italic>B. schlosseri</italic> and vertebrates (<italic>ZBTB1</italic>, <italic>MEFV</italic>, <italic>DSG3</italic>, <italic>NQO1</italic>, <italic>NQO2</italic> and <italic>BHLHE40</italic>) are associated with increased leukocyte and hematopoietic cell numbers (<xref ref-type="supplementary-material" rid="SD1-data">Figure 4—source data 1C</xref>; <xref ref-type="bibr" rid="bib12">Chen et al., 2009</xref>). In our analysis, these genes are absent in cephalochordates and solitary urochordates, which all lack a defined vascular system (<xref ref-type="bibr" rid="bib50">Moller and Philpott, 2005</xref>; <xref ref-type="bibr" rid="bib46">Lemaire, 2011</xref>). In contrast, the heart in each individual zooid in a <italic>B. schlosseri</italic> colony beats synchronously with the hearts of other zooids in the colony, driving a bidirectional blood flow throughout an interconnected vasculature (<xref ref-type="other" rid="video1">Video 1</xref>). Moreover, this blood system carries at least ten morphologically different cell types (<xref ref-type="bibr" rid="bib69">Schlumpberger et al., 1984</xref>; <xref ref-type="bibr" rid="bib4">Ballarin et al., 2008</xref>). Because of the anatomy of <italic>B. schlosseri</italic>, coupled with its hematopoietic-related gene repertoire, we hypothesize that colonial ascidians may have retained and elaborated many components of the ancestral hematopoietic program, much of which has been lost in extant solitary urochordates and cephalochordates.<media content-type="glencoe play-in-place height-250 width-310" id="video1" mime-subtype="wmv" mimetype="video" xlink:href="elife00569v001.wmv"><object-id pub-id-type="doi">10.7554/eLife.00569.019</object-id><label>Video 1.</label><caption><title><italic>B. schlosseri</italic> blood circulation.</title><p>(<bold>A)</bold> Time-lapse acquisition of blood flow in the blood vessels (bv) and ampullae of a chimeric <italic>B. schlosseri</italic> colony, generated from a fusion between a mother and its offspring (fused). (<bold>B</bold>) Ampullae contract, buds develop, and a colony gets ready to replace the old generation. (<bold>C</bold>) Old generation zooids are getting resorbed (res. z) and replaced by the new generation (buds). (<bold>D</bold>) A heart beating and pumping blood in the primary bud of a different colony. (<bold>E</bold>) Blood flow through a common blood vessel between two allogeneic/compatible colonies, creating a natural chimera.</p><p><bold>DOI:</bold> <ext-link ext-link-type="doi" xlink:href="10.7554/eLife.00569.019">http://dx.doi.org/10.7554/eLife.00569.019</ext-link></p></caption></media></p></sec><sec id="s2-4"><title>Evolution of hematopoiesis</title><p>We next attempted to identify potential precursors of human hematopoietic populations in <italic>B. schlosseri</italic> and 17 other diverse species, including fungal, plant, and mammalian species. We analyzed gene expression microarray data from 26 different human blood cell populations, and additional non-blood human tissue samples. We identified a set of twenty signature genes that were highly expressed in each of the 26 hematopoietic populations (<xref ref-type="bibr" rid="bib6">Benita et al., 2010</xref>; <xref ref-type="bibr" rid="bib71">Seita et al., 2012</xref>; ‘Materials and methods’ under ‘Evolution analysis’). For each blood-related gene set, we identified homologous gene sequences in <italic>B. schlosseri</italic> and 17 other species (<xref ref-type="fig" rid="fig5">Figure 5</xref>, <xref ref-type="supplementary-material" rid="SD4-data">Supplementary file 3</xref>). Among <italic>B. schlosseri</italic> homologs, we found high enrichment for gene sets predominantly expressed in human hematopoietic stem cells (HSCs; i.e., 14 of 20 cord blood HSC genes), myeloid populations (i.e., 14 of 20 early erythroid CD71+ genes), and early but not mature lymphoid populations. Consistent with previous studies (<xref ref-type="bibr" rid="bib5">Bartl et al., 1994</xref>; <xref ref-type="bibr" rid="bib40">Laird et al., 2000</xref>; <xref ref-type="bibr" rid="bib21">Dishaw and Litman, 2009</xref>; <xref ref-type="bibr" rid="bib30">Guo et al., 2009</xref>; <xref ref-type="bibr" rid="bib25">Flajnik and Kasahara, 2010</xref>; <xref ref-type="bibr" rid="bib3">Bajoghli et al., 2011</xref>; <xref ref-type="bibr" rid="bib31">Hirano et al., 2011</xref>) this analysis indicates that the evolution of adaptive immunity progressed rapidly beginning with jawless vertebrates, with much of the genetic repertoire in place by the emergence of jawed vertebrates (<xref ref-type="fig" rid="fig5">Figure 5</xref>). However, homologs of human genes with specific expression in HSC and blood progenitor populations, including T and B progenitor cells, appear early in metazoan evolution (<xref ref-type="fig" rid="fig5">Figure 5</xref>; <xref ref-type="supplementary-material" rid="SD4-data">Supplementary file 3</xref>).<fig id="fig5" position="float"><object-id pub-id-type="doi">10.7554/eLife.00569.020</object-id><label>Figure 5.</label><caption><title>Analysis of blood and immune cell type-specific genes across evolution reveals evidence for hematopoietic precursors in <italic>B. schlosseri</italic>.</title><p>We analyzed gene expression microarray data from 26 different human blood cell populations, organized into four cell lineages (HSC; Lymphoid Progenitors; Myeloid and Lymphoid Lineage), and identified a set of twenty signature genes with highly enriched expression profiles for each population (<xref ref-type="supplementary-material" rid="SD4-data">Supplementary file 3</xref>). For each blood-related gene set, we identified homologous gene sequences in <italic>B. schlosseri</italic> and 17 other species; the fraction of genes (out of 20) found for each species is displayed as a heat map. Within each major lineage, cell populations are sorted in decreasing order by a conservation index, calculated as the average number of genes found across the 18 species (indicated by a blue bar graph).</p><p><bold>DOI:</bold> <ext-link ext-link-type="doi" xlink:href="10.7554/eLife.00569.020">http://dx.doi.org/10.7554/eLife.00569.020</ext-link></p></caption><graphic xlink:href="elife00569f005"/></fig></p><p>Unlike solitary tunicates (e.g., <italic>Ciona</italic>), <italic>B. schlosseri</italic> has a defined vasculature with circulating blood cells (including cells with lymphocyte-like and macrophage-like morphology; <xref ref-type="bibr" rid="bib69">Schlumpberger et al., 1984</xref>; <xref ref-type="bibr" rid="bib4">Ballarin et al., 2008</xref>; <xref ref-type="other" rid="video1">Video 1</xref>). As such, we further investigated by PCR and re-sequencing the expression of all 28 <italic>B. schlosseri</italic> genes with homology to human HSCs (n = 14) and early erythroid CD71+ blood cell (n = 14) gene sets. Strikingly, we found evidence for expression of 13 HSC homologs in the <italic>B. schlosseri</italic> endostyle stem cell niche (<xref ref-type="bibr" rid="bib88">Voskoboynik et al., 2008</xref>), and 7 in the vasculature. We also confirmed expression of all 14 early erythroid CD71+ genes in the vasculature and endostyle (<xref ref-type="supplementary-material" rid="SD4-data">Supplementary file 3</xref>). Thus, our analysis not only identified <italic>B. schlosseri</italic> genes that may define evolutionary precursor cells of human hematopoietic lineages, but also indicates that the evolution of hematopoiesis proceeded from stem cells to myeloid populations to lymphoid populations, leading to the eventual emergence, absent in <italic>B. schlosseri</italic>, of T/B-cell based adaptive immunity in vertebrates (<xref ref-type="fig" rid="fig5">Figure 5</xref>; <xref ref-type="supplementary-material" rid="SD4-data">Supplementary file 3</xref>).</p><p>Not surprisingly, the <italic>B. schlosseri</italic> genome lacks significant homology to most genes known to play an important role in the vertebrate adaptive immune system. For instance, no evidence for the following immune-related genes could be found: (i) assembled major histocompatibility genes, (ii) genes with homology to <italic>RAG1</italic>/<italic>RAG2</italic>, which are involved in immunoglobulin and T-cell receptor rearrangements, (iii) terminal deoxynucleotidyl transferase, which adds nucleotides to the rearranging VDJ elements to create receptor diversity, (iv) V region subgenic elements encoding T cell and immunoglobulin antigen receptor domains, or (v) VLR like immune receptor elements found in lampreys (<xref ref-type="bibr" rid="bib90">Weigert et al., 1970</xref>; <xref ref-type="bibr" rid="bib16">Davis et al., 1984</xref>; <xref ref-type="bibr" rid="bib55">Oettinger et al., 1990</xref>; <xref ref-type="bibr" rid="bib23">Fagan and Weissman, 1998</xref>; <xref ref-type="bibr" rid="bib40">Laird et al., 2000</xref>; <xref ref-type="bibr" rid="bib51">Muramatsu et al., 2000</xref>; <xref ref-type="bibr" rid="bib56">Pancer et al., 2004</xref>; <xref ref-type="bibr" rid="bib65">Rogozin et al., 2007</xref>; <xref ref-type="bibr" rid="bib21">Dishaw and Litman, 2009</xref>; <xref ref-type="bibr" rid="bib25">Flajnik and Kasahara, 2010</xref>; <xref ref-type="bibr" rid="bib31">Hirano et al., 2011</xref>). We identified a large fraction (∼45%; <xref ref-type="supplementary-material" rid="SD3-data">Supplementary file 2H</xref>; <xref ref-type="fig" rid="fig3s4">Figure 3—figure supplement 4</xref>) of intron-less genes in the <italic>B. schlosseri</italic> draft genome, including retroviral genes such as <italic>Gag</italic>, <italic>Poli</italic>, <italic>Env</italic> and LTRs, which are used by viruses to insert their genetic sequences into the host genomes. As adaptive immunity genes like <italic>RAG1</italic>/<italic>RAG2</italic> are intron-less and first appear in jawed vertebrates, it has been suggested that they may have originated via horizontal infections of primitive retroviral like agents, and/or gene transfer (<xref ref-type="bibr" rid="bib5">Bartl et al., 1994</xref>). In addition, the <italic>B. schlosseri</italic> genome encodes homologues of <italic>Foxn1</italic>, the thymus epithelial gene mutated in the immunodeficient nude mouse (nu/nu), a marker of the thymopoietic microenvironment in vertebrates (<xref ref-type="bibr" rid="bib53">Nehls et al., 1996</xref>; <xref ref-type="bibr" rid="bib3">Bajoghli et al., 2011</xref>). These data indicate that at least some genetic circuitry relevant for vertebrate adaptive immunity was already in place in the common ancestor of the protochordate <italic>B. schlosseri</italic> and vertebrates. It leaves open the question of whether Ig or TCR genes, and the MHC proteins that capture and present intracellular peptides to T cells expressing these TCR proteins, existed in antecedents to <italic>B. schlosseri</italic> but were lost or somehow introduced after the line from colonial tunicates to the organisms that have an adaptive immune system. As <italic>omnis DNA e DNA</italic>, this question is perhaps the most puzzling of our findings.</p><p>In conclusion, using a novel method for deciphering eukaryotic genomes, we assembled and analyzed the <italic>B. schlosseri</italic> genome, the first colonial tunicate to be sequenced. One of the great challenges in evolutionary biology is to understand how differences in DNA sequences between species underlie distinct phenotypes. The <italic>B. schlosseri</italic> genome provides an important new resource for unraveling the genes and regulatory logic that led to the emergence of vertebrates and lymphoid-mediated immunity. Moreover, the many important features encoded by the <italic>B. schlosseri</italic> genome will facilitate new insights into complex vasculature, chimerism among kin, whole-body stem cell-mediated regeneration, and a colonial lifestyle.</p></sec></sec><sec id="s3" sec-type="materials|methods"><title>Materials and methods</title><sec id="s3-1"><title>Animals and genomic DNA sample collection</title><p>Mature reproductive colonies of <italic>Botryllus schlosseri</italic> (Pallas) were collected from Santa Cruz and Monterey marinas, California . Hatched larvae were settled raised, and crossed in our mariculture facility as described (<xref ref-type="bibr" rid="bib8">Boyd et al., 1986</xref>; <xref ref-type="bibr" rid="bib17">De Tomaso et al., 1998</xref>). Long lived, highly regenerative colonies Sc6a-b and 356a, were chosen to be sequenced. Sc6a-b subclones were starved for 48 hr prior to sampling (to minimize DNA contamination), and 400 individuals (zooids) were sampled for gDNA sequencing. Subclones of this colony are still alive and maintained in our mariculture facility (<xref ref-type="fig" rid="fig2s2">Figure 2—figure supplement 2A</xref>). 150 individuals from colony 356a were sampled and their gDNA was sequenced. To confirm that all zooids belonged to one genotype, a few zooids were taken from every sample set and screened for polymorphism via amplified fragment length polymorphism (AFLP) analysis as described in (<xref ref-type="bibr" rid="bib88">Voskoboynik et al., 2008</xref>) and microsatellite loci analysis as described in (<xref ref-type="bibr" rid="bib80">Stoner et al., 2002</xref>), confirming one genotype for Sc6a-b and 356a colonies (<xref ref-type="fig" rid="fig2s2">Figure 2—figure supplement 2B–F</xref>). Tissue samples were dissected and flash-frozen in liquid nitrogen. Genomic DNA samples were extracted using a modified version of the Hoss and Paabo protocol (<xref ref-type="bibr" rid="bib33">Hoss and Paabo, 1993</xref>) as described (<xref ref-type="bibr" rid="bib17">De Tomaso et al., 1998</xref>).</p></sec><sec id="s3-2"><title>Genome sequencing and assembly</title><p>The <italic>B. schlosseri</italic> genome sequence assembly was performed using two independent methods.</p><p><bold>Colony Sc6a-b</bold> genome sequence data was obtained using single read and paired-end protocols on the Roche (Roche, Branford, CT) 454 GS-FLX and Illumina Genome Analyzer II (GAII; Illumina, San Diego, CA) instruments (<xref ref-type="supplementary-material" rid="SD3-data">Supplementary file 2C</xref>). Sc6a-b gDNA was fragmented, libraries prepared, and sequencing conducted according to the manufacturer’s protocols. The 454 platform generated a total of 3086 Mb sequence data, the Illumina platform generated 3597 Mbp sequence data .The 6683 Mbp of sequence data obtained corresponds to ∼11-fold coverage of the <italic>B. schlosseri</italic> genome (estimated size of 600 Mbp, 454kmer estimation; <xref ref-type="supplementary-material" rid="SD3-data">Supplementary file 2C</xref>). The 454 shotgun and Illumina GAII paired-end reads were assembled de novo using Newbler v2.5 (Roche) with default settings, heterozygote mode. 380 Mbp comprised of 518,856 contigs were assembled with N50 of 1160 bp (Sc6a-b draft assembly; <xref ref-type="supplementary-material" rid="SD3-data">Supplementary file 2D</xref>).</p><p><bold>Colony 356a</bold> We developed a novel method to obtain a sequence in order to assemble larger contigs and reduce assembly complexity. Colony 356a gDNA was sheared using HydroShear (speed setting 16; 20 cycles) into random fragments of 6–10 kb. Sheared gDNA was run on a 0.8% agarose gel, the 6–8 kb band was cut and the DNA extracted using Qiagen gel purification kit. Fragmented DNA was repaired using NEB end repair module (E6050S) to produce blunt ends. Blunt end DNA was purified on a Qiagen column. After purification standard double stranded adapters from the Roche 454 kit were ligated with NEB Quick Ligase, following Roche 454 Titanium protocols. 454 adaptor mix 27,145, a mix of two sequences was used:</p><p>Primer A1: 5′-CCATCTCATCCCTGCGTGTCTCCGACTCAG-3′; 3′-TCTCCGACTCAG-5′</p><p>Primer B: 5″-/5BioTEG/CCTATCCCCTGTGTGCCTTGGCAGTCTCAG-3′; 3′-TGGCAGTCTCAG-5′</p><p>Amplification primer mix: Ti forward: 5′-CCATCTCATCCCTGCGTGTC-3′; Ti reverse: 5′-CCTATCCCCTGTGTGCCTTG-3′</p><p>These adapters serve as priming sites for the downstream amplification of the long fragment library. Following DNA purification (Agencourt AMPureXP bead purification) and fill-in reaction, second size selection was performed to remove adapter dimers and narrow down DNA size range (6–8 kb). Qiagen gel purification kit was used to purify DNA. PCR amplification for long range amplification was performed as follows: initial denaturation at 94°C for 30 s, followed by 23 cycles of (94°C for 15 s, 65°C for 7 min), followed by a final extension 65°C for 7 min. Concentration of amplifiable molecules carrying both amplification adapters was estimated by comparing <italic>B. schlosseri</italic> samples to a human standard sample prepared using an identical protocol. qPCR with nonspecific intercalating dye (EvaGreen, Biotinum) was used to calculate concentrations. Human standard was prepared following an identical protocol from genomic DNA derived from HapMap sample NA7019. The amount of amplifiable DNA was obtained by mapping short reads to a human genome reference 36 and measuring the fraction of the genome that was covered (<xref ref-type="fig" rid="fig2s1">Figure 2—figure supplement 1</xref>). Mapping was done using Novoalign with default settings, counting the amount of bases covered by regions of more than 1500 bp with at least 2x coverage of properly mapping paired end reads. We then aliquoted the resulting library of <italic>B. schlosseri</italic> gDNA with amplification adapters into wells of two 96-well plates such that, on average, each well contained a predefined amount of amplifiable molecules (estimated number of 200–2000 molecule per well; 1–6 Mb of total amplifiable sequence). Randomly sampled molecules in each well were amplified using NEB LongAmp master mix in the presence of 400 nM of primers: LA-V2-LEFT 5′-CCATCTCATCCCTGCGTGTCTCCG-3′; LA-V2-RIGHT 5′-CCTATCCCCTGTGTGCCTTGGCAGT-3′) complementary to previously ligated adapters following the two-step protocol. The resulting library of amplicons was purified using Zymo ZR-96 DNA Clean & Concentrator-5 kit. Purified DNA was eluted into two 96-well plates according to the manufacturer’s protocol. DNA was fragmented and tagged using Nextera DNA sample prep kit. Following the standard protocol, samples were incubated for 5 min at 55°C in the provided high molecular weight buffer (Nextera DNA sample prep kit, Epicentre). Fragmented DNA was purified using Zymo ZR-96 DNA Clean & Concentrator-5 kit and was converted into Illumina compatible sequencing library using a custom protocol. Four oligos described in the Nextera DNA sample prep kit (Epicentre and Illumina) were added to the every well containing purified fragmented DNA in concentrations recommended by Epicentre.</p><p>Adaptor 1*: 5′AATGATACGGCGACCACCGAGATCTACACGCCTCCCTCGCGCCATCAG-3′; Primer 1*: 5′-AATGATACGGCGACCACCGA-3′; Primer 2*: 5′-CAAGCAGAAGACGGCATACGA-3′; Adaptor 2: 5′-CAAGCAGAAGACGGCATACGAGAT-[BAR CODE]*-CGGTCTGCCTTGCCAGCCCGCTCAG-3′</p><p>Adapter 2 carried a 7 bp barcode sequence unique for each well of two 96-well plates (<xref ref-type="supplementary-material" rid="SD3-data">Supplementary file 2I</xref>). Amplification was done using NEB Phusion GC master mix (2x) following the recommended Nextera limited cycle PCR protocol designed to incorporate barcoded adapters: 72°C for 3 min, 95°C for 40 s, followed by nine cycles of 62°C for 30 s, 72°C for 3 min. The resulting 192 Illumina libraries were pooled together and purified using Qiagen Quiavac96 DNA purification kit. Size selection was performed by running a 2% agarose gel and excising the 400–900 bp band. This gel band was purified (Qiagen), quantitated using Agilent Bioanalyzer 2100 High-Sensitivity chip and sequenced on Illumina HiSeq 2000 sequencer following manufacturer recommended protocols. After sequencing, multiplexed libraries reads were de-multiplexed and separated into independent files (according to barcodes). Reads were then screened to remove reads with low overall quality and reads containing Nextera adapters (5′-AGATGTGTATAAGAGACAG-3′) resulting from imperfect size selection. We have sequenced a total of eight libraries (<xref ref-type="supplementary-material" rid="SD3-data">Supplementary files 2A,B</xref>). The resulting pool of reads was assembled using Velvet (<xref ref-type="bibr" rid="bib96">Zerbino, 2010</xref>) to reconstruct 6–8 kb original fragments using Velvet optimizer mode (<xref ref-type="fig" rid="fig2">Figure 2</xref>, <xref ref-type="supplementary-material" rid="SD3-data">Supplementary file 2A,B</xref>). Resulting contigs from Velvet were treated as input reads for downstream assembly with Celera Assembler (<xref ref-type="bibr" rid="bib52">Myers et al., 2000</xref>) version 6.1, to produce 356a draft assembly (<xref ref-type="fig" rid="fig2s3">Figure 2—figure supplement 3</xref>, <xref ref-type="supplementary-material" rid="SD3-data">Supplementary file 2D</xref>).</p></sec><sec id="s3-3"><title>Chromosome sequencing, assignment and assembly</title><p>Embryos were isolated from a wild <italic>B. schlosseri</italic> colony from Monterey Bay. Metaphase chromosomes were isolated as previously described (<xref ref-type="bibr" rid="bib73">Shoguchi et al., 2004</xref>). <italic>B. schlosseri</italic> metaphase chromosome suspension was partitioned into wells in the microfluidic device as previously described (<xref ref-type="bibr" rid="bib24">Fan et al., 2011</xref>; <xref ref-type="bibr" rid="bib92">Xu et al., 2011</xref>). The contents of each microfluidic well were amplified individually and prepared for sequencing. Each well contained between 1–4 metaphase chromosomes (<xref ref-type="fig" rid="fig3">Figure 3</xref>, <xref ref-type="fig" rid="fig3s1">Figure 3—figure supplement 1</xref>, <xref ref-type="fig" rid="fig3s2">Figure 3—figure Supplement 2</xref>). 21 wells were made into libraries and sequenced using Illumina Hiseq (2 x 100).</p><sec id="s3-3-1"><title>Chromosome assignment</title><p>Since a particular chromosome has an equal chance of occupying any of the 21 wells, we can denote the presence of a particular chromosome for example chromosome A across the 21 wells in the form of a vector (1,0,1,0,1,0,1,0,0,0,0,0,1,0,0,0,1,0,0,0,1) where 1 denotes presence in a well and 0 as absent. To deduce this configuration and perform the assignment of contigs, we aligned the reads from each well onto the contigs of the assembly. Contigs that share the same configuration across 21 wells can be considered to be from the same chromosome. To determine which contigs belong together and share the same configuration, we cluster the contigs using the Pearson correlation with each other using the vector across 21 wells. The number of clusters that result from k-means clustering using the Pearson correlation as the distance is then inferred to be the number of chromosomes. To determine this optimal number of clusters K for K-means clustering, we perform the clustering procedure iteratively for each K and record the within sum of squares error for each iteration as shown in <xref ref-type="fig" rid="fig3">Figure 3</xref>. Additionally, using the clustered data, we were able to deduce the configuration and deduce the number of chromosomes in each well.</p><p>Reads from each of the chromosome preparation were aligned to the 356a draft genome assembly using the BWA (<xref ref-type="bibr" rid="bib47">Li and Durbin, 2009</xref>) package. Subsequently, SAMtools (<xref ref-type="bibr" rid="bib48">Li et al., 2009</xref>) were used to filter for high quality mapping of reads with MAPQ score of greater than 30. The filtering was performing by using AWK to filter the fifth column of the SAM file for alignments >25. In addition to filter for a reasonable insert size, AWK is used to filter the corresponding columns in SAM files. Filtered SAM files were then parsed using BEDtools (<xref ref-type="bibr" rid="bib62">Quinlan and Hall, 2010</xref>) to obtain the number of reads that are associated with each of the scaffolds. Specifically, the coverageBED command is used to calculate the number of reads and coverage associated with each of the scaffolds in the assembled genome. Utilizing the number of reads associated with each scaffold from a particular chromosome preparation were arranged in the following data format:<table-wrap id="tbl1" position="anchor"><table frame="hsides" rules="groups"><thead><tr><th>Names of scaffold</th><th>Chromosome preparation 1</th><th>…</th><th>Chromosome preparation n</th></tr></thead><tbody><tr><td>scaffold 1</td><td>Number of reads associated with the scaffold and preparation</td><td>…</td><td>…</td></tr><tr><td>…</td><td>…</td><td>…</td><td>…</td></tr><tr><td>Scaffold n</td><td>…</td><td>…</td><td>…</td></tr></tbody></table></table-wrap></p><p>In each cell the number of reads associated with the scaffold and preparation was normalized by the total number of reads across each chromosome preparation. This is done by dividing the number of reads associated with the particular scaffold and preparation by dividing each entry by the total number of reads from a chromosome preparation. This value is then scaled by the fractional coverage of reads for a particular scaffold. These normalization steps ensure that a valid comparison can be made across each preparation. These normalized reads are then used to perform the K-means clustering. The optimal number of clusters is determined by iteratively performing the clustering process with each value of K. Within sum of square errors for each cluster is calculated and plotted in <xref ref-type="fig" rid="fig3">Figure 3A</xref>. A knee exists in the curve near K = 13, after which increasing the number of clusters only creates marginal improvement in the error (<xref ref-type="fig" rid="fig3">Figure 3A</xref>). To estimate the configuration after the clustering step, 17 out of the 21 wells were deduced to contain information that is used in the clustering process. The average number of normalized reads counts from each well that align to each scaffold in a cluster group is calculated and plotted in <xref ref-type="fig" rid="fig3">Figure 3B</xref>, <xref ref-type="fig" rid="fig3s1 fig3s2">Figure 3—figure supplements 1 and 2</xref>. Each peak represented can be inferred to denote the presence of a specific chromosome in the well. This approach yielded 13 well resolved chromosomes (<xref ref-type="fig" rid="fig3">Figure 3</xref>, <xref ref-type="fig" rid="fig3s1">Figure 3—figure supplement 1</xref>), close to the ∼16 chromosomes that were predicted by a previous study using metaphase spreads (<xref ref-type="bibr" rid="bib14">Colombera, 1963</xref>).</p></sec><sec id="s3-3-2"><title>356a-chromosomes hybrid assembly</title><p>Reads from each of the individual chromosome sample preparation were subsequently assembled using Velvet (<xref ref-type="bibr" rid="bib96">Zerbino, 2010</xref>; <xref ref-type="fig" rid="fig3s2">Figure 3—figure supplement 2</xref>). Velvet was compiled for our assembly to have a max hash length of 75. This is to allow for the use of larger hash length for the assembly of the reads from the individual well. Since the paired reads from each preparation is ∼86 after filtering for low quality bases, an optimal hash length is selected from the range of 51–75 to obtain the optimal assembly for each preparation. The assembled chromosome level contigs were then merged with 356a draft assembly using Minimus2 <ext-link ext-link-type="uri" xlink:href="http://sourceforge.net/apps/mediawiki/amos/index.php?title=Minimus2">http://sourceforge.net/apps/mediawiki/amos/index.php?title=Minimus2</ext-link> (<xref ref-type="fig" rid="fig3s3">Figure 3—figure supplement 3</xref>). During this stage, minimus2 used a nucmer based overlap detector to detect overlap between sequences and subsequently merging the two sequence sets to generate the final merge assembly of chromosome with the draft. An overall improvement in N50 was achieved, yielding a final 580 Mbp draft 356a-chromosomes hybrid assembly (<xref ref-type="supplementary-material" rid="SD3-data">Supplementary file 2D</xref>).</p></sec></sec><sec id="s3-4"><title>Evaluation of 356a-chromosomes hybrid assembly</title><p>All of the 66 <italic>B. schlosseri</italic> genes, 11 fosmid sequences and most of the 98,611 expressed sequence tags (ESTs) available from NCBI aligned with the <italic>B. schlosseri</italic> final draft assembly (<xref ref-type="supplementary-material" rid="SD3-data">Supplementary file 2F</xref>; <xref ref-type="fig" rid="fig2s5">Figure 2—figure supplement 5</xref>). Nearly all of the independently sequenced and assembled Roche 454 Sc6a-b contigs (93%) were successfully mapped to the final assembly (<xref ref-type="supplementary-material" rid="SD3-data">Supplementary file 2F</xref>). The Sanger sequenced NCBI genes and ESTs, and the 454 and Illumina GAII sequenced Sc6a-b genome (∼11x fold coverage, <xref ref-type="supplementary-material" rid="SD3-data">Supplementary file 2C</xref>), provide validation and an independent test to the quality and integrity of the final assembly.</p></sec><sec id="s3-5"><title>RNA sequencing</title><p>RNA was isolated from 19 different individuals (developmental stages A–D; different ages). To minimize DNA contamination, colonies were starved for 48 hr before sampling. Total RNA was extracted following the manufacturer’s instructions (Ambion; Purelink RNA mini kit) and purified using the Purelink DNase kit (Invitrogen). cDNA libraries for Illumina HiSeq and MiSeq were prepared (Ovation RNA-Seq v1 system, Nugen; NEBnext DNA Master Mix for Illumina (New England Biolabs) and standard Illumina adapters and primers from IDT. RNA-Seq (2x100 bp; Illumina HiSeq) was performed. Each genotype was sequenced separately. In total, ∼88 Gb of raw transcriptome sequence data were generated for the 19 colonies (<xref ref-type="supplementary-material" rid="SD3-data">Supplementary file 2C</xref>). To investigate expression of genes in particular tissues, we also generated tissue-specific RNA-Seq libraries using the Illumina GAII (single-end 36 bp reads) and Illumina MiSeq (100-bp paired-end). For Illumina GAII RNAseq total RNA was isolated following Invitrogen’s recommendations. PolyA+ mRNA were isolated using oligoT Dynal beads. Reverse transcription and library construction protocols were provided by Illumina. In total, ∼4 Gb of raw transcriptome sequence data were generated for the tissue specific (<xref ref-type="supplementary-material" rid="SD3-data">Supplementary file 2C</xref>).</p></sec><sec id="s3-6"><title>Gene prediction</title><p>Using Cufflinks (<xref ref-type="bibr" rid="bib84">Trapnell et al., 2010</xref>) with default parameters, <italic>B. schlosseri</italic> cDNA reads were aligned to the draft assembly and a reference-guided transcript assembly was produced. To predict genes, we used the program Augustus v2.5.5 (<xref ref-type="bibr" rid="bib77">Stanke et al., 2008</xref>). The reference-guided transcripts assembly was aligned to the draft genome assembly and a ‘Hints’ gff file was generated to guide gene prediction. Augustus was run (using human HMM and parameters), and from 121,094 contigs, a total of 38,730 genes with a minimum of 30% transcript support were predicted (<xref ref-type="supplementary-material" rid="SD3-data">Supplementary file 2H</xref>).</p></sec><sec id="s3-7"><title>Gene annotation</title><p>All <italic>B. schlosseri</italic> candidate protein-coding genes were compared to human and mouse proteomes (UniProtKB/Swiss-Prot; see Sequence data in ‘Materials and methods ’ under ‘Phylogenomic analyses’) using blastp and an e-value threshold of e<sup>−10</sup> (see Sequence Data, ‘Materials and methods’ under ‘Evolution analysis’). In addition, all <italic>B. schlosseri</italic> candidate protein-coding genes were compared to the NCBI non-redundant protein database (NR) using blastx and an e-value threshold of e<sup>−10</sup>. For every predicted gene 2 annotations were assigned (1). The best hit (smallest e-value) from NR and (2). if available, the best hit from the UniProt mouse/human blastp results.</p></sec><sec id="s3-8"><title>Evaluation of genes</title><p>RNA from <italic>B. schlosseri</italic> endostyles, vasculature (ampullae) and blood cells were isolated using an Ambion Purelink RNA minikit and cDNA prepared using Protoscript AMV LongAmp Taq RT-PCR kit (NEB). cDNA was amplified using GE Illustra Hot Start RTG beads and amplified using primers designed for the tested genes.</p><p>For the amplification and Sanger sequencing of the putative genes from specific blood groups, specific primers were used. Per every gene, expression was tested using cDNA prepared from endostyle, vasculature and blood. PCR was performed on the MJ Research PTC-200 thermal cycler as follows: Initial denaturation at 95°C for 4 min, followed by 34 cycles of 95°C for 1 min, 59ofor 1 min, 72°C for 1 min, followed by a final extension 72°C for 20 min. Amplified products were run on an E-Gel EX 1% agarose gel (Invitrogen) to validate size, then sent to MCLAB (384 Oyster Pt Rd. S. San Francisco, CA) for sequencing. We tested a set of 145 predicted genes by PCR and Sanger-sequencing, and were able to confirm 144 of them (99.3%), further validating the genome assembly (<xref ref-type="fig" rid="fig2s6">Figure 2—figure supplement 6</xref>).</p></sec><sec id="s3-9"><title>Mitochondrial phylogeny</title><sec id="s3-9-1"><title>Mitochondrial genome sequencing</title><p>Two mt-like scaffolds were initially identified in the whole-genome assembly of the <italic>B. schlosseri</italic> Sc6a-b specimen (Pacific Ocean, Santa Cruz harbor, California) assembled from Roche 454, Illumina GA II (<xref ref-type="supplementary-material" rid="SD3-data">Supplementary file 2D</xref>). Although these scaffolds covered the entire mitochondrial genome (mtDNA), their sequences were further validated by a conventional mtDNA sequencing strategy. Indeed, these mt scaffolds showed several ORF frameshifts and dozens of single-nucleotide deletions/insertions (indels) compared to the unpublished mtDNA of a <italic>B. schlosseri</italic> ‘Ve’ specimen coming from the Mediterranean Sea (Venice Lagoon, Italy). The identified frameshifts and indels were distributed almost uniformly along the mt genome sequence, and most of them fell inside or close to homopolymeric tracts longer than 7 bp, that is at the hot spots of Roche 454 sequencing errors. Thus, the complete mtDNA of the Sc6a-b specimen was amplified in two short (1.8–2.2 kb) and two long (5–7.4 kb) overlapping fragments (data available on request) using the high-fidelity Takara LA Taq enzyme (Takara) and according to the manufacturer’s instructions. Amplicons were directly sequenced using a primer walking strategy, or used as template for nested/semi-nested PCRs in order to obtain fragments easily cloneable. All mt amplicons containing several homopolymeric tracts at short distance were cloned and then sequenced, as the direct sequencing of amplicons containing homopolymer tracts always produced low-quality sequences. Cloning was carried out with the CloneJET PCR Cloning Kit (Fermentas) and sequences were obtained as the consensus of three different clones. Sanger sequencing was performed by the Eurofins MWG-Operon. The mtDNA of the <italic>B. schlosseri</italic> Sc6a-b specimen is 14,928 bp long and contains the typical complement of tunicate mt genes (24 tRNAs, 2 rRNAs and 13 proteins).</p></sec><sec id="s3-9-2"><title>Mitochondrial phylogenetic analyses</title><p>Phylogenetic reconstructions of tunicates and deuterostomes were performed on the amino acid sequences of the 13 mitochondrially-encoded proteins. Sequences were extracted from revised entries of complete mitochondrial genomes collected in the MitoZoa database (<xref ref-type="bibr" rid="bib22">D’Onorio de Meo et al., 2012</xref>) The analyzed taxon sample consists of 66 species, that is, all available species of Tunicata, Cephalochordata and Xenoturbellida; almost all available species of Hemichordata and Echinodermata; few representatives of Vertebrata; and two outgroup species (the arthropod <italic>Drosophila melanogaster</italic> and the mollusk <italic>Aplysia californica</italic>) (<xref ref-type="supplementary-material" rid="SD2-data">Supplementary file 1</xref>). Outgroups were selected among taxa closely related to deuterostomes, in order to ensure the analysis of the largest possible set of unambiguously aligned sites. Moreover, priority was given to outgroup species that underwent genome-sequencing projects. Among Tunicata, the larvacean <italic>Oikopleura dioica</italic> was not examined because of the partial status of the mtDNA and its very fast substitution rate (<xref ref-type="bibr" rid="bib20">Denoeud et al., 2010</xref>). Few echinoderms were also excluded from the analyses due to their close relationship to other examined species. The mtDNA of the hemichordate <italic>Rhabdopleura compacta</italic> was excluded because of its unusual amino acid composition, causing a very long branch in phylogenetic reconstructions (<xref ref-type="bibr" rid="bib58">Perseke et al., 2011</xref>).</p><p>The mitochondrially-encoded proteins were individually aligned with MATTF v.6 (<xref ref-type="bibr" rid="bib36">Katoh et al., 2005</xref>), and each alignment was manually optimized. Poorly aligned positions were identified and removed by Gblocks version 0.91b (<xref ref-type="bibr" rid="bib10">Castresana, 2000</xref>), applied with relaxed selection parameters. Individual protein alignments were then concatenated, resulting in a total alignment of 2489 amino acid sites.</p><p>Phylogenetic reconstructions were performed with Bayesian and Maximum Likelihood methods. Since the non-parametric CAT mixture model has been shown to be less prone to Long Branch Attraction (LBA) artifacts compared to other models (<xref ref-type="bibr" rid="bib43">Lartillot et al., 2007</xref>, <xref ref-type="bibr" rid="bib44">2009</xref>; <xref ref-type="bibr" rid="bib59">Philippe et al., 2009</xref>), Bayesian inferences were carried out using PhyloBayes version 3.3 (<xref ref-type="bibr" rid="bib44">Lartillot et al., 2009</xref>) under the CAT model. In particular we applied the GTR+G+CAT model: the General Time Reversible (GTR) was used as a substitution rate matrix; the rate heterogeneity across sites was modeled according to a gamma (G) distribution with four discrete categories; and the equilibrium frequency profile was modeled with a Dirichlet Process (DP). Two independent Monte Carlo Markov chains were run for each dataset, and chain convergence was estimated checking the values of maximum discrepancy across bipartitions (<0.1) and minimum effective size of the summary variables listed in the ‘trace’ output (>100). The same tree topologies and similar posterior probabilities were obtained modeling the rate of heterogeneity with a Dirichlet process instead of a gamma distribution (GTR+DP+CAT model instead of GTR+G+CAT). The final 50% majority rule consensus tree was computed using the converged chains, discarding the initial 10% points (burn-in) and saving one point every ten cycles. The two independent chains were run for a total of 10,000 cycles, with a burn-in of 1000 cycles.</p><p>Phylogenetic trees were also inferred with PhyML 3.0 (<xref ref-type="bibr" rid="bib29">Guindon and Gascuel, 2003</xref>), with bootstrap values based on 100 replicates. The substitution model was set to MtArt+G+F (with F = observed amino acid frequencies), that is, the model best fitting to the alignment data, as estimated by ProtTest 3 among 80 candidate models according to both the AIC and BIC selection criteria (<xref ref-type="bibr" rid="bib1">Abascal et al., 2005</xref>).</p></sec><sec id="s3-9-3"><title><italic>B. schlosseri</italic> phylogenetic position</title><p>The mitochondrial phylogeny of <xref ref-type="fig" rid="fig1s1">Figure 1—figure supplement 1</xref> shows the position of <italic>B. schlosseri</italic> within tunicates and deuterostomes, as reconstructed by the CAT model. This phylogeny is in perfect agreement with recent phylogenomic reconstructions based on hundreds of nuclear-encoded proteins (<xref ref-type="bibr" rid="bib7">Bourlat et al., 2006</xref>; <xref ref-type="bibr" rid="bib19">Delsuc et al., 2006</xref>). Indeed, the tree identifies Tunicata as a sister group of Vertebrata (thus forming the clade Olfactores) and Cephalochordata as basal to all other chordates. Moreover, it recovers with high statistical support the monophyly of Chordata and all other deuterostome phyla/subphyla (Echinodermata, Hemichordata, Cephalochordata, Vertebrata and Tunicata), as well as the clustering of Echinodermata and Hemichordata in the Ambulacraria clade.</p><p>The reconstructed phylogeny highlights extremely long branches for all tunicate species, including <italic>B. schlosseri</italic>, confirming that the mt evolution is characterized by a high substitution rate in all currently available tunicate sequences (see also <xref ref-type="bibr" rid="bib75">Singh et al., 2009</xref>). This fast evolution causes a clear LBA phenomenon in the PhyML reconstruction, with the artifactual positioning of tunicates basal to all other deuterostomes (data not shown).</p><p>As for relationships within tunicates, Stolidobranchia form a monophyletic clade: <italic>B. schlosseri</italic> clusters with all other available Styelidae species, while the three Pyuridae species make a paraphyletic group. The paraphyly of Pyuridae (or even Styelidae) has been already observed in large molecular phylogenetic trees of Stolidobranchia based on single mitochondrial or nuclear genes, although with contrasting supports depending on the method and the selected outgroup (<xref ref-type="bibr" rid="bib95">Zeng et al., 2006</xref>; <xref ref-type="bibr" rid="bib57">Perez-Portela et al., 2009</xref>; <xref ref-type="bibr" rid="bib85">Tsagkogeorga et al., 2009</xref>). Our phylogeny, based on all 13 mitochondrially-encoded proteins, strongly supports the paraphyly of Pyuridae, ad waits for additional Stolidobranchia species/families to define the monophyletic/paraphyletic status of Styelidae.</p><p>The two orders of Aplousobranchia and Phlebobranchia cluster together, supporting the morphological subdivision of ascidians into Enterogona (i.e., Phlebobranchia + Aplousobranchia) and Pleurogona based on gonad position (<xref ref-type="bibr" rid="bib27">Garstang, 1928</xref>). Phlebobranchia also appear as a paraphyletic group since the family Cionidae clusters to Aplousobranchia, while the family Ascidiidae forms the basal branch inside the Aplousobranchia + Phlebobranchia group. Finally, the only available thaliacean species, <italic>Doliolum nationalis</italic>, is located basal to all Enterogona, supporting the paraphyletic nature of the class Ascidiacea. It should be noted that most published molecular phylogenies of tunicates identify a stable clade including Aplousobranchia, Phlebobranchia and Thaliacea but fail to unambiguously resolve the relationships inside this clade (see <xref ref-type="bibr" rid="bib85">Tsagkogeorga et al., 2009</xref> and references therein). For example, Thaliacea are alternately recovered as sister group of all Enterogona (<xref ref-type="bibr" rid="bib94">Yokobori et al., 2006</xref>; <xref ref-type="bibr" rid="bib85">Tsagkogeorga et al., 2009</xref>) or of the only Phlebobranchia (<xref ref-type="bibr" rid="bib82">Swalla et al., 2000</xref>; <xref ref-type="bibr" rid="bib93">Yokobori et al., 2005</xref>; <xref ref-type="bibr" rid="bib95">Zeng et al., 2006</xref>). Furthermore, the sister relationship between Cionidae and Aplousobranchia has been already supported by the analysis of the single mt <italic>cox1</italic> gene in a large ascidian sample (<xref ref-type="bibr" rid="bib86">Turon and Lopez-Legentil, 2004</xref>), hence confirming the inclusion of Cionidae within Aplousobranchia proposed by Kott (<xref ref-type="bibr" rid="bib38">Kott, 1990</xref>) on the basis of morphological characters. Noteworthy, in our phylogenetic reconstruction the Aplousobranchia + Phlebobranchia + Thaliacea clade is highly supported, but the PP values of the internal nodes (i.e., the nodes suggesting the Phlebobranchia paraphyly and the basal position of <italic>Doliolum</italic>) are not the maximum ones (0.82 and 0.88 in <xref ref-type="fig" rid="fig1s1">Figure 1—figure supplement 1</xref>). Moreover, this portion of the tree has a different topology in the PhyML and PhyloBayes trees reconstructed using more appropriate outgroup species (i.e., only Vertebrata, Agnatha, Cephalochordata, or Agnatha+Cephalochordata; Phylobayes according to GTR+G+CAT model with 10,000 cycles) (data not shown). In particular, in these trees, <italic>Doliolum</italic> groups to Ascidiidae, with Cionidae forming the basal group, while Aplousobranchia is a sister group of Thaliacea + Phlebobranchia (data not shown). These observations, together with the longest branches of Aplousobranchia and the availability of a single thaliacean sequence, suggest instability of this portion of the tree as a result of long branches and insufficient taxon sampling. Thus, the relationships between Aplousobranchia, Phlebobranchia and Thaliacea need to be further investigated through the analysis of additional species.</p></sec></sec><sec id="s3-10"><title>Phylogenomic analyses</title><sec id="s3-10-1"><title>Sequence data</title><p>The following well-annotated proteomes were downloaded from the UniProt Knowledgebase (UniProtKB; <ext-link ext-link-type="uri" xlink:href="http://www.uniprot.org">www.uniprot.org</ext-link>) on 06/29/2012, using the ‘complete proteome set’ filter: <italic>A. queenslandica</italic>, <italic>B. floridae</italic>, <italic>C. intestinalis</italic>, <italic>D. melanogaster</italic>, <italic>D. rerio</italic>, <italic>G. gallus</italic>, <italic>H. sapiens</italic>, <italic>M. musculus</italic>, <italic>N. vectensis</italic>, <italic>S. purpuratus</italic>, and <italic>X. tropicalus</italic>. All protein sequences associated with the <italic>M. brevicollis</italic> genome were downloaded from UnitProtKB on 07/07/2012. We also obtained proteomes from <italic>A. digitifera</italic> (v1.0.1; August 2011 update; <ext-link ext-link-type="uri" xlink:href="http://marinegenomics.oist.jp/genomes/download">http://marinegenomics.oist.jp/genomes/download</ext-link>) and <italic>P. marinus</italic> (assembly 7.0, release 67; known and novel gene predictions; <ext-link ext-link-type="uri" xlink:href="http://www.ensembl.org">www.ensembl.org</ext-link>). Finally, we included all 20,307 <italic>B. schlosseri</italic> predicted proteins with at least one intron and with RNA-Seq transcript support for at least 30% of the protein sequence.</p></sec><sec id="s3-10-2"><title>Orthologous gene identification and alignment</title><p>An all-against-all blastp comparison was performed on the 15 proteomes listed above, with an e-value threshold of 1e−10, and otherwise default search parameters. To identify potentially orthologous genes, we analyzed the blastp output for bi-directional best hits (BBH; <xref ref-type="bibr" rid="bib39">Kristensen et al., 2011</xref>), defined as pairs of mutually best-matching protein sequences from different species. We reduced the impact of confounding paralogs by employing a simple filter, as described previously (<xref ref-type="bibr" rid="bib76">Srivastava et al., 2010</xref>). As a result, 521 protein networks (or clusters) were identified, each of which covers at least 12 of the 15 analyzed proteomes. To assemble a sequence matrix for phylogenetic inference, each protein cluster was aligned using ClustalW (<xref ref-type="bibr" rid="bib42">Larkin et al., 2007</xref>) (default parameters), trimmed for high-quality alignment blocks with GBlocks (<xref ref-type="bibr" rid="bib10">Castresana, 2000</xref>) (default settings), sorted by species name, and concatenated. Strings of ‘X’ characters were introduced into the alignment for species with missing proteins. The final alignment matrix consisted of 15 species by 40,798 amino acids (521 nuclear genes).</p></sec><sec id="s3-10-3"><title>Maximum likelihood and Bayesian analyses</title><p>The evolutionary position of <italic>B. schlosseri</italic> was compared among the 15 species in the alignment matrix (above) using the PhyML 3.0 software tool (<xref ref-type="bibr" rid="bib29">Guindon and Gascuel, 2003</xref>) (with default parameters), which implements a maximum likelihood approach for phylogenetic tree reconstruction. The resulting tree is illustrated in <xref ref-type="fig" rid="fig1">Figure 1E</xref>.</p><p>As an alternative approach, we employed PhyloBayes3.3c, a non-parametric method incorporating Bayesian statistics and Markov Chain Monte Carlo sampling (<xref ref-type="bibr" rid="bib44">Lartillot et al., 2009</xref>). Importantly, PhyloBayes accounts for site-specific evolutionary effects, and by using non-parametric methods, can learn the distribution of each site’s amino acid profile and evolutionary rate directly from the data. Using a general time reversible (GTR) process to model exchange rates, and otherwise default parameters (CAT model: Dirichlet process of equilibrium frequency profiles, in which all parameters are learned from the data; branch lengths ∼ iid gamma), we ran two MCMC chains in parallel. After 1971 cycles, both chains were convergent. We subsequently generated majority-rule consensus trees for each chain by discarding the first 100 trees (burn-in), followed by sampling every other 10 trees. We required a posterior probability threshold of 0.95 for the final consensus tree, as only nodes achieving this threshold are considered well supported (<xref ref-type="bibr" rid="bib44">Lartillot et al., 2009</xref>). The final consensus tree was topologically consistent with the maximum likelihood tree (<xref ref-type="fig" rid="fig1">Figure 1E</xref>), supporting the inferred evolutionary position of <italic>B. schlosseri</italic> among the analyzed proteomes.</p></sec></sec><sec id="s3-11"><title>Evolution analysis</title><sec id="s3-11-1"><title>Identification of <italic>B. schlosseri</italic> genes potentially linked to the emergence of vertebrate phenotypes</title><p>To gain insights into individual genes underlying the emergence of vertebrates, we analyzed 19 proteomes for the presence or absence of genes displaying at least some homology to human/mouse proteomes. In addition to the 15 proteomes used for the phylogenomic analysis, we used the following well-annotated proteomes from UniProtKB (<italic>C. elegans</italic> and <italic>Oikopleura dioica</italic>, downloaded 06/29/2012; <italic>Arabidopsis thaliana</italic> and <italic>Neurospora crassa</italic>, downloaded 07/07/2012). Moreover, for completeness, we included all predicted <italic>B. schlosseri</italic> protein-encoding genes, including gene fragments. After running all-vs-all blastp, and applying an e-value cutoff of e<sup>−10</sup>, a binary matrix was assembled depicting the presence or absence of each gene as 1 or 0, respectively (<xref ref-type="supplementary-material" rid="SD1-data">Figure 4—source data 1A</xref>).</p></sec><sec id="s3-11-2"><title>Evolution of hematopoiesis and identification of candidate hematopoietic precursor genes in <italic>B. schlosseri</italic></title><p>To identify candidate evolutionary precursors of human blood cell populations in <italic>B. schlosseri</italic>, we examined the evolutionary progression of gene sets with expression patterns restricted to distinct immune cell populations. These gene sets were defined by re-analysis of data from a recent publication (<xref ref-type="bibr" rid="bib6">Benita et al., 2010</xref>), in which tissue/cell type-specific enrichment scores were derived for the expression of each gene in the human transcriptome, across 126 human tissues spanning 557 arrays profiled on the same microarray platform (Affymetrix U133A) (<ext-link ext-link-type="uri" xlink:href="http://xavierlab2.mgh.harvard.edu/EnrichmentProfiler/">http://xavierlab2.mgh.harvard.edu/EnrichmentProfiler/</ext-link>). We analyzed the top 20 most enriched genes for each of 26 representative immune cell populations (<xref ref-type="supplementary-material" rid="SD4-data">Supplementary file 3</xref>), and interrogated a broad taxonomic range of proteomes for the presence or absence of each gene (using the binary matrix in <xref ref-type="supplementary-material" rid="SD1-data">Figure 4—source data 1A</xref>). Importantly, we confirmed cell-type restricted expression patterns for representative gene sets using a database of highly purified mouse hematopoietic populations that we recently developed (<xref ref-type="bibr" rid="bib71">Seita et al., 2012</xref>). A blastp e-value threshold of e<sup>−10</sup> was used to establish minimal acceptable homology to human/mouse proteomes. Results are rendered as a heat map in <xref ref-type="fig" rid="fig5">Figure 5</xref>.</p></sec></sec><sec id="s3-12"><title>Data deposition</title><p>The sequence of the <italic>B. schlosseri</italic> mitochondrial genome has been submitted to the European Nucleotide Archive under accession number HF548551.</p><p>An integrated genome and transcriptome browser of <italic>B. schlosseri</italic> has been developed and is available at: <ext-link ext-link-type="uri" xlink:href="http://genepyramid.stanford.edu/botryllusgenome/">http://genepyramid.stanford.edu/botryllusgenome/</ext-link>.</p></sec></sec></body><back><ack id="ack"><title>Acknowledgements</title><p>The authors would like to thank Thomas Snyder, Ivan Dimov, Jun Seita, Chris Lowe, Kevin Uhlinger, Shukry Habib, Jennifer Okamoto, Lisa Me, Lisa Ooi, Antonia Dominguez, Kirill Zdornyy, Seth Karten, Chris Patton, Libuse Jerabek, and Terry Storm for invaluable technical advice and help.</p></ack><sec sec-type="additional-information"><title>Additional information</title><fn-group content-type="competing-interest"><title>Competing interests</title><fn fn-type="conflict" id="conf1"><p>Stanford has filed US and International patent application numbers 61/532,882 and 13/608,778 entitled “Methods for obtaining a sequence” with inventors AV, DP, and SRQ. DP and SRQ are co-founders of Moleculo Inc.</p></fn><fn fn-type="conflict" id="conf2"><p>The other authors declare that no competing interests exist.</p></fn></fn-group><fn-group content-type="author-contribution"><title>Author contributions</title><fn fn-type="con" id="con1"><p>AV, Conception and design of genome project, development of a novel genomic library construction method (long read sequencing- LRseq), genomic and RNA-seq library preparation, chromosome isolation and library preparation, genome assembly, genome assembly evaluation, gene annotation, comparative genomic analysis, writing of manuscript</p></fn><fn fn-type="con" id="con2"><p>NFN, Conception and design of genome project, development of a novel genomic library construction method (long read sequencing- LRseq), genomic and RNA-seq library design and preparation, high-throughput sequencing, writing of manuscript</p></fn><fn fn-type="con" id="con3"><p>DS, Conception and design of genome project, genome assembly, genome assembly evaluation, gene prediction and annotation, comparative genomic analysis, phylogenomic analysis, development of an integrated <italic>B. schlosseri</italic> genome and transcriptome database searching and genome browser website</p></fn><fn fn-type="con" id="con4"><p>AMN, Gene prediction and annotation, comparative genomic analysis, phylogenomic analysis, development of genome analytical tools, writing of manuscript</p></fn><fn fn-type="con" id="con5"><p>DP, Conception and design of genome project, development of a novel genomic library construction method, (long read sequencing- LRseq), genomic library preparation, genome assembly</p></fn><fn fn-type="con" id="con6"><p>WK, Genome assembly, chromosomes assembly and chromosome assignment</p></fn><fn fn-type="con" id="con7"><p>BP, Transcriptome assembly, gene prediction and annotation, high-throughput sequencing</p></fn><fn fn-type="con" id="con8"><p>CHF, Single chromosome isolation and single chromosome library preparation</p></fn><fn fn-type="con" id="con9"><p>GLM, Genomic and RNA-seq library preparation and high-throughput sequencing</p></fn><fn fn-type="con" id="con10"><p>KJP, Design and preparation of RNA-seq libraries, mariculture, systemic breeding, genotyping, Sanger validations, writing of manuscript</p></fn><fn fn-type="con" id="con11"><p>KJI, Mariculture, systemic breeding, genotyping, design of RNA-seq libraries, writing of manuscript</p></fn><fn fn-type="con" id="con12"><p>CG, Mitochondria DNA Sanger validation and mitogenomic phylogeny, writing of manuscript</p></fn><fn fn-type="con" id="con13"><p>FG, Mitochondria DNA Sanger validation and mitogenomic phylogeny</p></fn><fn fn-type="con" id="con14"><p>RB-S, Design and preparation of RNA-seq libraries, Sanger validations and evaluation of genes, writing of manuscript</p></fn><fn fn-type="con" id="con15"><p>DMC, Sanger validations and evaluation of genes</p></fn><fn fn-type="con" id="con16"><p>LP, Genomic library preparation and high-throughput sequencing</p></fn><fn fn-type="con" id="con17"><p>RAW, Genomic library preparation and high-throughput sequencing</p></fn><fn fn-type="con" id="con18"><p>ILW, Conception and design of genome project, writing of manuscript</p></fn><fn fn-type="con" id="con19"><p>SRQ, Conception and design of genome project, development of a novel genomic library construction method (long read sequencing- LRseq), writing of manuscript</p></fn></fn-group></sec><sec sec-type="supplementary-material"><title>Additional files</title><supplementary-material id="SD2-data"><object-id pub-id-type="doi">10.7554/eLife.00569.021</object-id><label>Supplementary file 1.</label><caption><title>Species classification and Accession Number (AC) of the complete mtDNA sequences used in the tunicate phylogenetic reconstructions.</title><p><bold>DOI:</bold> <ext-link ext-link-type="doi" xlink:href="10.7554/eLife.00569.021">http://dx.doi.org/10.7554/eLife.00569.021</ext-link></p></caption><media mime-subtype="xlsx" mimetype="application" xlink:href="elife00569s002.xlsx"/></supplementary-material><supplementary-material id="SD3-data"><object-id pub-id-type="doi">10.7554/eLife.00569.022</object-id><label>Supplementary file 2.</label><caption><title><italic>B. schlosseri</italic> genome statistics.</title><p>(<bold>A</bold>) Statistics of Velvet assembly of wells per every 356a genomic library preparation. (<bold>B</bold>) Detailed statistics of Velvet assembly of wells per every 356a genomic library preparation. Name: barcode number; #reads: number of filtered reads obtained, NumCtgs: number of assembled contigs, Min: minimum contig length obtained, Max: maximum contig length obtained, Middle: length of the middle contig; Sum: sum of assembled contigs (bp), N50: length of N50 (bp), NumAbove8k: number of assembled contigs above 8k, NumAbove20k: number of assembled contigs above 20k. Kmer: Kmer used by Velvet assembly, Ecov: estimated coverage, CovCutoff: minimum coverage used. (<bold>C</bold>) Total gDNA and RNA sequence data obtained. Genomic DNA was extracted from tissue from two long-lived colonies (356a and Sc6a-b) raised in our mariculture facility. Sequence reads from colony Sc6a-b were obtained using Roche 454 Titanium and Illumina GAIIx. Sequence reads from colony 356a and 21 individual chromosomes isolated from a wild colony were obtained by Illumina HiSeq 2000. RNA-seq reads from several tissues (endostyle, vasculature, gonads and digestive system) were obtained by Illumina GAIIx and Illumina MiSeq. RNA-seq reads from 19 different lab reared colonies were obtained by Illumina HiSeq 2000. (<bold>D</bold>) <italic>B. schlosseri</italic> genome assemblies and chromosome scaffolds statistics. (<bold>E</bold>) Interspersed repeats in <italic>B. schlosseri.</italic> Analysis of interspersed repeat content in <italic>B. schlosseri</italic>, compared to <italic>C. intestinalis</italic> (version ci2, downloaded from the UCSC genome browser). RepeatScout (version 1.0.5; <xref ref-type="bibr" rid="bib60">Price et al., 2005</xref>) was used to identify interspersed repeat elements de novo using a k-mer length of 14. All identified repeats were subsequently filtered for tandem repeat and low complexity content, using RepeatScout. Genome-wide interspersed repeats were catalogued using RepeatMasker (version open-4.0) (<xref ref-type="bibr" rid="bib74">Smit et al., 1996–2010</xref>). (<bold>F</bold>) Alignment statistic of all of the <italic>B. schlosseri</italic> non mitochondrial genes (66), expressed sequence tags (98,611 EST’s) and fosmids (11) available on NCBI and, Sc6a-b assembly (518,856 contigs) with the <italic>B. schlosseri</italic> 356a chromosome hybrid draft genome assembly. (<bold>G</bold>) Genome assemblies statistics of several wild type species. (<bold>H</bold>) <italic>B. schlosseri</italic> predicted gene structure statistics. (<bold>I</bold>) Barcoded adapters list for 192 wells.</p><p><bold>DOI:</bold> <ext-link ext-link-type="doi" xlink:href="10.7554/eLife.00569.022">http://dx.doi.org/10.7554/eLife.00569.022</ext-link></p></caption><media mime-subtype="xlsx" mimetype="application" xlink:href="elife00569s003.xlsx"/></supplementary-material><supplementary-material id="SD4-data"><object-id pub-id-type="doi">10.7554/eLife.00569.023</object-id><label>Supplementary file 3.</label><caption><title>Potential precursors of human hematopoietic populations in <italic>B. schlosseri</italic>.</title><p>We analyzed gene expression microarray data from 26 different human blood cell populations, along with a large diversity of non-blood human tissue samples, and identified a set of twenty signature genes with highly enriched expression profiles for each hematopoietic population. The 20 signature genes for each blood-related gene set, and the identified orthologous gene sequences in <italic>B. schlosseri</italic> are presented. Status = 1 predicted gene is present in <italic>B. schlosseri</italic> genome; Status = 0 predicted gene is absent from <italic>B. schlosseri</italic> genome.</p><p><bold>DOI:</bold> <ext-link ext-link-type="doi" xlink:href="10.7554/eLife.00569.023">http://dx.doi.org/10.7554/eLife.00569.023</ext-link></p></caption><media mime-subtype="xls" mimetype="application" xlink:href="elife00569s004.xls"/></supplementary-material></sec><sec sec-type="datasets"><title>Major datasets</title><p>The following datasets were generated:</p><p><related-object content-type="generated-dataset" document-id="Dataset ID and/or url" document-id-type="dataset" document-type="data" id="dataro1"><name><surname>Voskoboynik</surname><given-names>A</given-names></name>, <name><surname>Neff</surname><given-names>NF</given-names></name>, <name><surname>Sahoo</surname><given-names>D</given-names></name>, <name><surname>Newman</surname><given-names>AM</given-names></name>, <name><surname>Pushkarev</surname><given-names>D</given-names></name>, <name><surname>Koh</surname><given-names>W</given-names></name>, <name><surname>Passarelli</surname><given-names>B</given-names></name>, <name><surname>Fan</surname><given-names>CH</given-names></name>, <name><surname>Mantalas</surname><given-names>GL</given-names></name>, <name><surname>Palmeri</surname><given-names>KJ</given-names></name>, <name><surname>Ishizuka</surname><given-names>KJ</given-names></name>, <name><surname>Gissi</surname><given-names>C</given-names></name>, <name><surname>Griggio</surname><given-names>F</given-names></name>, <name><surname>Ben-Shlomo</surname><given-names>R</given-names></name>, <name><surname>Corey</surname><given-names>DM</given-names></name>, <name><surname>Penland</surname><given-names>L</given-names></name>, <name><surname>White</surname><given-names>RA</given-names><suffix>III</suffix></name>, <name><surname>Weissman</surname><given-names>IL</given-names></name>, <name><surname>Quake</surname><given-names>SR</given-names></name>, <year>2013</year><x>, </x><source>The genome sequence of the colonial chordate, Botryllus schlosseri</source><x>, </x><object-id pub-id-type="art-access-id">PRJNA205369</object-id><x>; </x><ext-link ext-link-type="uri" xlink:href="http://www.ncbi.nlm.nih.gov/bioproject/PRJNA205369">http://www.ncbi.nlm.nih.gov/bioproject/PRJNA205369</ext-link><x>, </x><comment>Publicly available at NCBI BioProject (<ext-link ext-link-type="uri" xlink:href="http://www.ncbi.nlm.nih.gov/bioproject">http://www.ncbi.nlm.nih.gov/bioproject</ext-link>).</comment></related-object></p><p><related-object content-type="generated-dataset" document-id="Dataset ID and/or url" document-id-type="dataset" document-type="data" id="dataro2"><name><surname>Voskoboynik</surname><given-names>A</given-names></name>, <name><surname>Neff</surname><given-names>NF</given-names></name>, <name><surname>Sahoo</surname><given-names>D</given-names></name>, <name><surname>Newman</surname><given-names>AM</given-names></name>, <name><surname>Pushkarev</surname><given-names>D</given-names></name>, <name><surname>Koh</surname><given-names>W</given-names></name>, <name><surname>Passarelli</surname><given-names>B</given-names></name>, <name><surname>Fan</surname><given-names>CH</given-names></name>, <name><surname>Mantalas</surname><given-names>GL</given-names></name>, <name><surname>Palmeri</surname><given-names>KJ</given-names></name>, <name><surname>Ishizuka</surname><given-names>KJ</given-names></name>, <name><surname>Gissi</surname><given-names>C</given-names></name>, <name><surname>Griggio</surname><given-names>F</given-names></name>, <name><surname>Ben-Shlomo</surname><given-names>R</given-names></name>, <name><surname>Corey</surname><given-names>DM</given-names></name>, <name><surname>Penland</surname><given-names>L</given-names></name>, <name><surname>White</surname><given-names>RA</given-names><suffix>III</suffix></name>, <name><surname>Weissman</surname><given-names>IL</given-names></name>, <name><surname>Quake</surname><given-names>SR</given-names></name>, <year>2013</year><x>, </x><source>Botryllus schlosseri complete mitochondrial genome, isolate sc6a-b</source><x>, </x><object-id pub-id-type="art-access-id">HF548551</object-id><x>; </x><ext-link ext-link-type="uri" xlink:href="http://www.ebi.ac.uk/cgi-bin/sva/sva.pl?search=Go&query=HF548551">http://www.ebi.ac.uk/cgi-bin/sva/sva.pl?search=Go&query=HF548551</ext-link><x>, </x><comment>Publicly available at the European Nucleotide Archive (<ext-link ext-link-type="uri" xlink:href="http://www.ebi.ac.uk/ena/">http://www.ebi.ac.uk/ena/</ext-link>).</comment></related-object></p><p><related-object content-type="generated-dataset" document-id="Dataset ID and/or url" document-id-type="dataset" document-type="data" id="dataro3"><name><surname>Voskoboynik</surname><given-names>A</given-names></name>, <name><surname>Neff</surname><given-names>NF</given-names></name>, <name><surname>Sahoo</surname><given-names>D</given-names></name>, <name><surname>Newman</surname><given-names>AM</given-names></name>, <name><surname>Pushkarev</surname><given-names>D</given-names></name>, <name><surname>Koh</surname><given-names>W</given-names></name>, <name><surname>Passarelli</surname><given-names>B</given-names></name>, <name><surname>Fan</surname><given-names>CH</given-names></name>, <name><surname>Mantalas</surname><given-names>GL</given-names></name>, <name><surname>Palmeri</surname><given-names>KJ</given-names></name>, <name><surname>Ishizuka</surname><given-names>KJ</given-names></name>, <name><surname>Gissi</surname><given-names>C</given-names></name>, <name><surname>Griggio</surname><given-names>F</given-names></name>, <name><surname>Ben-Shlomo</surname><given-names>R</given-names></name>, <name><surname>Corey</surname><given-names>DM</given-names></name>, <name><surname>Penland</surname><given-names>L</given-names></name>, <name><surname>White</surname><given-names>RA</given-names><suffix>III</suffix></name>, <name><surname>Weissman</surname><given-names>IL</given-names></name>, <name><surname>Quake</surname><given-names>SR</given-names></name>, <year>2013</year><x>, </x><source>Botryllus schlosseri Genome Project</source><x>, </x><ext-link ext-link-type="uri" xlink:href="http://genepyramid.stanford.edu/botryllusgenome/">http://genepyramid.stanford.edu/botryllusgenome/</ext-link><x>, </x><comment>Publicly available</comment></related-object></p><p>The following previously published datasets were used:</p><p><related-object content-type="generated-dataset" document-id="Dataset ID and/or url" document-id-type="dataset" document-type="data" id="dataro4"><name><surname>Bhatla</surname><given-names>M</given-names></name>, <year>2006</year><x>, </x><source>Molecular signatures orchestrating the fate of human hematopoietic stem cells originating from different stages of ontogeny</source><x>, </x><object-id pub-id-type="art-access-id">GSE3823</object-id><x>; </x><ext-link ext-link-type="uri" xlink:href="http://www.ncbi.nlm.nih.gov/geo/query/acc.cgi?acc=GSE3823">http://www.ncbi.nlm.nih.gov/geo/query/acc.cgi?acc=GSE3823</ext-link><x>, </x><comment>Publicly available at the Gene Expression Omnibus (<ext-link ext-link-type="uri" xlink:href="http://www.ncbi.nlm.nih.gov/geo/">http://www.ncbi.nlm.nih.gov/geo/</ext-link>).</comment></related-object></p><p><related-object content-type="generated-dataset" document-id="Dataset ID and/or url" document-id-type="dataset" document-type="data" id="dataro5"><name><surname>Eckfeldt</surname><given-names>CE</given-names></name>, <name><surname>Mendenhall</surname><given-names>EM</given-names></name>, <name><surname>Flynn</surname><given-names>CM</given-names></name>, <name><surname>Wang</surname><given-names>T</given-names></name>, <name><surname>Grindle</surname><given-names>SM</given-names></name>, <name><surname>Ekker</surname><given-names>SC</given-names></name>, <name><surname>Verfallie</surname><given-names>CM</given-names></name>, <name><surname>Pickart</surname><given-names>MA</given-names></name>, <year>2005</year><x>, </x><source>Human Hematopoietic Stem Cell (HSC) and Progenitor Cell (HPC) expression profilies</source><x>, </x><object-id pub-id-type="art-access-id">GSE2666</object-id><x>; </x><ext-link ext-link-type="uri" xlink:href="http://www.ncbi.nlm.nih.gov/geo/query/acc.cgi?acc=GSE2666">http://www.ncbi.nlm.nih.gov/geo/query/acc.cgi?acc=GSE2666</ext-link><x>, </x><comment>Publicly available at the Gene Expression Omnibus (<ext-link ext-link-type="uri" xlink:href="http://www.ncbi.nlm.nih.gov/geo/">http://www.ncbi.nlm.nih.gov/geo/</ext-link>).</comment></related-object></p><p><related-object content-type="generated-dataset" document-id="Dataset ID and/or url" document-id-type="dataset" document-type="data" id="dataro6"><name><surname>Gustafsson</surname><given-names>C</given-names></name>, <name><surname>Mjüsberg</surname><given-names>J</given-names></name>, <name><surname>Matussek</surname><given-names>A</given-names></name>, <name><surname>Geffers</surname><given-names>R</given-names></name>, <name><surname>Matthiesen</surname><given-names>L</given-names></name>, <name><surname>Berg</surname><given-names>G</given-names></name>, <name><surname>Sharma</surname><given-names>S</given-names></name>, <name><surname>Buer</surname><given-names>J</given-names></name>, <name><surname>Ernerudh</surname><given-names>J</given-names></name>, <year>2008</year><x>, </x><source>Gene expression profiling of human decidual macrophages: evidence for immunosuppressive phenotype</source><x>, </x><object-id pub-id-type="art-access-id">GSE10612</object-id><x>; </x><ext-link ext-link-type="uri" xlink:href="http://www.ncbi.nlm.nih.gov/geo/query/acc.cgi?acc=GSE10612">http://www.ncbi.nlm.nih.gov/geo/query/acc.cgi?acc=GSE10612</ext-link><x>, </x><comment>Publicly available at the Gene Expression Omnibus (<ext-link ext-link-type="uri" xlink:href="http://www.ncbi.nlm.nih.gov/geo/">http://www.ncbi.nlm.nih.gov/geo/</ext-link>).</comment></related-object></p><p><related-object content-type="generated-dataset" document-id="Dataset ID and/or url" document-id-type="dataset" document-type="data" id="dataro7"><name><surname>Hutcheson</surname><given-names>J</given-names></name>, <name><surname>Scatizzi</surname><given-names>JC</given-names></name>, <name><surname>Siddiqui</surname><given-names>AM</given-names></name>, <name><surname>Haines</surname><given-names>GK</given-names><suffix>3rd</suffix></name>, <name><surname>Wu</surname><given-names>T</given-names></name>, <name><surname>Li</surname><given-names>QZ</given-names></name>, <name><surname>Davis</surname><given-names>LS</given-names></name>, <name><surname>Mohan</surname><given-names>C</given-names></name>, <name><surname>Perlman</surname><given-names>H</given-names></name>, <year>2008</year><x>, </x><source>Combined deficiency of proapoptotic regulators Bim and Fas results in the early onset of systemic autoimmunity</source><x>, </x><object-id pub-id-type="art-access-id">GSE10325</object-id><x>; </x><ext-link ext-link-type="uri" xlink:href="http://www.ncbi.nlm.nih.gov/geo/query/acc.cgi?acc=GSE10325">http://www.ncbi.nlm.nih.gov/geo/query/acc.cgi?acc=GSE10325</ext-link><x>, </x><comment>Publicly available at the Gene Expression Omnibus (<ext-link ext-link-type="uri" xlink:href="http://www.ncbi.nlm.nih.gov/geo/">http://www.ncbi.nlm.nih.gov/geo/</ext-link>).</comment></related-object></p><p><related-object content-type="generated-dataset" document-id="Dataset ID and/or url" document-id-type="dataset" document-type="data" id="dataro8"><name><surname>Hyrcza</surname><given-names>MD</given-names></name>, <name><surname>Kovacs</surname><given-names>C</given-names></name>, <name><surname>Loutfy</surname><given-names>M</given-names></name>, <name><surname>Halpenny</surname><given-names>R</given-names></name>, <name><surname>Heisler</surname><given-names>L</given-names></name>, <name><surname>Yang</surname><given-names>S</given-names></name>, <name><surname>Wilkins</surname><given-names>O</given-names></name>, <name><surname>Ostrowski</surname><given-names>M</given-names></name>, <name><surname>Der</surname><given-names>SD</given-names></name>, <year>2007</year><x>, </x><source>Distinct transcriptional profiles in ex vivo CD4+ and CD8+ T cells are established early in human immunodeficiency virus type 1 infection and are characterized by a chronic interferon response as well as extensive transcriptional changes in CD8+ T cells</source><x>, </x><object-id pub-id-type="art-access-id">GSE6740</object-id><x>; </x><ext-link ext-link-type="uri" xlink:href="http://www.ncbi.nlm.nih.gov/geo/query/acc.cgi?acc=GSE6740">http://www.ncbi.nlm.nih.gov/geo/query/acc.cgi?acc=GSE6740</ext-link><x>, </x><comment>Publicly available at the Gene Expression Omnibus (<ext-link ext-link-type="uri" xlink:href="http://www.ncbi.nlm.nih.gov/geo/">http://www.ncbi.nlm.nih.gov/geo/</ext-link>).</comment></related-object></p><p><related-object content-type="generated-dataset" document-id="Dataset ID and/or url" document-id-type="dataset" document-type="data" id="dataro9"><name><surname>Jura</surname><given-names>J</given-names></name>, <name><surname>Wegrzyn</surname><given-names>P</given-names></name>, <name><surname>Korostyński</surname><given-names>M</given-names></name>, <name><surname>Guzik</surname><given-names>K</given-names></name>, <name><surname>Oczko-Wojciechowska</surname><given-names>M</given-names></name>, <name><surname>Jarzab</surname><given-names>M</given-names></name>, <name><surname>Kowalska</surname><given-names>M</given-names></name>, <name><surname>Piechota</surname><given-names>M</given-names></name>, <name><surname>Przewłocki</surname><given-names>R</given-names></name>, <name><surname>Koj</surname><given-names>A</given-names></name>, <year>2007</year><x>, </x><source>Identification of interleukin-1 and interleukin-6-responsive genes in human monocyte-derived macrophages using microarrays</source><x>, </x><object-id pub-id-type="art-access-id">GSE8515</object-id><x>; </x><ext-link ext-link-type="uri" xlink:href="http://www.ncbi.nlm.nih.gov/geo/query/acc.cgi?acc=GSE8515">http://www.ncbi.nlm.nih.gov/geo/query/acc.cgi?acc=GSE8515</ext-link><x>, </x><comment>Publicly available at the Gene Expression Omnibus (<ext-link ext-link-type="uri" xlink:href="http://www.ncbi.nlm.nih.gov/geo/">http://www.ncbi.nlm.nih.gov/geo/</ext-link>).</comment></related-object></p><p><related-object content-type="generated-dataset" document-id="Dataset ID and/or url" document-id-type="dataset" document-type="data" id="dataro10"><name><surname>Lee</surname><given-names>MS</given-names></name>, <name><surname>Hanspers</surname><given-names>K</given-names></name>, <name><surname>Barker</surname><given-names>CS</given-names></name>, <name><surname>Korn</surname><given-names>AP</given-names></name>, <name><surname>McCune</surname><given-names>JM</given-names></name>, <year>2004</year><x>, </x><source>Gene expression profiles during human CD4+ T cell differentiation</source><x>, </x><object-id pub-id-type="art-access-id">GSE1460</object-id><x>; </x><ext-link ext-link-type="uri" xlink:href="http://www.ncbi.nlm.nih.gov/geo/query/acc.cgi?acc=GSE1460">http://www.ncbi.nlm.nih.gov/geo/query/acc.cgi?acc=GSE1460</ext-link><x>, </x><comment>Publicly available at the Gene Expression Omnibus (<ext-link ext-link-type="uri" xlink:href="http://www.ncbi.nlm.nih.gov/geo/">http://www.ncbi.nlm.nih.gov/geo/</ext-link>).</comment></related-object></p><p><related-object content-type="generated-dataset" document-id="Dataset ID and/or url" document-id-type="dataset" document-type="data" id="dataro11"><name><surname>Liu</surname><given-names>H</given-names></name>, <name><surname>Shi</surname><given-names>B</given-names></name>, <name><surname>Huang</surname><given-names>CC</given-names></name>, <name><surname>Eksarko</surname><given-names>P</given-names></name>, <name><surname>Pope</surname><given-names>RM</given-names></name>, <year>2007</year><x>, </x><source>Transcriptional diversity during monocyte to macrophage differentiation</source><x>, </x><object-id pub-id-type="art-access-id">GSE8286</object-id><x>; </x><ext-link ext-link-type="uri" xlink:href="http://www.ncbi.nlm.nih.gov/geo/query/acc.cgi?acc=GSE8286">http://www.ncbi.nlm.nih.gov/geo/query/acc.cgi?acc=GSE8286</ext-link><x>, </x><comment>Publicly available at the Gene Expression Omnibus (<ext-link ext-link-type="uri" xlink:href="http://www.ncbi.nlm.nih.gov/geo/">http://www.ncbi.nlm.nih.gov/geo/</ext-link>).</comment></related-object></p><p><related-object content-type="generated-dataset" document-id="Dataset ID and/or url" document-id-type="dataset" document-type="data" id="dataro12"><name><surname>Lund</surname><given-names>RJ</given-names></name>, <name><surname>Aittokallio</surname><given-names>T</given-names></name>, <name><surname>Nevalainen</surname><given-names>O</given-names></name>, <name><surname>Lahesmaa</surname><given-names>R</given-names></name>, <name><surname>Kainonen</surname><given-names>E</given-names></name>, <name><surname>Lahesmaa</surname><given-names>A</given-names></name>, <name><surname>Dixon</surname><given-names>C</given-names></name>, <name><surname>Ahlfors</surname><given-names>H</given-names></name>, <name><surname>Melin</surname><given-names>O</given-names></name>, <name><surname>Miller</surname><given-names>M</given-names></name>, <year>2005</year><x>, </x><source>Identification of novel genes regulated by IL-12, IL-4, or TGF-beta during the early polarization of CD4+ lymphocytes</source><x>, </x><object-id pub-id-type="art-access-id">GSE2770</object-id><x>; </x><ext-link ext-link-type="uri" xlink:href="http://www.ncbi.nlm.nih.gov/geo/query/acc.cgi?acc=GSE2770">http://www.ncbi.nlm.nih.gov/geo/query/acc.cgi?acc=GSE2770</ext-link><x>, </x><comment>Publicly available at the Gene Expression Omnibus (<ext-link ext-link-type="uri" xlink:href="http://www.ncbi.nlm.nih.gov/geo/">http://www.ncbi.nlm.nih.gov/geo/</ext-link>).</comment></related-object></p><p><related-object content-type="generated-dataset" document-id="Dataset ID and/or url" document-id-type="dataset" document-type="data" id="dataro13"><name><surname>Martens</surname><given-names>JH</given-names></name>, <name><surname>Kzhyshkowska</surname><given-names>J</given-names></name>, <name><surname>Falkowski-Hansen</surname><given-names>M</given-names></name>, <name><surname>Schledzewski</surname><given-names>K</given-names></name>, <name><surname>Gratchev</surname><given-names>A</given-names></name>, <name><surname>Mansmann</surname><given-names>U</given-names></name>, <name><surname>Schmuttermaier</surname><given-names>C</given-names></name>, <name><surname>Dippel</surname><given-names>E</given-names></name>, <name><surname>Koenen</surname><given-names>W</given-names></name>, <name><surname>Riedel</surname><given-names>F</given-names></name>, <name><surname>Goerdt</surname><given-names>S</given-names></name>, <year>2006</year><x>, </x><source>Differential expression of a gene signature for scavenger/lectin receptors by endothelial cells and macrophages in human lymph node sinuses, the primary sites of regional metastasis</source><x>, </x><object-id pub-id-type="art-access-id">GSE2665</object-id><x>; </x><ext-link ext-link-type="uri" xlink:href="http://www.ncbi.nlm.nih.gov/geo/query/acc.cgi?acc=GSE2665">http://www.ncbi.nlm.nih.gov/geo/query/acc.cgi?acc=GSE2665</ext-link><x>, </x><comment>Publicly available at the Gene Expression Omnibus (<ext-link ext-link-type="uri" xlink:href="http://www.ncbi.nlm.nih.gov/geo/">http://www.ncbi.nlm.nih.gov/geo/</ext-link>).</comment></related-object></p><p><related-object content-type="generated-dataset" document-id="Dataset ID and/or url" document-id-type="dataset" document-type="data" id="dataro14"><name><surname>Ocklenburg</surname><given-names>F</given-names></name>, <name><surname>Moharregh-Khiabani</surname><given-names>D</given-names></name>, <name><surname>Geffers</surname><given-names>R</given-names></name>, <name><surname>Janke</surname><given-names>V</given-names></name>, <name><surname>Pfoertner</surname><given-names>S</given-names></name>, <name><surname>Garritsen</surname><given-names>H</given-names></name>, <name><surname>Groebe</surname><given-names>L</given-names></name>, <name><surname>Klempnauer</surname><given-names>J</given-names></name>, <name><surname>Dittmar</surname><given-names>KE</given-names></name>, <name><surname>Weiss</surname><given-names>S</given-names></name>, <name><surname>Buer</surname><given-names>J</given-names></name>, <name><surname>Probst-Kepper</surname><given-names>M</given-names></name>, <year>2006</year><x>, </x><source>UBD, a downstream element of FOXP3, allows the identification of LGALS3, a new marker of human regulatory T cells</source><x>, </x><object-id pub-id-type="art-access-id">GSE4527</object-id><x>; </x><ext-link ext-link-type="uri" xlink:href="http://www.ncbi.nlm.nih.gov/geo/query/acc.cgi?acc=GSE4527">http://www.ncbi.nlm.nih.gov/geo/query/acc.cgi?acc=GSE4527</ext-link><x>, </x><comment>Publicly available at the Gene Expression Omnibus (<ext-link ext-link-type="uri" xlink:href="http://www.ncbi.nlm.nih.gov/geo/">http://www.ncbi.nlm.nih.gov/geo/</ext-link>).</comment></related-object></p><p><related-object content-type="generated-dataset" document-id="Dataset ID and/or url" document-id-type="dataset" document-type="data" id="dataro15"><name><surname>Popov</surname><given-names>A</given-names></name>, <name><surname>Driesen</surname><given-names>J</given-names></name>, <name><surname>Abdullah</surname><given-names>Z</given-names></name>, <name><surname>Wickenhauser</surname><given-names>C</given-names></name>, <name><surname>Beyer</surname><given-names>M</given-names></name>, <name><surname>Debey-Pascher</surname><given-names>S</given-names></name>, <name><surname>Saric</surname><given-names>T</given-names></name>, <name><surname>Kummer</surname><given-names>S</given-names></name>, <name><surname>Takikawa</surname><given-names>O</given-names></name>, <name><surname>Domann</surname><given-names>E</given-names></name>, <name><surname>Chakraborty</surname><given-names>T</given-names></name>, <name><surname>Krünke</surname><given-names>M</given-names></name>, <name><surname>Utermühlen</surname><given-names>O</given-names></name>, <name><surname>Schultze</surname><given-names>JL</given-names></name>, <year>2008</year><x>, </x><source>Infection of myeloid dendritic cells with Listeria monocytogenes leads to the suppression of T cell function by multiple inhibitory mechanisms</source><x>, </x><object-id pub-id-type="art-access-id">GSE9946</object-id><x>; </x><ext-link ext-link-type="uri" xlink:href="http://www.ncbi.nlm.nih.gov/geo/query/acc.cgi?acc=GSE9946">http://www.ncbi.nlm.nih.gov/geo/query/acc.cgi?acc=GSE9946</ext-link><x>, </x><comment>Publicly available at the Gene Expression Omnibus (<ext-link ext-link-type="uri" xlink:href="http://www.ncbi.nlm.nih.gov/geo/">http://www.ncbi.nlm.nih.gov/geo/</ext-link>).</comment></related-object></p><p><related-object content-type="generated-dataset" document-id="Dataset ID and/or url" document-id-type="dataset" document-type="data" id="dataro16"><name><surname>Seita</surname><given-names>J</given-names></name>, <name><surname>Sahoo</surname><given-names>D</given-names></name>, <name><surname>Rossi</surname><given-names>DJ</given-names></name>, <name><surname>Bhattacharya</surname><given-names>D</given-names></name>, <name><surname>Serwold</surname><given-names>T</given-names></name>, <name><surname>Inlay</surname><given-names>M</given-names></name>, <name><surname>Ehrlich</surname><given-names>LI</given-names></name>, <name><surname>Fathman</surname><given-names>JW</given-names></name>, <name><surname>Dill</surname><given-names>DL</given-names></name>, <name><surname>Weissman</surname><given-names>IL</given-names></name>, <year>2012</year><x>, </x><source>Gene expression common: an open platform for absolute gene expression profiling</source><x>, </x><object-id pub-id-type="art-access-id">GSE34723</object-id><x>; </x><ext-link ext-link-type="uri" xlink:href="http://www.ncbi.nlm.nih.gov/geo/query/acc.cgi?acc=GSE34723">http://www.ncbi.nlm.nih.gov/geo/query/acc.cgi?acc=GSE34723</ext-link><x>, </x><comment>Publicly available at the Gene Expression Omnibus (<ext-link ext-link-type="uri" xlink:href="http://www.ncbi.nlm.nih.gov/geo/">http://www.ncbi.nlm.nih.gov/geo/</ext-link>).</comment></related-object></p><p><related-object content-type="generated-dataset" document-id="Dataset ID and/or url" document-id-type="dataset" document-type="data" id="dataro17"><name><surname>D’Onorio de Meo</surname><given-names>P</given-names></name>, <name><surname>D’Antonio</surname><given-names>M</given-names></name>, <name><surname>Griggio</surname><given-names>F</given-names></name>, <name><surname>Lupi</surname><given-names>R</given-names></name>, <name><surname>Borsani</surname><given-names>M</given-names></name>, <name><surname>Pavesi</surname><given-names>G</given-names></name>, <name><surname>Castrignanü</surname><given-names>T</given-names></name>, <name><surname>Pesole</surname><given-names>G</given-names></name>, <name><surname>Gissi</surname><given-names>C</given-names></name>, <year>2012</year><x>, </x><source>MitoZoa 2.0: a database resource and search tools for comparative and evolutionary analyses of mitochondrial genomes in Metazoa</source><x>, </x><object-id pub-id-type="art-access-id">PMID: 22123747</object-id><x>; </x><ext-link ext-link-type="uri" xlink:href="http://mi.caspur.it/mitozoa/">http://mi.caspur.it/mitozoa/</ext-link></related-object></p></sec><ref-list><title>References</title><ref id="bib1"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Abascal</surname><given-names>F</given-names></name><name><surname>Zardoya</surname><given-names>R</given-names></name><name><surname>Posada</surname><given-names>D</given-names></name></person-group><year>2005</year><article-title>ProtTest: selection of best-fit models of protein evolution</article-title><source>Bioinformatics</source><volume>21</volume><fpage>2104</fpage><lpage>5</lpage><pub-id pub-id-type="doi">10.1093/bioinformatics/bti263</pub-id></element-citation></ref><ref id="bib2"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Abitua</surname><given-names>PB</given-names></name><name><surname>Wagner</surname><given-names>E</given-names></name><name><surname>Navarrete</surname><given-names>IA</given-names></name><name><surname>Levine</surname><given-names>M</given-names></name></person-group><year>2012</year><article-title>Identification of a rudimentary neural crest in a non-vertebrate chordate</article-title><source>Nature</source><volume>492</volume><fpage>104</fpage><lpage>7</lpage><pub-id pub-id-type="doi">10.1038/nature11589</pub-id></element-citation></ref><ref id="bib3"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Bajoghli</surname><given-names>B</given-names></name><name><surname>Guo</surname><given-names>P</given-names></name><name><surname>Aghaallaei</surname><given-names>N</given-names></name><name><surname>Hirano</surname><given-names>M</given-names></name><name><surname>Strohmeier</surname><given-names>C</given-names></name><name><surname>McCurley</surname><given-names>N</given-names></name><etal/></person-group><year>2011</year><article-title>A thymus candidate in lampreys</article-title><source>Nature</source><volume>470</volume><fpage>90</fpage><lpage>4</lpage><pub-id pub-id-type="doi">10.1038/nature09655</pub-id></element-citation></ref><ref id="bib4"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Ballarin</surname><given-names>L</given-names></name><name><surname>Menin</surname><given-names>A</given-names></name><name><surname>Tallandini</surname><given-names>L</given-names></name><name><surname>Matozzo</surname><given-names>V</given-names></name><name><surname>Burighel</surname><given-names>P</given-names></name><name><surname>Basso</surname><given-names>G</given-names></name><etal/></person-group><year>2008</year><article-title>Haemocytes and blastogenetic cycle in the colonial ascidian <italic>Botryllus schlosseri</italic>: a matter of life and death</article-title><source>Cell Tissue Res</source><volume>331</volume><fpage>555</fpage><lpage>64</lpage><pub-id pub-id-type="doi">10.1007/s00441-007-0513-4</pub-id></element-citation></ref><ref id="bib5"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Bartl</surname><given-names>S</given-names></name><name><surname>Baltimore</surname><given-names>D</given-names></name><name><surname>Weissman</surname><given-names>IL</given-names></name></person-group><year>1994</year><article-title>Molecular evolution of the vertebrate immune system</article-title><source>Proc Natl Acad Sci USA</source><volume>91</volume><fpage>10769</fpage><lpage>70</lpage><pub-id pub-id-type="doi">10.1073/pnas.91.23.10769</pub-id></element-citation></ref><ref id="bib6"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Benita</surname><given-names>Y</given-names></name><name><surname>Cao</surname><given-names>Z</given-names></name><name><surname>Giallourakis</surname><given-names>C</given-names></name><name><surname>Li</surname><given-names>C</given-names></name><name><surname>Gardet</surname><given-names>A</given-names></name><name><surname>Xavier</surname><given-names>RJ</given-names></name></person-group><year>2010</year><article-title>Gene enrichment profiles reveal T-cell development, differentiation, and lineage-specific transcription factors including ZBTB25 as a novel NF-AT repressor</article-title><source>Blood</source><volume>115</volume><fpage>5376</fpage><lpage>84</lpage><pub-id pub-id-type="doi">10.1182/blood-2010-01-263855</pub-id></element-citation></ref><ref id="bib7"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Bourlat</surname><given-names>SJ</given-names></name><name><surname>Juliusdottir</surname><given-names>T</given-names></name><name><surname>Lowe</surname><given-names>CJ</given-names></name><name><surname>Freeman</surname><given-names>R</given-names></name><name><surname>Aronowicz</surname><given-names>J</given-names></name><name><surname>Kirschner</surname><given-names>M</given-names></name><etal/></person-group><year>2006</year><article-title>Deuterostome phylogeny reveals monophyletic chordates and the new phylum Xenoturbellida</article-title><source>Nature</source><volume>444</volume><fpage>85</fpage><lpage>8</lpage><pub-id pub-id-type="doi">10.1038/nature05241</pub-id></element-citation></ref><ref id="bib8"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Boyd</surname><given-names>HC</given-names></name><name><surname>Brown</surname><given-names>SK</given-names></name><name><surname>Harp</surname><given-names>JA</given-names></name><name><surname>Weissman</surname><given-names>IL</given-names></name></person-group><year>1986</year><article-title>Growth and sexual maturation of laboratory-cultured Monterey</article-title><source>B schlosseri Biol Bull</source><volume>170</volume><fpage>91</fpage><lpage>109</lpage><pub-id pub-id-type="doi">10.2307/1541383</pub-id></element-citation></ref><ref id="bib9"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Camolotto</surname><given-names>S</given-names></name><name><surname>Racca</surname><given-names>A</given-names></name><name><surname>Rena</surname><given-names>V</given-names></name><name><surname>Nores</surname><given-names>R</given-names></name><name><surname>Patrito</surname><given-names>LC</given-names></name><name><surname>Genti-Raimondi</surname><given-names>S</given-names></name><etal/></person-group><year>2010</year><article-title>Expression and transcriptional regulation of individual pregnancy specific glycoprotein genes in differentiating trophoblast cells</article-title><source>Placenta</source><volume>31</volume><fpage>312</fpage><lpage>9</lpage><pub-id pub-id-type="doi">10.1016/j.placenta.2010.01.004</pub-id></element-citation></ref><ref id="bib10"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Castresana</surname><given-names>J</given-names></name></person-group><year>2000</year><article-title>Selection of conserved blocks from multiple alignments for their use in phylogenetic analysis</article-title><source>Mol Biol Evol</source><volume>17</volume><fpage>540</fpage><lpage>52</lpage><pub-id pub-id-type="doi">10.1093/oxfordjournals.molbev.a026334</pub-id></element-citation></ref><ref id="bib12"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Chen</surname><given-names>J</given-names></name><name><surname>Bardes</surname><given-names>EE</given-names></name><name><surname>Aronow</surname><given-names>BJ</given-names></name><name><surname>Jegga</surname><given-names>AG</given-names></name></person-group><year>2009</year><article-title>ToppGene Suite for gene list enrichment analysis and candidate gene prioritization</article-title><source>Nucleic Acids Res</source><volume>37</volume><fpage>W305</fpage><lpage>11</lpage><pub-id pub-id-type="doi">10.1093/nar/gkp427</pub-id></element-citation></ref><ref id="bib13"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Cima</surname><given-names>F</given-names></name><name><surname>Manni</surname><given-names>L</given-names></name><name><surname>Basso</surname><given-names>G</given-names></name><name><surname>Fortunato</surname><given-names>E</given-names></name><name><surname>Accordi</surname><given-names>B</given-names></name><name><surname>Schiavon</surname><given-names>F</given-names></name><etal/></person-group><year>2009</year><article-title>Hovering between death and life: natural apoptosis and phagocytes in the blastogenetic cycle of the colonial ascidian Botryllus schlosseri</article-title><source>Dev Comp Immunol</source><volume>34</volume><fpage>272</fpage><lpage>85</lpage><pub-id pub-id-type="doi">10.1016/j.dci.2009.10.005</pub-id></element-citation></ref><ref id="bib14"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Colombera</surname><given-names>D</given-names></name></person-group><year>1963</year><article-title>I cromosomi di <italic>Botryllus schlosseri</italic> (Ascidiacea)</article-title><source>Ric Sci</source><volume>33</volume><fpage>443</fpage><lpage>8</lpage><pub-id pub-id-type="doi">10.1007/BF00389087</pub-id></element-citation></ref><ref id="bib15"><element-citation publication-type="book"><person-group person-group-type="author"><name><surname>Darwin</surname><given-names>C</given-names></name></person-group><year>1874</year><source>The Descent of man</source><publisher-loc>New York</publisher-loc><publisher-name>The Modern library</publisher-name></element-citation></ref><ref id="bib16"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Davis</surname><given-names>MM</given-names></name><name><surname>Chien</surname><given-names>YH</given-names></name><name><surname>Gascoigne</surname><given-names>NR</given-names></name><name><surname>Hedrick</surname><given-names>SM</given-names></name></person-group><year>1984</year><article-title>A murine T cell receptor gene complex: isolation, structure and rearrangement</article-title><source>Immunol Rev</source><volume>81</volume><fpage>235</fpage><lpage>58</lpage><pub-id pub-id-type="doi">10.1111/j.1600-065X.1984.tb01113.x</pub-id></element-citation></ref><ref id="bib37"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>de Konning</surname><given-names>APJ</given-names></name><name><surname>Gu</surname><given-names>W</given-names></name><name><surname>Castoe</surname><given-names>TA</given-names></name><name><surname>Batzer</surname><given-names>MA</given-names></name><name><surname>Pollock</surname><given-names>DD</given-names></name></person-group><year>2011</year><article-title>Repetitive elements may comprise over two thirds of the human genome</article-title><source>PLOS Genet</source><volume>7</volume><fpage>e1002384</fpage><pub-id pub-id-type="doi">10.1371/journal.pgen.1002384</pub-id></element-citation></ref><ref id="bib17"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>De Tomaso</surname><given-names>AW</given-names></name><name><surname>Saito</surname><given-names>Y</given-names></name><name><surname>Ishizuka</surname><given-names>KJ</given-names></name><name><surname>Palmeri</surname><given-names>KJ</given-names></name><name><surname>Weissman</surname><given-names>IL</given-names></name></person-group><year>1998</year><article-title>Mapping the genome of a model protochordate. I. A low resolution genetic map encompassing the fusion/histocompatibility (Fu/HC) locus of <italic>B. schlosseri</italic></article-title><source>Genetics</source><volume>149</volume><fpage>277</fpage><lpage>87</lpage></element-citation></ref><ref id="bib18"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Dehal</surname><given-names>P</given-names></name><name><surname>Satou</surname><given-names>Y</given-names></name><name><surname>Campbell</surname><given-names>RK</given-names></name><name><surname>Chapman</surname><given-names>J</given-names></name><name><surname>Degnan</surname><given-names>B</given-names></name><name><surname>De Tomaso</surname><given-names>A</given-names></name><etal/></person-group><year>2002</year><article-title>The draft genome of <italic>Ciona intestinalis</italic>: insights into chordate and vertebrate origins</article-title><source>Science</source><volume>298</volume><fpage>2157</fpage><lpage>67</lpage><pub-id pub-id-type="doi">10.1126/science.1080049</pub-id></element-citation></ref><ref id="bib19"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Delsuc</surname><given-names>F</given-names></name><name><surname>Brinkmann</surname><given-names>H</given-names></name><name><surname>Chourrout</surname><given-names>D</given-names></name><name><surname>Philippe</surname><given-names>H</given-names></name></person-group><year>2006</year><article-title>Tunicate and not cephalochordates are the closest living relatives of vertebrates</article-title><source>Nature</source><volume>439</volume><fpage>965</fpage><lpage>8</lpage><pub-id pub-id-type="doi">10.1038/nature04336</pub-id></element-citation></ref><ref id="bib20"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Denoeud</surname><given-names>F</given-names></name><name><surname>Henriet</surname><given-names>S</given-names></name><name><surname>Mungpakdee</surname><given-names>S</given-names></name><name><surname>Aury</surname><given-names>JM</given-names></name><name><surname>Da Silva</surname><given-names>C</given-names></name><name><surname>Brinkmann</surname><given-names>H</given-names></name><etal/></person-group><year>2010</year><article-title>Plasticity of animal genome architecture unmasked by rapid evolution of a pelagic tunicate</article-title><source>Science</source><volume>330</volume><fpage>1381</fpage><lpage>5</lpage><pub-id pub-id-type="doi">10.1126/science.1194167</pub-id></element-citation></ref><ref id="bib21"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Dishaw</surname><given-names>LJ</given-names></name><name><surname>Litman</surname><given-names>GW</given-names></name></person-group><year>2009</year><article-title>Invertebrate allorecognition: the origins of histocompatibility</article-title><source>Current Biol</source><volume>19</volume><fpage>R286</fpage><lpage>8</lpage><pub-id pub-id-type="doi">10.1016/j.cub.2009.02.035</pub-id></element-citation></ref><ref id="bib22"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>D’Onorio de Meo</surname><given-names>P</given-names></name><name><surname>D’Antonio</surname><given-names>M</given-names></name><name><surname>Griggio</surname><given-names>F</given-names></name><name><surname>Lupi</surname><given-names>R</given-names></name><name><surname>Borsani</surname><given-names>M</given-names></name><name><surname>Pavesi</surname><given-names>G</given-names></name><etal/></person-group><year>2012</year><article-title>MitoZoa 2.0: a database resource and search tools for comparative and evolutionary analyses of mitochondrial genomes in Metazoa</article-title><source>Nucleic Acids Res</source><volume>40</volume><fpage>D1168</fpage><lpage>72</lpage><pub-id pub-id-type="doi">10.1093/nar/gkr1144</pub-id></element-citation></ref><ref id="bib23"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Fagan</surname><given-names>MB</given-names></name><name><surname>Weissman</surname><given-names>IL</given-names></name></person-group><year>1998</year><article-title>Linkage analysis of HSP70 genes and historecognition locus in <italic>Botryllus schlosseri</italic></article-title><source>Immunogenetics</source><volume>47</volume><fpage>468</fpage><lpage>76</lpage><pub-id pub-id-type="doi">10.1007/s002510050384</pub-id></element-citation></ref><ref id="bib24"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Fan</surname><given-names>HC</given-names></name><name><surname>Wang</surname><given-names>J</given-names></name><name><surname>Potanina</surname><given-names>A</given-names></name><name><surname>Quake</surname><given-names>SR</given-names></name></person-group><year>2011</year><article-title>Whole-genome molecular haplotyping of single cells</article-title><source>Nat Biotechnol</source><volume>29</volume><fpage>51</fpage><lpage>7</lpage><pub-id pub-id-type="doi">10.1038/nbt.1739</pub-id></element-citation></ref><ref id="bib25"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Flajnik</surname><given-names>MF</given-names></name><name><surname>Kasahara</surname><given-names>M</given-names></name></person-group><year>2010</year><article-title>Origin and evolution of the adaptive immune system: genetic events and selective pressures</article-title><source>Nat Rev Genet</source><volume>11</volume><fpage>47</fpage><lpage>59</lpage><pub-id pub-id-type="doi">10.1038/nrg2703</pub-id></element-citation></ref><ref id="bib26"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Frey</surname><given-names>N</given-names></name><name><surname>Luedde</surname><given-names>M</given-names></name><name><surname>Katus</surname><given-names>HA</given-names></name></person-group><year>2012</year><article-title>Mechanisms of disease: hypertrophic cardiomyopathy</article-title><source>Nat Rev Cardiol</source><volume>9</volume><fpage>91</fpage><lpage>100</lpage><pub-id pub-id-type="doi">10.1038/nrcardio.2011.159</pub-id></element-citation></ref><ref id="bib27"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Garstang</surname><given-names>W</given-names></name></person-group><year>1928</year><article-title>The morphology of the Tunicata, and its bearings on the phylogeny of the Chordata</article-title><source>Quart J Microsc Sci</source><volume>72</volume><fpage>51</fpage><lpage>187</lpage></element-citation></ref><ref id="bib28"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Gasparini</surname><given-names>F</given-names></name><name><surname>Burighel</surname><given-names>P</given-names></name><name><surname>Manni</surname><given-names>L</given-names></name><name><surname>Zaniolo</surname><given-names>G</given-names></name></person-group><year>2008</year><article-title>Vascular regeneration and angiogenic-like sprouting mechanism in a compouned ascidian is similar to vertebrates</article-title><source>Evol Dev</source><volume>10</volume><fpage>591</fpage><lpage>605</lpage><pub-id pub-id-type="doi">10.1111/j.1525-142X.2008.00274.x</pub-id></element-citation></ref><ref id="bib29"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Guindon</surname><given-names>S</given-names></name><name><surname>Gascuel</surname><given-names>O</given-names></name></person-group><year>2003</year><article-title>A simple, fast, and accurate algorithm to estimate large phylogenies by maximum likelihood</article-title><source>Syst Biol</source><volume>52</volume><fpage>696</fpage><lpage>704</lpage><pub-id pub-id-type="doi">10.1080/10635150390235520</pub-id></element-citation></ref><ref id="bib30"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Guo</surname><given-names>P</given-names></name><name><surname>Hirano</surname><given-names>M</given-names></name><name><surname>Herrin</surname><given-names>BR</given-names></name><name><surname>Li</surname><given-names>J</given-names></name><name><surname>Yu</surname><given-names>C</given-names></name><name><surname>Sadlonova</surname><given-names>A</given-names></name><etal/></person-group><year>2009</year><article-title>Dual nature of the adaptive immune system in lampreys</article-title><source>Nature</source><volume>459</volume><fpage>796</fpage><lpage>802</lpage><pub-id pub-id-type="doi">10.1038/nature08068</pub-id></element-citation></ref><ref id="bib31"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Hirano</surname><given-names>M</given-names></name><name><surname>Das</surname><given-names>S</given-names></name><name><surname>Guo</surname><given-names>P</given-names></name><name><surname>Cooper</surname><given-names>MD</given-names></name></person-group><year>2011</year><article-title>Chapter 4 – the evolution of adaptive immunity in vertebrate</article-title><source>Adv In Immunol</source><volume>109</volume><fpage>125</fpage><lpage>57</lpage><pub-id pub-id-type="doi">10.1016/B978-0-12-387664-5.00004-2</pub-id></element-citation></ref><ref id="bib32"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Hosoda</surname><given-names>T</given-names></name><name><surname>Monzen</surname><given-names>K</given-names></name><name><surname>Hiroi</surname><given-names>Y</given-names></name><name><surname>Oka</surname><given-names>T</given-names></name><name><surname>Takimoto</surname><given-names>E</given-names></name><name><surname>Yazaki</surname><given-names>Y</given-names></name><etal/></person-group><year>2001</year><article-title>A novel myocyte-specific gene Midori promotes the differentiation of P19CL6 cells into cardiomyocytes</article-title><source>J Biol Chem</source><volume>38</volume><fpage>35978</fpage><lpage>89</lpage><pub-id pub-id-type="doi">10.1074/jbc.M100485200</pub-id></element-citation></ref><ref id="bib33"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Hoss</surname><given-names>M</given-names></name><name><surname>Paabo</surname><given-names>S</given-names></name></person-group><year>1993</year><article-title>DNA extraction from Pleistocene bones by a silica-based purification method</article-title><source>Nucleic Acids Res</source><volume>21</volume><fpage>3913</fpage><lpage>4</lpage><pub-id pub-id-type="doi">10.1093/nar/21.16.3913</pub-id></element-citation></ref><ref id="bib34"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Jeffery</surname><given-names>WR</given-names></name><name><surname>Strickler</surname><given-names>AG</given-names></name><name><surname>Yamamoto</surname><given-names>Y</given-names></name></person-group><year>2004</year><article-title>Migratory neural crest-like cells from body pigmentation in a urochordate embryo</article-title><source>Nature</source><volume>431</volume><fpage>696</fpage><lpage>9</lpage><pub-id pub-id-type="doi">10.1038/nature02975</pub-id></element-citation></ref><ref id="bib35"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Johnston</surname><given-names>JJ</given-names></name><name><surname>Kelley</surname><given-names>RI</given-names></name><name><surname>Crawford</surname><given-names>TO</given-names></name><name><surname>Morton</surname><given-names>DH</given-names></name><name><surname>Agarwala</surname><given-names>R</given-names></name><name><surname>Koch</surname><given-names>T</given-names></name><etal/></person-group><year>2000</year><article-title>A novel nemaline myopathy in the Amish caused by a mutation in troponin T1</article-title><source>Am J Hum Genet</source><volume>67</volume><fpage>814</fpage><lpage>21</lpage><pub-id pub-id-type="doi">10.1086/303089</pub-id></element-citation></ref><ref id="bib36"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Katoh</surname><given-names>K</given-names></name><name><surname>Kuma</surname><given-names>K</given-names></name><name><surname>Toh</surname><given-names>H</given-names></name><name><surname>Miyata</surname><given-names>T</given-names></name></person-group><year>2005</year><article-title>MAFFT version 5: improvement in accuracy of multiple sequence alignment</article-title><source>Nucleic Acids Res</source><volume>33</volume><fpage>511</fpage><lpage>8</lpage><pub-id pub-id-type="doi">10.1093/nar/gki198</pub-id></element-citation></ref><ref id="bib38"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Kott</surname><given-names>P</given-names></name></person-group><year>1990</year><article-title>The Australian Ascidiacea. Part 2, Aplousobranchiata (1)</article-title><source>Mem Qld Mus</source><volume>29</volume><fpage>1</fpage><lpage>299</lpage></element-citation></ref><ref id="bib39"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Kristensen</surname><given-names>DM</given-names></name><name><surname>Wolf</surname><given-names>YI</given-names></name><name><surname>Mushegian</surname><given-names>AR</given-names></name><name><surname>Koonin</surname><given-names>EV</given-names></name></person-group><year>2011</year><article-title>Computational methods for gene orthology inference</article-title><source>Brief Bioinform</source><volume>12</volume><fpage>379</fpage><lpage>91</lpage><pub-id pub-id-type="doi">10.1093/bib/bbr030</pub-id></element-citation></ref><ref id="bib40"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Laird</surname><given-names>DJ</given-names></name><name><surname>De Tomaso</surname><given-names>AW</given-names></name><name><surname>Cooper</surname><given-names>MD</given-names></name><name><surname>Weissman</surname><given-names>IL</given-names></name></person-group><year>2000</year><article-title>50 million years of chordate evolution: seeking the origins of adaptive immunity</article-title><source>Proc Natl Acad Sci USA</source><volume>97</volume><fpage>6924</fpage><lpage>6</lpage><pub-id pub-id-type="doi">10.1073/pnas.97.13.6924</pub-id></element-citation></ref><ref id="bib41"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Laird</surname><given-names>DJ</given-names></name><name><surname>De Tomaso</surname><given-names>AW</given-names></name><name><surname>Weissman</surname><given-names>IL</given-names></name></person-group><year>2005</year><article-title>Stem cells are units of natural selection in a colonial ascidian</article-title><source>Cell</source><volume>123</volume><fpage>1351</fpage><lpage>60</lpage><pub-id pub-id-type="doi">10.1016/j.cell.2005.10.026</pub-id></element-citation></ref><ref id="bib42"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Larkin</surname><given-names>MA</given-names></name><name><surname>Blackshields</surname><given-names>G</given-names></name><name><surname>Brown</surname><given-names>NP</given-names></name><name><surname>Chenna</surname><given-names>R</given-names></name><name><surname>McGettigan</surname><given-names>PA</given-names></name><name><surname>McWilliam</surname><given-names>H</given-names></name><etal/></person-group><year>2007</year><article-title>Clustal W and clustal X version 2.0</article-title><source>Bioinformatics</source><volume>23</volume><fpage>2947</fpage><lpage>8</lpage><pub-id pub-id-type="doi">10.1093/bioinformatics/btm404</pub-id></element-citation></ref><ref id="bib43"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Lartillot</surname><given-names>N</given-names></name><name><surname>Brinkmann</surname><given-names>H</given-names></name><name><surname>Philippe</surname><given-names>H</given-names></name></person-group><year>2007</year><article-title>Suppression of long-branch attraction artefacts in the animal phylogeny using a site-heterogeneous model</article-title><source>BMC Evol Biol</source><volume>7</volume><fpage>S4</fpage><pub-id pub-id-type="doi">10.1186/1471-2148-7-S1-S4</pub-id></element-citation></ref><ref id="bib44"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Lartillot</surname><given-names>N</given-names></name><name><surname>Lepage</surname><given-names>T</given-names></name><name><surname>Blanquart</surname><given-names>S</given-names></name></person-group><year>2009</year><article-title>PhyloBayes 3: a Bayesian software package for phylogenetic reconstruction and molecular dating</article-title><source>Bioinformatics</source><volume>25</volume><fpage>2286</fpage><lpage>8</lpage><pub-id pub-id-type="doi">10.1093/bioinformatics/btp368</pub-id></element-citation></ref><ref id="bib45"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Lauzon</surname><given-names>RJ</given-names></name><name><surname>Patton</surname><given-names>CW</given-names></name><name><surname>Weissman</surname><given-names>IL</given-names></name></person-group><year>1993</year><article-title>A morphological and immunohistochemical study of programmed cell death in <italic>Botryllus schlosseri</italic> (Tunicata, Ascidiacea)</article-title><source>Cell Tissue Res</source><volume>272</volume><fpage>115</fpage><lpage>27</lpage><pub-id pub-id-type="doi">10.1007/BF00323577</pub-id></element-citation></ref><ref id="bib46"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Lemaire</surname><given-names>P</given-names></name></person-group><year>2011</year><article-title>Evolutionary crossroads in developmental biology: the tunicates</article-title><source>Development</source><volume>138</volume><fpage>2143</fpage><lpage>52</lpage><pub-id pub-id-type="doi">10.1242/dev.048975</pub-id></element-citation></ref><ref id="bib47"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Li</surname><given-names>H</given-names></name><name><surname>Durbin</surname><given-names>R</given-names></name></person-group><year>2009</year><article-title>Fast and accurate short read alignment with Burrows-Wheeler Transform</article-title><source>Bioinformatics</source><volume>25</volume><fpage>1754</fpage><lpage>60</lpage><pub-id pub-id-type="doi">10.1093/bioinformatics/btp324</pub-id></element-citation></ref><ref id="bib48"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Li</surname><given-names>H</given-names></name><name><surname>Handsaker</surname><given-names>B</given-names></name><name><surname>Wysoker</surname><given-names>A</given-names></name><name><surname>Fennell</surname><given-names>T</given-names></name><name><surname>Ruan</surname><given-names>J</given-names></name><name><surname>Homer</surname><given-names>N</given-names></name><etal/></person-group><year>2009</year><article-title>The sequence alignment map format and SAM tools</article-title><source>Bioinformatics</source><volume>25</volume><fpage>2078</fpage><lpage>9</lpage><pub-id pub-id-type="doi">10.1093/bioinformatics/btp352</pub-id></element-citation></ref><ref id="bib49"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Manni</surname><given-names>L</given-names></name><name><surname>Burighel</surname><given-names>P</given-names></name></person-group><year>2006</year><article-title>Common and divergent pathways in alternative developmental processes of ascidians</article-title><source>Bioessays</source><volume>28</volume><fpage>902</fpage><lpage>12</lpage><pub-id pub-id-type="doi">10.1002/bies.20462</pub-id></element-citation></ref><ref id="bib50"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Moller</surname><given-names>PC</given-names></name><name><surname>Philpott</surname><given-names>CH</given-names></name></person-group><year>2005</year><article-title>The circulatory system of Amphioxus (<italic>Branchiostoma floridae</italic>)</article-title><source>J Morphol</source><volume>139</volume><fpage>389</fpage><lpage>406</lpage><pub-id pub-id-type="doi">10.1002/jmor.1051390403</pub-id></element-citation></ref><ref id="bib51"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Muramatsu</surname><given-names>M</given-names></name><name><surname>Kinoshita</surname><given-names>K</given-names></name><name><surname>Fagarasan</surname><given-names>S</given-names></name><name><surname>Yamada</surname><given-names>S</given-names></name><name><surname>Shinkai</surname><given-names>Y</given-names></name><name><surname>Honjo</surname><given-names>T</given-names></name></person-group><year>2000</year><article-title>Class switch recombination and hypermutation require activation-induced cytidine deaminase (AID), a potential RNA editing enzyme</article-title><source>Cell</source><volume>102</volume><fpage>553</fpage><lpage>63</lpage><pub-id pub-id-type="doi">10.1016/S0092-8674(00)00078-7</pub-id></element-citation></ref><ref id="bib52"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Myers</surname><given-names>EW</given-names></name><name><surname>Sutton</surname><given-names>GG</given-names></name><name><surname>Delcher</surname><given-names>AL</given-names></name><name><surname>Dew</surname><given-names>IM</given-names></name><name><surname>Fasulo</surname><given-names>DP</given-names></name><name><surname>Flanigan</surname><given-names>MJ</given-names></name><etal/></person-group><year>2000</year><article-title>A whole-genome assembly of Drosophila</article-title><source>Science</source><volume>287</volume><fpage>2196</fpage><lpage>204</lpage><pub-id pub-id-type="doi">10.1126/science.287.5461.2196</pub-id></element-citation></ref><ref id="bib53"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Nehls</surname><given-names>M</given-names></name><name><surname>Kyewski</surname><given-names>B</given-names></name><name><surname>Messerie</surname><given-names>M</given-names></name><name><surname>Wadschutz</surname><given-names>R</given-names></name><name><surname>Schuddekopf</surname><given-names>K</given-names></name><name><surname>Smith</surname><given-names>AJH</given-names></name><etal/></person-group><year>1996</year><article-title>Two genetically separable steps in the differentiation of thymic epithelium</article-title><source>Science</source><volume>272</volume><fpage>886</fpage><lpage>9</lpage><pub-id pub-id-type="doi">10.1126/science.272.5263.886</pub-id></element-citation></ref><ref id="bib54"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Newman</surname><given-names>AM</given-names></name><name><surname>Cooper</surname><given-names>JB</given-names></name></person-group><year>2007</year><article-title>XSTREAM: A practical algorithm for identification and architecture modeling of tandem repeats in protein sequences</article-title><source>BMC Bioinformatics</source><volume>8</volume><fpage>382</fpage><lpage>400</lpage><pub-id pub-id-type="doi">10.1186/1471-2105-8-382</pub-id></element-citation></ref><ref id="bib55"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Oettinger</surname><given-names>MA</given-names></name><name><surname>Schatz</surname><given-names>DG</given-names></name><name><surname>Gorka</surname><given-names>C</given-names></name><name><surname>Baltimore</surname><given-names>D</given-names></name></person-group><year>1990</year><article-title><italic>RAG-1</italic> and <italic>RAG-2</italic>, adjacent genes that synergistically activate V(D)J recombination</article-title><source>Science</source><volume>248</volume><fpage>1517</fpage><lpage>23</lpage><pub-id pub-id-type="doi">10.1126/science.2360047</pub-id></element-citation></ref><ref id="bib56"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Pancer</surname><given-names>Z</given-names></name><name><surname>Amemiya</surname><given-names>CT</given-names></name><name><surname>Ehrhardt</surname><given-names>GR</given-names></name><name><surname>Ceitlin</surname><given-names>J</given-names></name><name><surname>Gartland</surname><given-names>GL</given-names></name><name><surname>Cooper</surname><given-names>MD</given-names></name></person-group><year>2004</year><article-title>Somatic diversification of variable lymphocyte receptors in the agnathan sea lamprey</article-title><source>Nature</source><volume>430</volume><fpage>174</fpage><lpage>80</lpage><pub-id pub-id-type="doi">10.1038/nature02740</pub-id></element-citation></ref><ref id="bib57"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Perez-Portela</surname><given-names>R</given-names></name><name><surname>Bishop</surname><given-names>JD</given-names></name><name><surname>Davis</surname><given-names>AR</given-names></name><name><surname>Turon</surname><given-names>X</given-names></name></person-group><year>2009</year><article-title>Phylogeny of the families Pyuridae and Styelidae (Stolidobranchiata, Ascidiacea) inferred from mitochondrial and nuclear DNA sequences</article-title><source>Mol Phylogenet Evol</source><volume>50</volume><fpage>560</fpage><lpage>70</lpage><pub-id pub-id-type="doi">10.1016/j.ympev.2008.11.014</pub-id></element-citation></ref><ref id="bib58"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Perseke</surname><given-names>M</given-names></name><name><surname>Hetmank</surname><given-names>J</given-names></name><name><surname>Bernt</surname><given-names>M</given-names></name><name><surname>Stadler</surname><given-names>PF</given-names></name><name><surname>Schlegel</surname><given-names>M</given-names></name><name><surname>Bernhard</surname><given-names>D</given-names></name></person-group><year>2011</year><article-title>The enigmatic mitochondrial genome of <italic>Rhabdopleura compacta</italic> (Pterobranchia) reveals insights into selection of an efficient tRNA system and supports monophyly of Ambulacraria</article-title><source>BMC Evol Biol</source><volume>11</volume><fpage>134</fpage><pub-id pub-id-type="doi">10.1186/1471-2148-11-134</pub-id></element-citation></ref><ref id="bib59"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Philippe</surname><given-names>H</given-names></name><name><surname>Derelle</surname><given-names>R</given-names></name><name><surname>Lopez</surname><given-names>P</given-names></name><name><surname>Pick</surname><given-names>K</given-names></name><name><surname>Borchiellini</surname><given-names>C</given-names></name><name><surname>Boury-Esnault</surname><given-names>N</given-names></name><etal/></person-group><year>2009</year><article-title>Phylogenomics revives traditional views on deep animal relationships</article-title><source>Curr Biol</source><volume>19</volume><fpage>706</fpage><lpage>12</lpage><pub-id pub-id-type="doi">10.1016/j.cub.2009.02.052</pub-id></element-citation></ref><ref id="bib60"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Price</surname><given-names>AL</given-names></name><name><surname>Jones</surname><given-names>NC</given-names></name><name><surname>Pevzner</surname><given-names>PA</given-names></name></person-group><year>2005</year><article-title>De novo identification of repeat families in large genomes</article-title><source>Bioinformatics</source><volume>21</volume><fpage>i351</fpage><lpage>8</lpage><pub-id pub-id-type="doi">10.1093/bioinformatics/bti1018</pub-id></element-citation></ref><ref id="bib61"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Putnam</surname><given-names>NH</given-names></name><name><surname>Srivastava</surname><given-names>M</given-names></name><name><surname>Hellsten</surname><given-names>U</given-names></name><name><surname>Dirks</surname><given-names>B</given-names></name><name><surname>Chapman</surname><given-names>J</given-names></name><name><surname>Salamov</surname><given-names>A</given-names></name><etal/></person-group><year>2007</year><article-title>Sea anemone genome reveals ancestral eumetazoan gene repertoire and genomic organization</article-title><source>Science</source><volume>317</volume><fpage>86</fpage><lpage>94</lpage><pub-id pub-id-type="doi">10.1126/science.1139158</pub-id></element-citation></ref><ref id="bib62"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Quinlan</surname><given-names>AR</given-names></name><name><surname>Hall</surname><given-names>IM</given-names></name></person-group><year>2010</year><article-title>BEDTools: a flexible suite of utilities for comparing genomic features</article-title><source>Bioinformatics</source><volume>26</volume><fpage>841</fpage><lpage>2</lpage><pub-id pub-id-type="doi">10.1093/bioinformatics/btq033</pub-id></element-citation></ref><ref id="bib63"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Rabionet</surname><given-names>R</given-names></name><name><surname>Gasparini</surname><given-names>P</given-names></name><name><surname>Estivill</surname><given-names>X</given-names></name></person-group><year>2000</year><article-title>Molecular genetics of hearing impairment due to mutations in gap junction genes encoding beta connexins</article-title><source>Hum Mutat</source><volume>16</volume><fpage>190</fpage><lpage>202</lpage><pub-id pub-id-type="doi">10.1002/1098-1004(200009)16:3<190::AID-HUMU2>3.0.CO;2-I</pub-id></element-citation></ref><ref id="bib64"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Rinkevich</surname><given-names>Y</given-names></name><name><surname>Voskoboynik</surname><given-names>A</given-names></name><name><surname>Rosner</surname><given-names>A</given-names></name><name><surname>Rabinowitz</surname><given-names>C</given-names></name><name><surname>Paz</surname><given-names>G</given-names></name><name><surname>Oren</surname><given-names>M</given-names></name><etal/></person-group><year>2013</year><article-title>Repeated, long term cycling of putative stem cells between niches in a basal chordate</article-title><source>Dev Cell</source><volume>24</volume><fpage>76</fpage><lpage>88</lpage><pub-id pub-id-type="doi">10.1016/j.devcel.2012.11.010</pub-id></element-citation></ref><ref id="bib65"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Rogozin</surname><given-names>IB</given-names></name><name><surname>Iyer</surname><given-names>LM</given-names></name><name><surname>Liang</surname><given-names>L</given-names></name><name><surname>Glazko</surname><given-names>GV</given-names></name><name><surname>Liston</surname><given-names>VG</given-names></name><name><surname>Pavlov</surname><given-names>YI</given-names></name><etal/></person-group><year>2007</year><article-title>Evolution and diversification of lamprey antigen receptors: evidence for involvement of an AID-APOBEC family cytosine deaminase</article-title><source>Nature Immunol</source><volume>8</volume><fpage>647</fpage><lpage>56</lpage><pub-id pub-id-type="doi">10.1038/ni1463</pub-id></element-citation></ref><ref id="bib66"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Sabbadin</surname><given-names>A</given-names></name></person-group><year>1962</year><article-title>Le basi genetiche della capacità di fusione fra colonie in <italic>Botryllus schlosseri</italic> (Ascidiacea)</article-title><source>Rend Accad Naz Lincei Ser</source><volume>32</volume><fpage>1031</fpage><lpage>5</lpage></element-citation></ref><ref id="bib67"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Sabbadin</surname><given-names>A</given-names></name><name><surname>Zaniolo</surname><given-names>G</given-names></name><name><surname>Majone</surname><given-names>F</given-names></name></person-group><year>1975</year><article-title>Determination of polarity and bilateral asymmetry in palleal and vascular buds of the ascidian</article-title><source>Botryllus schlosseri Dev Biol</source><volume>46</volume><fpage>79</fpage><lpage>87</lpage><pub-id pub-id-type="doi">10.1016/0012-1606(75)90088-3</pub-id></element-citation></ref><ref id="bib68"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Salzberg</surname><given-names>SL</given-names></name><name><surname>Phillippy</surname><given-names>AM</given-names></name><name><surname>Zimin</surname><given-names>A</given-names></name><name><surname>Puiu</surname><given-names>D</given-names></name><name><surname>Magoc</surname><given-names>T</given-names></name><name><surname>Koren</surname><given-names>S</given-names></name><etal/></person-group><year>2012</year><article-title>GAGE: a critical evaluation of genome assemblies and assembly algorithms</article-title><source>Genome Res</source><volume>22</volume><fpage>557</fpage><lpage>67</lpage><pub-id pub-id-type="doi">10.1101/gr.131383.111</pub-id></element-citation></ref><ref id="bib69"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Schlumpberger</surname><given-names>JM</given-names></name><name><surname>Weissman</surname><given-names>IL</given-names></name><name><surname>Scofield</surname><given-names>VL</given-names></name></person-group><year>1984</year><article-title>Separation and labeling of specific subpopulations of <italic>Botryllus</italic> blood cells</article-title><source>J Exp Zool</source><volume>229</volume><fpage>41</fpage><lpage>411</lpage><pub-id pub-id-type="doi">10.1002/jez.1402290308</pub-id></element-citation></ref><ref id="bib70"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Scofield</surname><given-names>VL</given-names></name><name><surname>Schlumpberger</surname><given-names>JM</given-names></name><name><surname>West</surname><given-names>LA</given-names></name><name><surname>Weissman</surname><given-names>IL</given-names></name></person-group><year>1982</year><article-title>Protochordate allorecognition is controlled by a MHC-like gene system</article-title><source>Nature</source><volume>295</volume><fpage>499</fpage><lpage>502</lpage><pub-id pub-id-type="doi">10.1038/295499a0</pub-id></element-citation></ref><ref id="bib71"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Seita</surname><given-names>J</given-names></name><name><surname>Sahoo</surname><given-names>D</given-names></name><name><surname>Rossi</surname><given-names>DJ</given-names></name><name><surname>Bhattacharya</surname><given-names>D</given-names></name><name><surname>Serwold</surname><given-names>T</given-names></name><name><surname>Inlay</surname><given-names>MA</given-names></name><etal/></person-group><year>2012</year><article-title>Gene expression commons: an open platform for absolute gene expression profiling</article-title><source>PLOS ONE</source><volume>7</volume><fpage>e40321</fpage><pub-id pub-id-type="doi">10.1371/journal.pone.0040321</pub-id></element-citation></ref><ref id="bib72"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Shinzato</surname><given-names>C</given-names></name><name><surname>Shoguchi</surname><given-names>E</given-names></name><name><surname>Kawashima</surname><given-names>T</given-names></name><name><surname>Hamada</surname><given-names>M</given-names></name><name><surname>Hisata</surname><given-names>K</given-names></name><name><surname>Tanaka</surname><given-names>M</given-names></name><etal/></person-group><year>2011</year><article-title>Using the <italic>Acropora digitifera</italic> genome to understand coral responses to environmental change</article-title><source>Nature</source><volume>476</volume><fpage>320</fpage><lpage>3</lpage><pub-id pub-id-type="doi">10.1038/nature10249</pub-id></element-citation></ref><ref id="bib73"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Shoguchi</surname><given-names>E</given-names></name><name><surname>Ikuta</surname><given-names>T</given-names></name><name><surname>Yoshizaki</surname><given-names>F</given-names></name><name><surname>Satou</surname><given-names>Y</given-names></name><name><surname>Satoh</surname><given-names>N</given-names></name><name><surname>Asano</surname><given-names>K</given-names></name><etal/></person-group><year>2004</year><article-title>Fluorescent in situ hybridization to ascidian chromosomes</article-title><source>Zoolog Sci</source><volume>21</volume><fpage>153</fpage><lpage>7</lpage><pub-id pub-id-type="doi">10.2108/zsj.21.153</pub-id></element-citation></ref><ref id="bib74"><element-citation publication-type="book"><person-group person-group-type="author"><name><surname>Smit</surname><given-names>AFA</given-names></name><name><surname>Hubley</surname><given-names>R</given-names></name><name><surname>Green</surname><given-names>P</given-names></name></person-group><year>1996–2010</year><source>RepeatMasker Open-3.0</source><ext-link ext-link-type="uri" xlink:href="http://www.repeatmasker.org/">http://www.repeatmasker.org</ext-link></element-citation></ref><ref id="bib75"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Singh</surname><given-names>TR</given-names></name><name><surname>Tsagkogeorga</surname><given-names>G</given-names></name><name><surname>Delsuc</surname><given-names>F</given-names></name><name><surname>Blanquart</surname><given-names>S</given-names></name><name><surname>Shenkar</surname><given-names>N</given-names></name><name><surname>Loya</surname><given-names>Y</given-names></name><etal/></person-group><year>2009</year><article-title>Tunicate mitogenomics and phylogenetics: peculiarities of the <italic>Herdmania momus</italic> mitochondrial genome and support for the new chordate phylogeny</article-title><source>BMC Genomics</source><volume>10</volume><fpage>534</fpage><pub-id pub-id-type="doi">10.1186/1471-2164-10-534</pub-id></element-citation></ref><ref id="bib76"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Srivastava</surname><given-names>M</given-names></name><name><surname>Simakov</surname><given-names>O</given-names></name><name><surname>Chapman</surname><given-names>J</given-names></name><name><surname>Fahey</surname><given-names>B</given-names></name><name><surname>Gauthier</surname><given-names>ME</given-names></name><name><surname>Mitros</surname><given-names>T</given-names></name><etal/></person-group><year>2010</year><article-title>The <italic>Amphimedon queenslandica</italic> genome and the evolution of animal complexity</article-title><source>Nature</source><volume>466</volume><fpage>720</fpage><lpage>6</lpage><pub-id pub-id-type="doi">10.1038/nature09201</pub-id></element-citation></ref><ref id="bib77"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Stanke</surname><given-names>M</given-names></name><name><surname>Diekhans</surname><given-names>M</given-names></name><name><surname>Baertsch</surname><given-names>R</given-names></name><name><surname>Haussler</surname><given-names>D</given-names></name></person-group><year>2008</year><article-title>Using native and syntenically mapped cDNA alignments to improve <italic>de novo</italic> gene finding</article-title><source>Bioinformatics</source><volume>24</volume><fpage>637</fpage><lpage>44</lpage><pub-id pub-id-type="doi">10.1093/bioinformatics/btn013</pub-id></element-citation></ref><ref id="bib78"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Stoner</surname><given-names>DS</given-names></name><name><surname>Weissman</surname><given-names>IL</given-names></name></person-group><year>1996</year><article-title>Somatic and germ cell parasitism in a colonial ascidian possible role for a highly polymorphic allorecognition system</article-title><source>Proc Natl Acad Sci USA</source><volume>24</volume><fpage>15254</fpage><lpage>9</lpage><pub-id pub-id-type="doi">10.1073/pnas.93.26.15254</pub-id></element-citation></ref><ref id="bib79"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Stoner</surname><given-names>DS</given-names></name><name><surname>Rinkevich</surname><given-names>B</given-names></name><name><surname>Weissman</surname><given-names>IL</given-names></name></person-group><year>1999</year><article-title>Heritable germ and somatic cell lineage competitions in chimeric colonial protochordates</article-title><source>Proc Natl Acad Sci USA</source><volume>96</volume><fpage>9148</fpage><lpage>53</lpage><pub-id pub-id-type="doi">10.1073/pnas.96.16.9148</pub-id></element-citation></ref><ref id="bib80"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Stoner</surname><given-names>DS</given-names></name><name><surname>Ben-Shlomo</surname><given-names>R</given-names></name><name><surname>Rinkevich</surname><given-names>B</given-names></name><name><surname>Weissman</surname><given-names>IL</given-names></name></person-group><year>2002</year><article-title>Genetic variability of <italic>Botryllus schlosseri</italic> invasions to the east and west coasts of the USA</article-title><source>Mar Ecol Prog Ser</source><volume>243</volume><fpage>93</fpage><lpage>100</lpage><pub-id pub-id-type="doi">10.3354/meps243093</pub-id></element-citation></ref><ref id="bib81"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Sun</surname><given-names>W</given-names></name><name><surname>Xiao</surname><given-names>X</given-names></name><name><surname>Li</surname><given-names>S</given-names></name><name><surname>Guo</surname><given-names>X</given-names></name><name><surname>Zhang</surname><given-names>Q</given-names></name></person-group><year>2011</year><article-title>Mutation analysis of 12 genes in Chinese families with congenital cataracts</article-title><source>Mol Vis</source><volume>17</volume><fpage>2197</fpage><lpage>206</lpage></element-citation></ref><ref id="bib82"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Swalla</surname><given-names>BJ</given-names></name><name><surname>Cameron</surname><given-names>CB</given-names></name><name><surname>Corley</surname><given-names>LS</given-names></name><name><surname>Garey</surname><given-names>JR</given-names></name></person-group><year>2000</year><article-title>Urochordates are monophyletic within the deuterostomes</article-title><source>Syst Biol</source><volume>49</volume><fpage>52</fpage><pub-id pub-id-type="doi">10.1080/10635150050207384</pub-id></element-citation></ref><ref id="bib83"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Tiozzo</surname><given-names>S</given-names></name><name><surname>Voskoboynik</surname><given-names>A</given-names></name><name><surname>Brown</surname><given-names>FD</given-names></name><name><surname>De Tomaso</surname><given-names>AW</given-names></name></person-group><year>2008</year><article-title>A conserved role of the VEGF pathway in angiogenesis of an ectodermally-derived vasculature</article-title><source>Dev Biol</source><volume>315</volume><fpage>243</fpage><lpage>55</lpage><pub-id pub-id-type="doi">10.1016/j.ydbio.2007.12.035</pub-id></element-citation></ref><ref id="bib84"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Trapnell</surname><given-names>C</given-names></name><name><surname>Williams</surname><given-names>BA</given-names></name><name><surname>Pertea</surname><given-names>G</given-names></name><name><surname>Mortazavi</surname><given-names>A</given-names></name><name><surname>Kwan</surname><given-names>G</given-names></name><name><surname>van Baren</surname><given-names>MJ</given-names></name><etal/></person-group><year>2010</year><article-title>Transcript assembly and quantification by RNA-Seq reveals unannotated transcripts and isoform switching during cell differentiation</article-title><source>Nat Biotechnol</source><volume>28</volume><fpage>511</fpage><lpage>5</lpage><pub-id pub-id-type="doi">10.1038/nbt.1621</pub-id></element-citation></ref><ref id="bib85"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Tsagkogeorga</surname><given-names>G</given-names></name><name><surname>Turon</surname><given-names>X</given-names></name><name><surname>Hopcroft</surname><given-names>R</given-names></name><name><surname>Tilak</surname><given-names>M</given-names></name><name><surname>Feldstein</surname><given-names>T</given-names></name><name><surname>Shenkar</surname><given-names>N</given-names></name><etal/></person-group><year>2009</year><article-title>18S rRNA phylogeny of tunicates based on mixture and secondary structure modes</article-title><source>BMC Evoul Biol</source><volume>9</volume><fpage>187</fpage><pub-id pub-id-type="doi">10.1186/1471-2148-9-187</pub-id></element-citation></ref><ref id="bib86"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Turon</surname><given-names>X</given-names></name><name><surname>Lopez-Legentil</surname><given-names>S</given-names></name></person-group><year>2004</year><article-title>Ascidian molecular phylogeny inferred from mtDNA data with emphasis on the Aplousobranchiata</article-title><source>Mol Phylogenet Evol</source><volume>33</volume><fpage>309</fpage><lpage>20</lpage><pub-id pub-id-type="doi">10.1016/j.ympev.2004.06.011</pub-id></element-citation></ref><ref id="bib87"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Voskoboynik</surname><given-names>A</given-names></name><name><surname>Simon-Blecher</surname><given-names>N</given-names></name><name><surname>Soen</surname><given-names>Y</given-names></name><name><surname>Rinkevich</surname><given-names>B</given-names></name><name><surname>De Tomaso</surname><given-names>AW</given-names></name><etal/></person-group><year>2007</year><article-title>Striving for normality: whole body regeneration through a series of abnormal generations</article-title><source>FASEB J</source><volume>21</volume><fpage>1335</fpage><lpage>44</lpage><pub-id pub-id-type="doi">10.1096/fj.06-7337com</pub-id></element-citation></ref><ref id="bib88"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Voskoboynik</surname><given-names>A</given-names></name><name><surname>Soen</surname><given-names>Y</given-names></name><name><surname>Rinkevich</surname><given-names>Y</given-names></name><name><surname>Rosner</surname><given-names>A</given-names></name><name><surname>Ueno</surname><given-names>H</given-names></name><name><surname>Reshef</surname><given-names>R</given-names></name><etal/></person-group><year>2008</year><article-title>Identification of the endostyle as a stem cell niche in a colonial chordate</article-title><source>Cell Stem Cell</source><volume>3</volume><fpage>456</fpage><lpage>64</lpage><pub-id pub-id-type="doi">10.1016/j.stem.2008.07.023</pub-id></element-citation></ref><ref id="bib89"><element-citation publication-type="book"><person-group person-group-type="author"><name><surname>Voskoboynik</surname><given-names>A</given-names></name><name><surname>Rinkevich</surname><given-names>B</given-names></name><name><surname>Weissman</surname><given-names>IL</given-names></name></person-group><year>2009</year><article-title>Stem cells chimerism and tolerance: lessons from mammals and ascidians</article-title><source>Stem Cells in Marine Organisms</source><person-group person-group-type="editor"><name><surname>Rinkevich</surname><given-names>B</given-names></name><name><surname>Matranga</surname><given-names>V</given-names></name></person-group><publisher-loc>The Netherlands</publisher-loc><publisher-name>Springer</publisher-name><fpage>281</fpage><lpage>308</lpage></element-citation></ref><ref id="bib97"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Voskoboynik</surname><given-names>A</given-names></name><name><surname>Newman</surname><given-names>AM</given-names></name><name><surname>Corey</surname><given-names>DM</given-names></name><name><surname>Sahoo</surname><given-names>D</given-names></name><name><surname>Pushkarev</surname><given-names>D</given-names></name><name><surname>Neff</surname><given-names>NF</given-names></name><etal/></person-group><year>2013</year><article-title>Identification of a colonial chordate histocompatibility gene</article-title><source>Science</source><comment>in press</comment></element-citation></ref><ref id="bib90"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Weigert</surname><given-names>MG</given-names></name><name><surname>Cesari</surname><given-names>IM</given-names></name><name><surname>Yonkovich</surname><given-names>SJ</given-names></name><name><surname>Cohn</surname><given-names>M</given-names></name></person-group><year>1970</year><article-title>Variability in the λ light chain sequences of mouse antibody</article-title><source>Nature</source><volume>228</volume><fpage>1045</fpage><lpage>7</lpage><pub-id pub-id-type="doi">10.1038/2281045a0</pub-id></element-citation></ref><ref id="bib91"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Wilcox</surname><given-names>ER</given-names></name><name><surname>Burton</surname><given-names>QL</given-names></name><name><surname>Naz</surname><given-names>S</given-names></name><name><surname>Riazuddin</surname><given-names>S</given-names></name><name><surname>Smith</surname><given-names>TN</given-names></name><name><surname>Ploplis</surname><given-names>B</given-names></name><etal/></person-group><year>2001</year><article-title>Mutations in the gene encoding tight junction claudin-14 cause autosomal recessive deafness DFNB29</article-title><source>Cell</source><volume>104</volume><fpage>165</fpage><lpage>72</lpage><pub-id pub-id-type="doi">10.1016/S0092-8674(01)00200-8</pub-id></element-citation></ref><ref id="bib92"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Xu</surname><given-names>X</given-names></name><name><surname>Nagarajan</surname><given-names>H</given-names></name><name><surname>Lewis</surname><given-names>NE</given-names></name><name><surname>Pan</surname><given-names>S</given-names></name><name><surname>Cai</surname><given-names>Z</given-names></name><name><surname>Liu</surname><given-names>X</given-names></name><etal/></person-group><year>2011</year><article-title>The genomic sequence of the Chinese hamster ovary (CHO)-K1 cell line</article-title><source>Nat Biotechnol</source><volume>29</volume><fpage>735</fpage><lpage>41</lpage><pub-id pub-id-type="doi">10.1038/nbt.1932</pub-id></element-citation></ref><ref id="bib93"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Yokobori</surname><given-names>S</given-names></name><name><surname>Oshima</surname><given-names>T</given-names></name><name><surname>Wada</surname><given-names>H</given-names></name></person-group><year>2005</year><article-title>Complete nucleotide sequence of the mitochondrial genome of <italic>Doliolum nationalis</italic> with implications for evolution of urochordates</article-title><source>Mol Phylogenet Evol</source><volume>34</volume><fpage>273</fpage><pub-id pub-id-type="doi">10.1016/j.ympev.2004.10.002</pub-id></element-citation></ref><ref id="bib94"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Yokobori</surname><given-names>S</given-names></name><name><surname>Kurabayashi</surname><given-names>A</given-names></name><name><surname>Neilan</surname><given-names>BA</given-names></name><name><surname>Maruyama</surname><given-names>T</given-names></name><name><surname>Hirose</surname><given-names>E</given-names></name></person-group><year>2006</year><article-title>Multiple origins of the ascidian-Prochloron symbiosis: molecular phylogeny of photosymbiotic and non-symbiotic colonial ascidians inferred from 18S rDNA sequences</article-title><source>Mol Phylogenet Evol</source><volume>40</volume><fpage>8</fpage><pub-id pub-id-type="doi">10.1016/j.ympev.2005.11.025</pub-id></element-citation></ref><ref id="bib95"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Zeng</surname><given-names>L</given-names></name><name><surname>Jacobs</surname><given-names>MW</given-names></name><name><surname>Swalla</surname><given-names>BJ</given-names></name></person-group><year>2006</year><article-title>Coloniality has evolved once in <italic>Stolidobranch Ascidians</italic></article-title><source>Integr Comp Biol</source><volume>46</volume><fpage>255</fpage><lpage>68</lpage><pub-id pub-id-type="doi">10.1093/icb/icj035</pub-id></element-citation></ref><ref id="bib96"><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Zerbino</surname><given-names>DR</given-names></name></person-group><year>2010</year><article-title>Using the Velvet de novo assembler for short-read sequencing technologies</article-title><source>Curr Protoc Bioinformatics</source><volume>11</volume><fpage>11.5.1</fpage><lpage>12</lpage><pub-id pub-id-type="doi">10.1002/0471250953.bi1105s31</pub-id></element-citation></ref></ref-list></back></article> |